streamlit_app.py
import json
import time

import streamlit as st

from main import main as scraper
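
# Streamlit front end for the Amazon Jobs scraper: jobs returned by main.main
# are cached in jobs.json and shown with search, download, and cache controls.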

# Function to load markdown file
def get_file_content_as_string(path):
    with open(path, "r") as file:
        lines = file.readlines()
    return "".join(lines)

# Function to load cached data from jobs.json
def load_cached_data():
    try:
        with open("jobs.json", "r") as file:
            datas = file.read()
        return json.loads(datas)["jobs"]
    except Exception as e:
        print(e)
        return []  # default to an empty list, matching how `data` is used below
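
# jobs.json is expected to hold {"jobs": [...]}; judging from the filtering and
# display logic in main() below, each job entry appears to be a dict with at
# least "title" and "job_category" keys.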

# Function to save data to jobs.json
def save_data_to_cache(data):
    with open("jobs.json", "w") as file:
        file.write(json.dumps({"jobs": data}))
    st.success("Data saved to cache!")

# Function to clear cache
def clear_cache():
    with open("jobs.json", "w") as file:
        file.write(json.dumps({"jobs": []}))  # reset to an empty job list
    st.success("Cache cleared!")
    st.rerun()  # Rerun the app to reflect the changes

# Function to scrape jobs
def scrape_jobs():
    # Simulate scraping delay
    # time.sleep(5)
    # Replace the following with your actual scraping logic and return the
    # scraped jobs as a list of dicts
    return scraper()

# Function to scrape jobs and display the result
def scrape_and_display(col2):
    global data
    with col2:
        with st.spinner("Scraping jobs... Please wait."):
            if data:
                st.info("Using cached data")
                scraped_data = data
                st.balloons()  # Celebrate with balloons to signal that cached data was used
            else:
                st.info(
                    "No cached data found... Scraping new data. This may take a while.")
                scraped_data = scrape_jobs()
            st.success("Scraping complete!")
            st.text("Total jobs scraped: {}".format(len(scraped_data)))
    return scraped_data

# Main Streamlit app
def main():
    global data
    st.set_page_config(page_title="Amazon Jobs Scraper",
                       page_icon=":briefcase:")
    st.title("Amazon Jobs Scraper")
    data = load_cached_data()
    search_term = st.text_input(
        "Search for a specific Job Category", placeholder="Enter a job category...")
    col1, col2 = st.columns([1, 4])
    with col1:
        if st.button("Scrape Jobs"):
            data = scrape_and_display(col2)
        if st.button("Save to Cache"):
            save_data_to_cache(data)
        if st.button("Clear Cache"):
            clear_cache()
        # if st.button("Clear Content"):
        #     st.text("Content cleared!")
        if st.button("Clear Content"):
            with col2:
                st.text("Content cleared!")
            data = []  # Clear the data displayed on the right side
            # st.json({})  # Clear the displayed JSON content
        if st.download_button("Download Data as JSON", json.dumps(data), "jobs.json",
                              mime="application/json", help="Click here to download data"):
            st.success("Data downloaded successfully!")
        if st.button("Show Source Code"):
            # st.code(open(__file__).read())
            with col2:
                st.markdown("### Source Code")
                st.code(open(__file__).read())
        if st.button("Show Documentation"):
            with col2:
                st.markdown("### Documentation")
                st.markdown(get_file_content_as_string("README.md"))
    with col2:
        if search_term:
            st.text("Showing results for search term: {}".format(search_term))
            filtered_data = [
                job for job in data if search_term.lower() in job["job_category"].lower()]
            if filtered_data:
                data = filtered_data
            else:
                st.warning(
                    "No jobs found for search term: {}".format(search_term))
        if data:
            job_titles = [job["title"] for job in data]
            selected_title = st.selectbox("Select Job Title", job_titles)
            selected_job = next(
                (job for job in data if job["title"] == selected_title), None)
            if selected_job:
                st.table(selected_job)

if __name__ == "__main__":
    main()
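
# To run the app locally (assuming Streamlit is installed):
#   streamlit run streamlit_app.py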