Spaces:
Sleeping
Sleeping
Commit
·
6b24d80
1
Parent(s):
4c11d35
Move the DB to a class
Browse files
app.py
CHANGED
@@ -7,7 +7,7 @@ from jobspy_indeed import indeed_get_jobs
|
|
7 |
from WelcomeToTheJungle import wtoj_get_jobs
|
8 |
from jobspy_linkedin import linkedin_get_jobs
|
9 |
from ai_manager import get_extra_information
|
10 |
-
from db import
|
11 |
|
12 |
def html_format_page(jobs : List[JobDescription]):
|
13 |
result = ["<html><head><style>.job{display: flex;width:70%;margin: 5px auto;border: 1px solid;border-radius: 5px;}.logobox{flex: 1;display: flex;align-items: center;justify-content: center;}.logo{width:100px;height:100px}h4{margin: 2px;}</style></head><body>"]
|
@@ -56,7 +56,8 @@ def search_jobs(search_term, platform):
|
|
56 |
for job in selected_jobs:
|
57 |
job.ai_result = get_extra_information(job.company, job.job_description)
|
58 |
|
59 |
-
|
|
|
60 |
|
61 |
return html_format_page(selected_jobs)
|
62 |
|
|
|
7 |
from WelcomeToTheJungle import wtoj_get_jobs
|
8 |
from jobspy_linkedin import linkedin_get_jobs
|
9 |
from ai_manager import get_extra_information
|
10 |
+
from db import Database
|
11 |
|
12 |
def html_format_page(jobs : List[JobDescription]):
|
13 |
result = ["<html><head><style>.job{display: flex;width:70%;margin: 5px auto;border: 1px solid;border-radius: 5px;}.logobox{flex: 1;display: flex;align-items: center;justify-content: center;}.logo{width:100px;height:100px}h4{margin: 2px;}</style></head><body>"]
|
|
|
56 |
for job in selected_jobs:
|
57 |
job.ai_result = get_extra_information(job.company, job.job_description)
|
58 |
|
59 |
+
db = Database()
|
60 |
+
db.add_to_db(selected_jobs)
|
61 |
|
62 |
return html_format_page(selected_jobs)
|
63 |
|
db.py
CHANGED
@@ -6,47 +6,52 @@ import json
|
|
6 |
|
7 |
REPO_ID = "jobsearch_database"
|
8 |
FILE_NAME = "db.json"
|
9 |
-
|
10 |
-
DB : List[JobDescription] = []
|
11 |
-
|
12 |
JSON_DATASET_DIR = Path("json_dataset")
|
13 |
JSON_DATASET_DIR.mkdir(parents=True, exist_ok=True)
|
14 |
JSON_DATASET_PATH = JSON_DATASET_DIR / FILE_NAME
|
15 |
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
def
|
22 |
-
|
23 |
-
|
24 |
-
|
25 |
-
|
26 |
-
|
27 |
-
|
28 |
-
|
29 |
-
|
30 |
-
|
31 |
-
|
32 |
-
|
33 |
-
|
34 |
-
|
35 |
-
|
36 |
-
|
37 |
-
|
38 |
-
|
39 |
-
|
40 |
-
|
41 |
-
|
42 |
-
|
43 |
-
|
44 |
-
|
45 |
-
|
46 |
-
|
47 |
-
|
48 |
-
|
49 |
-
|
50 |
-
|
51 |
-
|
52 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6 |
|
7 |
REPO_ID = "jobsearch_database"
|
8 |
FILE_NAME = "db.json"
|
|
|
|
|
|
|
9 |
JSON_DATASET_DIR = Path("json_dataset")
|
10 |
JSON_DATASET_DIR.mkdir(parents=True, exist_ok=True)
|
11 |
JSON_DATASET_PATH = JSON_DATASET_DIR / FILE_NAME
|
12 |
|
13 |
+
class Database:
    """Thin persistence layer for job listings, backed by a JSON file
    (FILE_NAME) stored in a Hugging Face dataset repo (REPO_ID)."""

    def __init__(self):
        # In-memory cache of listings for this instance's lifetime.
        # NOTE(review): a fresh instance starts empty, so add_to_db() only
        # dedupes against jobs added through this same object — it never
        # consults the remote DB. get_current_db() exists but is unused here;
        # confirm whether it was meant to seed this cache.
        self.DB: "List[JobDescription]" = []

    def get_current_db(self) -> "List[JobDescription]":
        """Download the remote JSON database and return its parsed contents.

        NOTE(review): returns whatever json.load() yields (plain dicts),
        not JobDescription instances — verify callers expect that.
        """
        local_path = hf_hub_download(
            repo_id=REPO_ID, filename=FILE_NAME, repo_type="dataset"
        )
        with open(local_path, 'r') as fh:
            return json.load(fh)

    def save_db(self, new_db):
        """Serialize new_db to FILE_NAME locally, then push that file to the
        dataset repo, overwriting the remote copy."""
        hf_api = HfApi()
        with open(FILE_NAME, 'w') as fh:
            json.dump(new_db, fh, indent=4)
        hf_api.upload_file(
            path_or_fileobj=FILE_NAME,
            path_in_repo=FILE_NAME,
            repo_id=REPO_ID,
            repo_type="dataset",
        )

    def merge_dbs(self, list1: "List[JobDescription]", list2: "List[JobDescription]"):
        """Concatenate list1 and list2, dropping any later entry whose .url
        was already seen. First occurrence wins; original order is kept."""
        by_url = {}
        for job in list1 + list2:
            # setdefault keeps the first job stored under each URL.
            by_url.setdefault(job.url, job)
        return list(by_url.values())

    def add_to_db(self, new_jobs: "List[JobDescription]"):
        """Strip bulky descriptions from new_jobs, merge them into the cached
        list, upload the result, and refresh the cache."""
        # Descriptions are blanked before persisting to keep the JSON small.
        for job in new_jobs:
            job.job_description = ""

        # Merge against the in-memory snapshot (see NOTE in __init__).
        combined = self.merge_dbs(self.DB, new_jobs)

        # Persist remotely first, then update the local cache.
        self.save_db(combined)
        self.DB = combined