diff --git a/.gitignore b/.gitignore index eb39232..2b68f2f 100644 --- a/.gitignore +++ b/.gitignore @@ -143,5 +143,7 @@ scripts/similarity/config.yml *.local.yml # Processed or local files -/Data/Processed/* +/Data/Processed/JobDescription +/Data/Processed/Resumes + *.local.pdf diff --git a/run_first.py b/run_first.py index bebfd19..7ea2524 100644 --- a/run_first.py +++ b/run_first.py @@ -1,14 +1,24 @@ import json import logging import os +import traceback + from scripts import JobDescriptionProcessor, ResumeProcessor from scripts.utils import get_filenames_from_dir, init_logging_config init_logging_config() -PROCESSED_RESUMES_PATH = "Data/Processed/Resumes" -PROCESSED_JOB_DESCRIPTIONS_PATH = "Data/Processed/JobDescription" +processed_Path = os.path.join(os.getcwd(), "Data", "Processed") +if not os.path.exists(os.path.join(processed_Path)): + logging.info('"/Processed/" directory structure is missing, setting up a new one.\n') + os.mkdir(processed_Path) + os.mkdir(os.path.join(processed_Path, "Resumes")) + os.mkdir(os.path.join(processed_Path, "JobDescription")) + + +PROCESSED_RESUMES_PATH = os.path.join(os.getcwd(), "Data", "Processed", "Resumes") +PROCESSED_JOB_DESCRIPTIONS_PATH = os.path.join(os.getcwd(), "Data", "Processed", "JobDescription") def read_json(filename): @@ -44,6 +54,7 @@ def remove_old_files(files_path): logging.error("There are no resumes present in the specified folder.") logging.error("Exiting from the program.") logging.error("Please add resumes in the Data/Resumes folder and try again.") + logging.error(str(traceback.format_exc())) exit(1) # Now after getting the file_names parse the resumes into a JSON Format. 
@@ -66,6 +77,7 @@ def remove_old_files(files_path): logging.error("There are no job-description present in the specified folder.") logging.error("Exiting from the program.") logging.error("Please add resumes in the Data/JobDescription folder and try again.") + logging.error(str(traceback.format_exc())) exit(1) # Now after getting the file_names parse the resumes into a JSON Format.