recruiter-assistant-jbfxrs / scripts /preprocess-vacancies.py
Vincent Claes
set format output
1c897ec
raw
history blame
412 Bytes
import pandas as pd
import pathlib
# Resolve paths relative to this script's own folder so the result does not
# depend on the directory the script is launched from.
current_directory = pathlib.Path(__file__).resolve().parent

# Load the vacancies export, keep only the "Vacancy" column, drop repeated
# vacancy texts, and replace every newline character inside a vacancy
# with ".,".
df = (
    pd.read_csv(current_directory / "vacancies.csv")[["Vacancy"]]
    .drop_duplicates(subset=["Vacancy"])
    .assign(
        Vacancy=lambda frame: frame["Vacancy"].replace("\n", ".,", regex=True)
    )
)

# Write the cleaned column next to the script, without index or header row.
df.to_csv(current_directory / "jobfixers.csv", index=False, header=False)