# create_mock_data.py
# Generates randomly named mock job-application folders filled with dummy files.
import os
import random
from utils.performance import _log_execution_time
# Pools of sample values that the mock folder names are drawn from.
# Entries in `positions` are kept unique and free of surrounding whitespace so
# that every position is equally likely to be picked and the generated folder
# names never contain stray double spaces.
positions = [
    "Analytics Engineer",
    "Artificial Intelligence",
    "Azure Data Engineer",
    "Business Analyst",
    "Chapter Lead",
    "Climate Data",
    "Cloud Architect",
    "Cloud Engineer",
    "Cloud Software Engineer",
    "Data Analyst",
    "Data Architect",
    "Data Engineer",
    "Data Management Specialist",
    "Data Manager",
    "Data Platform Engineer Advanced",
    "Data Scientist",
    "Data Scientist and Process Mining",
    "Data Warehouse Architect",
    "Data Warehouse Engineer",
]

# Company names used in the folder names.
companies = [
    "Roche",
    "Eneco",
    "Microsoft",
    "ING",
    "Heineken",
    "HelloFresh",
    "BasicFit",
    "MAN",
    "BMW",
    "ABN Amro",
    "TU Delft",
    "Netflix",
    "Deloitte",
]

# Two-letter country codes placed in square brackets in the folder names.
countries = ["NL", "US", "UK", "CA", "DE", "FR", "ES", "AT", "CH"]

# Status codes placed in parentheses in the folder names.
# NOTE(review): the meaning of each code is not defined in this file.
statuses = ["R", "IR", "IIR", "H", "G", "CITIO", "VR", "CR", "N", "IIIR", "VIITO"]
# Number of distinct random folders to generate
num_folders = 42
# Root directory for job applications
root_dir = "./data/job_applications"
# Ensure the root directory exists
os.makedirs(root_dir, exist_ok=True)

# Every generated CV and cover letter uses the same placeholder candidate name,
# so it is defined once instead of on every loop iteration.
candidate_name = "john_smith"

# Enumerate each distinct (position, company, country, status) combination.
# Independent random.choice() draws can repeat a combination, which would
# silently reuse a folder (exist_ok=True) and yield fewer folders than
# requested; sampling without replacement from the de-duplicated combinations
# avoids that.
combinations = list(
    dict.fromkeys(
        (position, company, country, status)
        for position in positions
        for company in companies
        for country in countries
        for status in statuses
    )
)
# Never ask for more folders than there are combinations (or fewer than zero).
sample_size = max(0, min(num_folders, len(combinations)))

# Track the folders actually touched so the summary reports a real count.
created_paths = set()

# Generate random folders
for position, company, country, status in random.sample(combinations, sample_size):
    # Construct folder name
    folder_name = f"{position} - {company} [{country}] ({status})"
    # Create the folder path
    folder_path = os.path.join(root_dir, folder_name)
    os.makedirs(folder_path, exist_ok=True)
    created_paths.add(folder_path)

    # NOTE(review): "dpf" in the dummy texts below looks like a typo for "pdf";
    # the strings are kept verbatim because they are written into the files.

    # Create dummy job description file (explicit encoding keeps the output
    # independent of the platform default).
    with open(
        os.path.join(folder_path, "job_description.txt"), "w", encoding="utf-8"
    ) as f:
        f.write(f"This is a dummy job description for {position} at {company}.")

    # Create dummy CV file
    with open(
        os.path.join(folder_path, f"{candidate_name}_cv.txt"), "w", encoding="utf-8"
    ) as f:
        f.write(
            "This is a John Smith's CV... it can be in other formats .docx, dpf, etc."
        )

    # Create dummy cover letter file
    with open(
        os.path.join(folder_path, f"{candidate_name}_cover_letter.txt"),
        "w",
        encoding="utf-8",
    ) as f:
        f.write(
            "This is a John Smith's cover letter...it can be in other formats .docx, dpf, etc."
        )

# Report the number of folders actually populated rather than the requested one.
print(f"{len(created_paths)} folders with dummy files created under '{root_dir}'.")