forked from sigmachirality/indeed-resume-scraper
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathbulk_scraper.py
78 lines (63 loc) · 1019 Bytes
/
bulk_scraper.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
from indeed_scraper import process_query
import os
def main():
    """Run the resume scraper for a fixed grid of job titles and cities.

    The city names are parsed from an embedded, newline-separated block.
    A ``data`` directory is created next to this script if it is missing,
    and ``process_query(job, location, output_folder)`` is then called once
    for every job title paired with each of the first ten cities in the
    list. The remaining cities are parsed but currently not queried.
    """
    location_block = '''
        New York
        Los Angeles
        Chicago
        Brooklyn
        Queens
        Houston
        Manhattan
        Phoenix
        Philadelphia
        San Antonio
        Bronx
        San Diego
        Dallas
        San Jose
        Austin
        Jacksonville
        San Francisco
        Columbus
        Fort Worth
        Indianapolis
        Charlotte
        Seattle
        Denver
        Washington
        Boston
        El Paso
        Detroit
        Nashville
        Memphis
        Portland
        Oklahoma City
        Las Vegas
        Louisville
        Baltimore
        Milwaukee
        Albuquerque
        Tucson
        Fresno
        Sacramento
        Mesa
        Kansas City
        Atlanta
        Staten Island
        Long Beach
        Omaha
        Raleigh
        Colorado Springs
        Miami
        Virginia Beach
    '''
    # Strip first, then filter. Filtering on the raw line lets
    # whitespace-only lines (such as the indented closing line of the block
    # above) through, and they would turn into empty location names.
    stripped_lines = (line.strip() for line in location_block.splitlines())
    locations = [name for name in stripped_lines if name]

    jobs = [
        "engineer",
        "lawyer",
        "doctor",
        "journalist",
        "software engineer",
        "nurse",
        "consultant",
        "executive",
    ]

    # Results are written to a "data" folder that sits beside this script,
    # regardless of the current working directory.
    script_dir = os.path.dirname(os.path.abspath(__file__))
    output_folder = os.path.join(script_dir, "data")
    # exist_ok avoids the check-then-create race of a separate exists() test.
    os.makedirs(output_folder, exist_ok=True)

    # Only the first cities in the list are scraped on each run.
    max_locations = 10
    for job in jobs:
        for location in locations[:max_locations]:
            process_query(job, location, output_folder)
# Script entry point. This call is not behind an `if __name__ == "__main__":`
# guard, so the full scrape starts whenever this file is run or imported.
main()