forked from mxrch/GHunt
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathconfig.py
16 lines (14 loc) · 862 Bytes
/
config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
# Regular-expression patterns (kept as plain strings, not compiled) keyed by
# the kind of data they extract from scraped page content.
regexs = {
    # Three capture groups: the path segment following "/album/", the text
    # that ends at a closing </div> after five skipped tags, and a run of
    # digits followed by a space.
    # NOTE(review): presumably album id, album title and item count — confirm.
    "albums": r'href=\"\.\/albumarchive\/\d*?\/album\/(.*?)\" jsaction.*?>(?:<.*?>){5}(.*?)<\/div><.*?>(\d*?) ',

    # Two capture groups: an lh<digit>.googleusercontent.com URL, and a quoted
    # string found after a 21-digit quoted number plus sixteen
    # comma-terminated fields.
    "photos": r'\],\"(https:\/\/lh\d\.googleusercontent\.com\/.*?)\",\[\"\d{21}\"(?:.*?,){16}\"(.*?)\"',

    # Starts with a "{}" placeholder and captures the two comma-separated
    # values that follow "[[null,null,".
    # NOTE(review): presumably filled with a review id via str.format, with
    # the groups being latitude/longitude — verify against the caller.
    "review_loc_by_id": r'{}\",.*?\[\[null,null,(.*?),(.*?)\]',
}
# HTTP header fields: a desktop Firefox 68 User-Agent string and a keep-alive
# Connection value.
# NOTE(review): presumably attached to outgoing requests — usage is not
# visible in this file.
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; rv:68.0) Gecko/20100101 Firefox/68.0",
    "Connection": "Keep-Alive",
}
# When True, the browser is not shown while scraping GMaps reviews.
headless: bool = True

# When True, search the YouTube channel every time.
ytb_hunt_always: bool = False

# Radius, in km, used to create groups of GMaps reviews.
gmaps_radius: int = 30

# The public Google Doc used as an endpoint to reach Google's Search.
gdocs_public_doc: str = "1jaEEHZL32t1RUN5WuZEnFpqiEPf_APYKrRBG9LhLdvE"

# Path to the data file.
# NOTE(review): its contents and format are not visible from this file.
data_path: str = "resources/data.txt"