forked from matthoendorf/atk_scraper
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathget_searches.py
executable file
·43 lines (37 loc) · 2.05 KB
/
get_searches.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
#!/usr/bin/env python
import atkscrape as atk
import os
import argparse
def parse_arguments():
parser = argparse.ArgumentParser(
prog="get_many",
description = "scrape ATK recipes to images, mealie json, or both")
parser.add_argument('-e', '--email', required=True, help="ATK email for login.")
parser.add_argument('-p', '--password', required=True, help="SINGLE QUOTED ATK password for login. For example 'my_password!*'")
parser.add_argument('-r', '--recipes', required=True, help="Text file containing a list of ATK pages to grab recipes from. See recipes.txt for an example")
parser.add_argument('-i', '--image', required=False, default=False, help="Get recipes as images (default False)")
parser.add_argument('-j', '--json', required=False, default=True, help="Get recipes as json for mealie (default True)")
parser.add_argument('--sortby', required=False, default='popularity', help='Method to sort recipes for retrieval. Can be "popularity" or "date" (default "popularity")')
parser.add_argument('-o', '--out_path', default='./recipes/', help="Location to save images/json (default './recipes/')")
parser.add_argument('--driver', default='./chromedriver', help="Path to the chromedriver. (default './chromedriver')")
parser.add_argument('--verbose', action='store_true', default=False, help="verbose output")
args = parser.parse_args()
return args
if __name__ == "__main__":
args = parse_arguments()
pages = atk.read_pages(args.recipes)
if not os.path.exists(args.out_path):
os.mkdir(args.out_path)
if args.verbose:
print("Read " + str(len(pages)) + " recipe pages to scrape from")
driver = atk.create_driver(args.driver)
try:
atk.login(driver, args.email, args.password)
for page in pages:
print("Working on "+page)
atk.save_recipes(driver, page, args.image, args.json, args.sortby, args.out_path)
if args.image:
atk.format_images(args.out_path)
finally:
# Close chrome
driver.close()