1from apify_client import ApifyClient
2
3
4
# Create the API client. Replace the placeholder with a real Apify API token.
client = ApifyClient("<YOUR_API_TOKEN>")

# Input passed to the Actor: a list of requests plus proxy settings.
# A request is a URL, optionally labelled with an "id" and accompanied by
# "extract" rules. Each rule gives an output field name, a CSS selector and
# an extraction type (presumably interpreted by the Actor; see its input
# schema for the authoritative meaning).
run_input = {
    "requests": [
        # URL only: no "id" and no extraction rules.
        {"url": "https://www.scrapethissite.com/pages/simple/"},
        {
            # NOTE(review): this request is labelled "forms" but targets the
            # /pages/simple/ URL; confirm the label is intentional.
            "id": "forms",
            "url": "https://www.scrapethissite.com/pages/simple/",
            "extract": [
                {
                    "field_name": "extracted_html",
                    "selector": "#countries > div > div:nth-child(4) > div:nth-child(1)",
                    "extract_type": "HTML",
                },
            ],
        },
        {
            "id": "hockey",
            "url": "https://www.scrapethissite.com/pages/forms/",
            "extract": [
                {
                    "field_name": "year1",
                    "selector": "#hockey > div > table > tbody > tr:nth-child(2) > td.year",
                    "extract_type": "Text",
                },
                {
                    "field_name": "year2",
                    "selector": "#hockey > div > table > tbody > tr:nth-child(3) > td.year",
                    "extract_type": "Text",
                },
                {
                    # Same selector as "year1", but the extraction type is a
                    # mapping naming the attribute ("class") instead of "Text".
                    "field_name": "class_name",
                    "selector": "#hockey > div > table > tbody > tr:nth-child(2) > td.year",
                    "extract_type": {"Attribute": "class"},
                },
            ],
        },
    ],
    "proxy_settings": {"useApifyProxy": True},
}

# Start the Actor with the input above and keep the returned run object.
run = client.actor("danielherman/fast-scraper").call(run_input=run_input)

# call() is documented as returning `dict | None`; fail with a clear message
# instead of an opaque TypeError when no run object comes back.
if run is None:
    raise RuntimeError("Actor run failed: no run object was returned.")

# Look the dataset id up once and reuse it for both the link and the fetch.
dataset_id = run["defaultDatasetId"]
print(
    "💾 Check your data here: "
    f"https://console.apify.com/storage/datasets/{dataset_id}"
)

# Print every item stored in the run's default dataset.
for item in client.dataset(dataset_id).iterate_items():
    print(item)
52
53