@@ -37,7 +37,8 @@ def get_product_details(context: BeautifulSoupCrawlingContext, category: str) ->
37
37
"""Scrape details of specific product."""
38
38
soup = context .soup
39
39
details = {
40
- 'sku' : soup .find ('span' , {'itemprop' : 'name' }).text ,
40
+ 'name' : soup .find ('span' , {'itemprop' : 'name' }).text ,
41
+ 'sku' : soup .find ('div' , {'itemprop' : 'sku' }).text ,
41
42
'category' : category ,
42
43
'price' : soup .find ('div' , 'product-info-price' ).find ('span' , 'price' ).text ,
43
44
'imageUrl' : soup .select ('.gallery-placeholder__image' )[0 ]['src' ].split ('?' )[0 ],
@@ -70,7 +71,7 @@ async def main() -> None:
70
71
async with Actor :
71
72
actor_input = await Actor .get_input () or {}
72
73
max_requests_per_crawl = actor_input .get ('max_requests_per_crawl' , 30 )
73
- desired_categories = {category .lower () for category in actor_input .get ('categories ' , [])}
74
+ desired_categories = {category .lower () for category in actor_input .get ('desired_categories ' , [])}
74
75
include_keywords = {word .lower () for word in actor_input .get ('include_keywords' , [])}
75
76
exclude_keywords = {word .lower () for word in actor_input .get ('exclude_keywords' , [])}
76
77
Actor .log .info (f'{ desired_categories = } , { include_keywords = } ,{ exclude_keywords = } ,{ max_requests_per_crawl = } ' )
0 commit comments