Facebook
From yo, 4 Years ago, written in Plain Text.
This paste is a reply to Untitled from yo - view diff
Embed
Download Paste or View Raw
Hits: 260
  1. {
  2.   "start_urls":
  3.   [
  4.     "https://www.amazon.es/b/ref=pantry-wayfinder-3-1-4?node=15426699031",
  5.     "https://www.amazon.es/s?rh=n%3A6198072031%2Cn%3A%2114849352031%2Cn%3A%2114849354031%2Cn%3A15426699031&page=2&qid=1576664435&ref=lp_15426699031_pg_2",
  6.     "https://www.amazon.es/s?i=grocery&rh=n%3A6198072031%2Cn%3A14849352031%2Cn%3A14849354031%2Cn%3A15426699031&page=3&qid=1576664490&ref=sr_pg_3",
  7.     "https://www.amazon.es/s?i=grocery&rh=n%3A6198072031%2Cn%3A14849352031%2Cn%3A14849354031%2Cn%3A15426699031&page=4&qid=1576664545&ref=sr_pg_4",
  8.     "https://www.amazon.es/s?i=grocery&rh=n%3A6198072031%2Cn%3A14849352031%2Cn%3A14849354031%2Cn%3A15426699031&page=5&qid=1576664563&ref=sr_pg_5",
  9.     "https://www.amazon.es/s?i=grocery&rh=n%3A6198072031%2Cn%3A14849352031%2Cn%3A14849354031%2Cn%3A15426699031&page=6&qid=1576664656&ref=sr_pg_6",
  10.     "https://www.amazon.es/s?i=grocery&rh=n%3A6198072031%2Cn%3A14849352031%2Cn%3A14849354031%2Cn%3A15426699031&page=7&qid=1576664666&ref=sr_pg_7",
  11.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A4346878031&dc&fst=as%3Aoff&qid=1573662807&rnid=3677431031&ref=sr_nr_n_1",
  12.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A4347676031&dc&fst=as%3Aoff&qid=1573662931&rnid=3677431031&ref=sr_nr_n_2",
  13.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A4346879031&dc&fst=as%3Aoff&qid=1573662983&rnid=3677431031&ref=sr_nr_n_3",
  14.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A4346880031&dc&fst=as%3Aoff&qid=1573662957&rnid=3677431031&ref=sr_nr_n_4",
  15.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A4346882031&dc&fst=as%3Aoff&qid=1573663005&rnid=3677431031&ref=sr_nr_n_5",
  16.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A4346884031&dc&fst=as%3Aoff&qid=1573663030&rnid=3677431031&ref=sr_nr_n_6",
  17.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A4347698031&dc&fst=as%3Aoff&qid=1573663051&rnid=3677431031&ref=sr_nr_n_7",
  18.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A4346918031&dc&fst=as%3Aoff&qid=1573663095&rnid=3677431031&ref=sr_nr_n_9",
  19.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A6691131031&dc&fst=as%3Aoff&qid=1573663203&rnid=3677431031&ref=sr_nr_n_10",
  20.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A4346885031&dc&fst=as%3Aoff&qid=1573663602&rnid=3677431031&ref=sr_nr_n_11",
  21.     "https://www.amazon.es/s?i=pantry&srs=10547412031&bbn=10858545031&rh=n%3A10858545031%2Cn%3A%213677431031%2Cn%3A4346886031&dc&fst=as%3Aoff&qid=1573663621&rnid=3677431031&ref=sr_nr_n_12"
  22.   ],
  23.   "fields": {
  24.     "name": "//h1[@id='title']/span[@id='productTitle']/text()",
  25.     "price": "//td[@class='a-span12']/span[@id='priceblock_ourprice']",
  26.     "price_old": "//span[@class='priceBlockStrikePriceString a-text-strike']/text()",
  27.     "reference": "",
  28.     "image": "//div[@id='imgTagWrapperId']/img/@src",
  29.     "description": "//div[@id='productDescription']//text()",
  30.     "brand": "",
  31.     "brand_text": "//div[@id='merchant-info']/a[@id='sellerProfileTriggerId']/text()",
  32.     "categories": "//div[@id='wayfinding-breadcrumbs_container']//ul/li/span[@class='a-list-item']/a/text()",
  33.     "availability": "//div[@class='a-section']/div[@id='availability']/span/text()",
  34.     "rating_average": "//span[@class='a-declarative']//span[@data-hook='rating-out-of-text']/text()",
  35.     "rating_count": "//*[@id='reviewsMedley']/div/div[1]/div[1]/div[2]",
  36.     "barcode": "",
  37.     "stock": "",
  38.     "seller": "//div[@id='merchant-info']/a[@id='sellerProfileTriggerId']/text()"
  39.   },
  40.   "links": {
  41.     "detail": "(//i[@aria-label='Amazon Pantry']/parent::span/parent::a[contains(@class,'a-link-normal')]|//img[@aria-label='Amazon Pantry']/preceding-sibling::a[contains(@class,'a-text-normal')])",
  42.     "next_page": "//a[(contains(.,'Siguiente') or contains(.,'siguiente')) and not(contains(@class,'carousel-goto-nextpage'))]"
  43.   },
  44.   "regex": {
  45.     "rating_average": ["(.*?)de", 1],
  46.     "rating_count": ["(.*?)valoraciones", 1]
  47.   }
  48. }