Facebook
From Matheuss, 3 Years ago, written in Plain Text.
This paste is a reply to Re: Re: amazon from Social Lemur - go back
Embed
Viewing differences between Re: Re: amazon and Re: Re: Re: amazon
{
  "start_urls":
  [
    "https://www.amazon.es/s?k=irrigador+dental&__mk_es_ES=%C3%85M%C3%85%C5%BD%C3%95%C3%91&qid=1575978395&ref=sr_pg_1"
  ],
  "fields": {
{{
  "start_urls":
  [
    "https://www.amazon.es/s?k=irrigador+dental&__mk_es_ES=%C3%85M%C3%85%C5%BD%C3%95%C3%91&qid=1575978395&ref=sr_pg_1"
  ],
  "fields": {
    "name": "//h1[@id='title']/span[@id='productTitle']/text()",
    "price": "//span[@id='priceblock_ourprice']/text()|//span[@id='priceblock_saleprice']/text()",
    "price_old": "//span[@class='priceBlockStrikePriceString a-text-strike']/text()",
    "reference": "",
    "image": "//div[@id='imgTagWrapperId']/img/@src",
    "description": "//div[@id='productDescription']//text()",
    "brand": "",
    "brand_text": "//*[@id='bylineInfo_feature_div']/div/a/text()",
    "categories": "//div[@id='wayfinding-breadcrumbs_container']//ul/li/span[@class='a-list-item']/a/text()",
    "availability": "//div[@class='a-section']/div[@id='availability']/span/text()",
    "rating_average": "//span[@class='a-declarative']//span[@data-hook='rating-out-of-text']/text()",
    "rating_count": "//*[@id='reviewsMedley']/div/div[1]/div[1]/div[2]/span/text()",
    "barcode": "",
    "stock": "",
    "seller": "//div[@id='merchant-info']/a[@id='sellerProfileTriggerId']/text()"
  },
  "links": {
    "detail": "//h2/a[contains(@class,'a-text-normal') and not(contains(@href,'pantry'))]|//div[@class='s-item-container' and not(self::*//img[contains(@src,'pantry')])]//h2/parent::a[contains(@class,'a-text-normal')]",
    "next_page": "//a[(contains(.,'Siguiente') or contains(.,'siguiente')) and not(contains(@class,'carousel-goto-nextpage'))]"
  },
  "regex": {
    "rating_average": ["(.*?)de", 1],
    "rating_count": ["(.*?)valoraci", 1]
  }
}
    "name": "//h1[@id='title']/span[@id='productTitle']/text()",
    "price": "//span[@id='priceblock_ourprice']/text()|//span[@id='priceblock_saleprice']/text()",
    "price_old": "//span[@class='priceBlockStrikePriceString a-text-strike']/text()",
    "reference": "",
    "image": "//div[@id='imgTagWrapperId']/img/@src",
    "description": "//div[@id='productDescription']//text()",
    "brand": "",
    "brand_text": "//*[@id='bylineInfo_feature_div']/div/a/text()",
    "categories": "//div[@id='wayfinding-breadcrumbs_container']//ul/li/span[@class='a-list-item']/a/text()",
    "availability": "//div[@class='a-section']/div[@id='availability']/span/text()",
    "rating_average": "//span[@class='a-declarative']//span[@data-hook='rating-out-of-text']/text()",
    "rating_count": "//*[@id='reviewsMedley']/div/div[1]/div[1]/div[2]/span/text()",
    "barcode": "",
    "stock": "",
    "seller": "//div[@id='merchant-info']/a[@id='sellerProfileTriggerId']/text()"
  },
  "links": {
    "detail": "//h2/a[contains(@class,'a-text-normal') and not(contains(@href,'pantry'))]|//div[@class='s-item-container' and not(self::*//img[contains(@src,'pantry')])]//h2/parent::a[contains(@class,'a-text-normal')]",
    "next_page": "//a[(contains(.,'Siguiente') or contains(.,'siguiente')) and not(contains(@class,'carousel-goto-nextpage'))]"
  },
  "regex": {
    "rating_average": ["(.*?)de", 1],
    "rating_count": ["(.*?)valoraci", 1]
  }
}