[enh] Add Pagination to Wiby / Fix Kaufland (#3000)

* [fix] Fix Kaufland engine

Changed XPath expressions

* [enh] Remove tracking params from Kaufland results

* [enh] Add pagination to Wiby

* [fix] Properly select title_xpath

Co-authored-by: Noémi Ványi <kvch@users.noreply.github.com>
This commit is contained in:
Allen 2021-10-10 20:52:06 +02:00 committed by GitHub
parent 79dc10e382
commit b0888c6ca3
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
2 changed files with 5 additions and 4 deletions

View File

@ -21,7 +21,7 @@ from urllib.parse import urlunparse, parse_qsl, urlencode
regexes = {re.compile(r'utm_[^&]+'),
re.compile(r'(wkey|wemail)[^&]*'),
re.compile(r'(_hsenc|_hsmi|hsCtaTracking|__hssc|__hstc|__hsfp)[^&]*'),
re.compile(r'(_hsenc|_hsmi|hsCtaTracking|__hssc|__hstc|__hsfp|search_value)[^&]*'),
re.compile(r'&$')}
name = gettext('Tracker URL remover')

View File

@ -1231,7 +1231,8 @@ engines:
- name : wiby
engine : json_engine
search_url : https://wiby.me/json/?q={query}
paging : True
search_url : https://wiby.me/json/?q={query}&o={pageno}0
url_query : URL
title_query : Title
content_query : Snippet
@ -1533,8 +1534,8 @@ engines:
timeout : 3.0
paging : True
search_url : https://www.kaufland.de/item/search/?search_value={query}&page={pageno}
title_xpath : //li[@class="product__title"]
url_xpath : //div[@class="product"]//a/@href
title_xpath : //div[@class="product__title"]/text()
url_xpath : //article[@class="product"]//a/@href
content_xpath : //div[@class="price"]
#thumbnail_xpath : '//div[@class="product__image-container"]//img/@data-src'
categories : general