From 5b50d7455a719b145be5f90069026a60b480673d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?No=C3=A9mi=20V=C3=A1nyi?= Date: Tue, 2 Aug 2022 19:19:12 +0200 Subject: [PATCH] Do not consent to tracking when using google --- searx/engines/google.py | 3 ++- searx/engines/google_news.py | 3 ++- searx/engines/google_scholar.py | 3 ++- searx/engines/google_videos.py | 3 ++- searx/engines/youtube_noapi.py | 3 ++- 5 files changed, 10 insertions(+), 5 deletions(-) diff --git a/searx/engines/google.py b/searx/engines/google.py index 707bff8a..1388550b 100644 --- a/searx/engines/google.py +++ b/searx/engines/google.py @@ -11,6 +11,7 @@ Definitions`_. # pylint: disable=invalid-name, missing-function-docstring, too-many-branches from urllib.parse import urlencode, urlparse +from random import random from lxml import html from searx import logger from searx.utils import match_language, extract_text, eval_xpath, eval_xpath_list, eval_xpath_getindex @@ -236,7 +237,7 @@ def request(query, params): params['url'] = query_url logger.debug("HTTP header Accept-Language --> %s", lang_info.get('Accept-Language')) - params['cookies']['CONSENT'] = "YES+" + params['cookies']['CONSENT'] = "PENDING+" + str(random()*100) params['headers'].update(lang_info['headers']) if use_mobile_ui: params['headers']['Accept'] = '*/*' diff --git a/searx/engines/google_news.py b/searx/engines/google_news.py index c9b23ccc..ff39543d 100644 --- a/searx/engines/google_news.py +++ b/searx/engines/google_news.py @@ -21,6 +21,7 @@ import binascii import re from urllib.parse import urlencode from base64 import b64decode +from random import random from lxml import html from searx import logger @@ -113,7 +114,7 @@ def request(query, params): logger.debug("HTTP header Accept-Language --> %s", lang_info.get('Accept-Language')) - params['cookies']['CONSENT'] = "YES+" + params['cookies']['CONSENT'] = "PENDING+" + str(random()*100) params['headers'].update(lang_info['headers']) params['headers']['Accept'] = ( 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8' diff --git a/searx/engines/google_scholar.py b/searx/engines/google_scholar.py index 307380ff..2978d403 100644 --- a/searx/engines/google_scholar.py +++ b/searx/engines/google_scholar.py @@ -12,6 +12,7 @@ Definitions`_. from urllib.parse import urlencode from datetime import datetime +from random import random from lxml import html from searx import logger @@ -99,7 +100,7 @@ def request(query, params): params['url'] = query_url logger.debug("HTTP header Accept-Language --> %s", lang_info.get('Accept-Language')) - params['cookies']['CONSENT'] = "YES+" + params['cookies']['CONSENT'] = "PENDING+" + str(random()*100) params['headers'].update(lang_info['headers']) params['headers']['Accept'] = ( 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8' diff --git a/searx/engines/google_videos.py b/searx/engines/google_videos.py index 1c286d03..8665181a 100644 --- a/searx/engines/google_videos.py +++ b/searx/engines/google_videos.py @@ -22,6 +22,7 @@ Definitions`_. Not all parameters can be appied. import re from urllib.parse import urlencode +from random import random from lxml import html from searx import logger @@ -139,7 +140,7 @@ def request(query, params): params['url'] = query_url logger.debug("HTTP header Accept-Language --> %s", lang_info.get('Accept-Language')) - params['cookies']['CONSENT'] = "YES+" + params['cookies']['CONSENT'] = "PENDING+" + str(random()*100) params['headers'].update(lang_info['headers']) params['headers']['Accept'] = ( 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8' diff --git a/searx/engines/youtube_noapi.py b/searx/engines/youtube_noapi.py index d9af3429..e043b743 100644 --- a/searx/engines/youtube_noapi.py +++ b/searx/engines/youtube_noapi.py @@ -6,6 +6,7 @@ from functools import reduce from json import loads, dumps from urllib.parse import quote_plus +from random import random # about about = { @@ -43,7 +44,7 @@ base_youtube_url = 'https://www.youtube.com/watch?v=' # do search-request def request(query, params): - params['cookies']['CONSENT'] = "YES+" + params['cookies']['CONSENT'] = "PENDING+" + str(random() * 100) if not params['engine_data'].get('next_page_token'): params['url'] = search_url.format(query=quote_plus(query), page=params['pageno']) if params['time_range'] in time_range_dict: