Update XPath for Google engine

This commit is contained in:
Émilien Devos 2022-01-17 21:49:57 +00:00 committed by GitHub
parent 96ab5e57ff
commit 6670063e0d
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
1 changed file with 4 additions and 4 deletions

View File

@@ -111,8 +111,8 @@ filter_mapping = {0: 'off', 1: 'medium', 2: 'high'}
# specific xpath variables # specific xpath variables
# ------------------------ # ------------------------
# google results are grouped into <div class="g" ../> # google results are grouped into <div class="g ..." ../>
results_xpath = '//div[@class="g"]' results_xpath = '//div[contains(@class, "g")]'
# google *sections* are no usual *results*, we ignore them # google *sections* are no usual *results*, we ignore them
g_section_with_header = './g-section-with-header' g_section_with_header = './g-section-with-header'
@@ -124,8 +124,8 @@ title_xpath = './/h3[1]'
# href=...> # href=...>
href_xpath = './/div[@class="yuRUbf"]//a/@href' href_xpath = './/div[@class="yuRUbf"]//a/@href'
# in the result group there is <div class="IsZvec" ../> containing he *content* # in the result group there is <div class="VwiC3b ..." ../> containing the *content*
content_xpath = './/div[@class="IsZvec"]' content_xpath = './/div[contains(@class, "VwiC3b")]'
# Suggestions are links placed in a *card-section*, we extract only the text # Suggestions are links placed in a *card-section*, we extract only the text
# from the links not the links itself. # from the links not the links itself.