Aol Engine Update

2024-01-01 19:24:07 +01:00 · 2024-09-28 17:34:28 +03:00 · 2024-09-28 17:34:28 +03:00 · 97cec586c0
commit 97cec586c0
parent 0226c1383f
7 changed files with 303 additions and 0 deletions
--- a/searx/engines/limetorrentlol.py
+++ b/searx/engines/limetorrentlol.py
@ -0,0 +1,34 @@
 from lxml import html
 from searx.utils import (
    extract_text,
    eval_xpath,
 )
 about = {
    "website": 'https://www.limetorrents.lol',
 }
 base_url = 'https://www.limetorrents.lol'
 def request(query, params):
    params['url'] = f"{base_url}/search/all/{query}/"
    return params
 def response(resp):
    results = []
    dom = html.fromstring(resp.text)
    for result in eval_xpath(dom,
                             '//table[@class="table2"]//tr[@bgcolor="#F4F4F4"] | //table[@class="table2"]//tr[@bgcolor="#FFFFFF"]'):
        title = result.xpath('.//td/div')
        title = extract_text(title[0]) if title else None
        url = result.xpath('.//td/div/a/@href')
        url = url[0] if url else None
        if url or title:
            results.append({'url': url, 'title': title,})
    return results
--- a/searx/engines/limetorrentnet.py
+++ b/searx/engines/limetorrentnet.py
@ -0,0 +1,41 @@
 """LimeTorrents
 """
 from urllib.parse import urlencode
 from lxml import html
 from searx.utils import (
    extract_text,
    eval_xpath,
 )
 about = {
    "website": 'https://limetorrent.net',
 }
 base_url = 'https://limetorrent.net'
 def request(query, params):
    query_params = {
        'q': query,
    }
    params['url'] = f"{base_url}/search/?{urlencode(query_params)}"
    return params
 def response(resp):
    results = []
    dom = html.fromstring(resp.text)
    for result in eval_xpath(dom, '//tbody/tr[@bgcolor="#F4F4F4"]'):
        title = result.xpath('.//td/div')
        title = extract_text(title[0]) if title else None
        url = result.xpath('.//td/div/a/@href')
        url = extract_text(url[0]) if url else None
        if url or title:
            results.append({'url': url, 'title': title, })
    return results
--- a/searx/engines/searchencrypt.py
+++ b/searx/engines/searchencrypt.py
@ -0,0 +1,39 @@
 from urllib.parse import urlencode
 from lxml import html
 from searx.utils import extract_text
 about = {
    "website": 'https://www.searchencrypt.com',
    "results": 'HTML',
 }
 safesearch = True
 base_url = 'https://www.searchencrypt.com/search'
 def request(query, params):
    query_params = {
        'q': query,
    }
    params['url'] = f'{base_url}?{urlencode(query_params)}'
    return params
 def response(resp):
    results = []
    dom = html.fromstring(resp.text)
    # Update XPath expressions based on provided HTML structure
    for result in dom.xpath('//div[@class="serp__web-result__container"]'):
        link = result.xpath('.//div/h3/a/@href')
        link = link[0] if link else None
        title = result.xpath('.//div/h3/a/span')
        title = extract_text(title[0]) if title else None
        content = result.xpath('.//div/p/a/span')
        content = extract_text(content[0]) if content else 'None'
        if link or title or content:
            results.append({'url': link, 'title': title, 'content': content})
    return results
--- a/searx/engines/sogou.py
+++ b/searx/engines/sogou.py
@ -0,0 +1,72 @@
 from urllib.parse import urlencode
 from lxml import html
 from searx.utils import extract_text
 about = {
    "website": 'https://www.sogou.com/',
    "results": 'HTML',
 }
 paging = True
 base_url = 'https://www.sogou.com/web'
 def request(query, params):
    page = params.get('pageno', 1)
    query_params = {
        'query': query,
        'page': page,
    }
    # Add the URL for the request
    params['url'] = f'{base_url}?{urlencode(query_params)}'
    # Custom headers for the request
    headers = {
        'Sec-Fetch-Mode': 'cors',
        'Sec-Fetch-Site': 'same-origin',
        'Origin': 'https://translate.sogou.com',
        'Accept-Encoding': 'gzip, deflate, br',
        'Accept-Language': 'en-US,en;q=0.9,zh-CN;q=0.8,zh;q=0.7',
        'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_5) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/77.0.3865.90 Safari/537.36',
        'Content-Type': 'application/x-www-form-urlencoded; charset=UTF-8',
        'Accept': 'application/json',
        'Referer': 'https://translate.sogou.com/',
        'X-Requested-With': 'XMLHttpRequest',
        'Connection': 'keep-alive',
    }
    # Merge with any existing headers in params
    if 'headers' in params:
        params['headers'].update(headers)
    else:
        params['headers'] = headers
    return params
 def response(resp):
    results = []
    dom = html.fromstring(resp.text)
    for result in dom.xpath('//div[@class="vrwrap"]'):
        # Extract link
        link_divs = result.xpath('.//div[contains(@class, "r-sech") and (contains(@class, "click-better-sugg") or contains(@class, "result_list"))]')
        link = link_divs[0].xpath('./@data-url')[0] if link_divs else None
        # Extract title
        title_elem = result.xpath('.//h3[@class="vr-title"]/a') or result.xpath('.//div/h3/a')
        title = title_elem[0].text_content().strip() if title_elem else None
        # Extract content from multiple possible elements
        content_elem = result.xpath('.//div[@class="fz-mid space-txt"]')
        content = content_elem[0].text_content().strip() if content_elem else 'None'
        if link or title:
            results.append({
                'url': link,
                'title': title,
                'content': content,
            })
    return results
--- a/searx/engines/torlock.py
+++ b/searx/engines/torlock.py
@ -0,0 +1,43 @@
 from lxml import html
 from searx.utils import (
    extract_text,
    eval_xpath,
 )
 about = {
    "website": 'https://www.torlock.com',
 }
 base_url = 'https://www.torlock.com'
 paging = True
 def request(query, params):
    params['url'] = f"{base_url}/all/torrents/{query}/{params.get('pageno', 1)}.html"
    return params
 def response(resp):
    results = []
    dom = html.fromstring(resp.text)
    for result in eval_xpath(dom, '(.//tr)'):
        url_elem = result.xpath('.//div[@style="float:left"]/a/@href')
        if url_elem:
            url = url_elem[0]
            if not (url.startswith("www") or url.startswith("http")):
                url = f"{base_url}{url}"
            else:
                url = None
        else:
            url = None
        title_elem = result.xpath('.//div[@style="float:left"]/a/b')
        title = extract_text(title_elem[0]) if title_elem else None
        if title and url:
            results.append({
                'url': url,
                'title': title,
            })
    return results
--- a/searx/engines/torrentdownloads.py
+++ b/searx/engines/torrentdownloads.py
@ -0,0 +1,38 @@
 from lxml import html
 from searx.utils import (
    extract_text,
    eval_xpath,
 )
 about = {
    "website": 'https://www.torrentdownloads.pro',
 }
 base_url = 'https://www.torrentdownloads.pro'
 def request(query, params):
    params['url'] = f"{base_url}/search/?search={query}"
    return params
 def response(resp):
    results = []
    dom = html.fromstring(resp.text)
    for result in eval_xpath(dom, '(//div[@class="inner_container"])[2]/div[contains(@class, "grey_bar3")]'):
        url_elem = result.xpath('.//p/a/@href')
        url = url_elem[0] if url_elem else None
        if url and not (url.startswith('www') or url.startswith('http')):
            url = f"{base_url}{url}"
        title_elem = result.xpath('.//p/a')
        title = extract_text(title_elem[0]) if title_elem else None
        if title and url:
            results.append({
                'url': url,
                'title': title,
            })
    return results
--- a/searx/settings.yml
+++ b/searx/settings.yml
@ -326,6 +326,42 @@ engines:
    categories: [ 'general', 'web' ]
    disabled: true
  - name: sogou
    engine: sogou
    shortcut: sogo
    categories: [ 'general', 'web' ]
    disabled: true
  - name: searchencrypt
    engine: searchencrypt
    shortcut: srchen
    categories: [ 'general', 'web' ]
    disabled: true
  - name: torlock
    engine: torlock
    categories: [ files, torrent ]
    shortcut: trlck
    disabled: true
  - name: torrentdownloads
    engine: torrentdownloads
    categories: [ files, torrent ]
    shortcut: trrnd
    disabled: true
  - name: limetorrent.net
    engine: limetorrentnet
    categories: [ files, torrent ]
    shortcut: lmtn
    disabled: true
  - name: limetorrent.lol
    engine: limetorrentlol
    categories: [ files, torrent ]
    shortcut: lmtl
    disabled: true
  - name: 9gag
    engine: 9gag
    shortcut: 9g