mirror of
				https://github.com/searxng/searxng
				synced 2024-01-01 19:24:07 +01:00 
			
		
		
		
	[fix] yahoo url mods
This commit is contained in:
		
							parent
							
								
									8c8d9d10cb
								
							
						
					
					
						commit
						4627788834
					
				
					 1 changed files with 5 additions and 1 deletions
				
			
		|  | @ -1,6 +1,7 @@ | |||
| #!/usr/bin/env python | ||||
| 
 | ||||
| from urllib import urlencode | ||||
| from urlparse import unquote | ||||
| from lxml import html | ||||
| from searx.engines.xpath import extract_text, extract_url | ||||
| 
 | ||||
|  | @ -33,7 +34,10 @@ def response(resp): | |||
|     dom = html.fromstring(resp.text) | ||||
| 
 | ||||
|     for result in dom.xpath(results_xpath): | ||||
|         url = extract_url(result.xpath(url_xpath), search_url) | ||||
|         url_string = extract_url(result.xpath(url_xpath), search_url) | ||||
|         start = url_string.find('/RU=')+4 | ||||
|         end = url_string.rfind('/RS') | ||||
|         url = unquote(url_string[start:end]) | ||||
|         title = extract_text(result.xpath(title_xpath)[0]) | ||||
|         content = extract_text(result.xpath(content_xpath)[0]) | ||||
|         results.append({'url': url, 'title': title, 'content': content}) | ||||
|  |  | |||
		Loading…
	
	Add table
		
		Reference in a new issue
	
	 Adam Tauber
						Adam Tauber