mirror of
				https://github.com/searxng/searxng.git
				synced 2025-10-30 10:12:31 -04:00 
			
		
		
		
	
		
			
				
	
	
		
			85 lines
		
	
	
		
			2.1 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			85 lines
		
	
	
		
			2.1 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| # DokuWiki
 | |
| #
 | |
| # @website     https://www.dokuwiki.org/
 | |
| # @provide-api yes
 | |
| #              (https://www.dokuwiki.org/devel:xmlrpc)
 | |
| #
 | |
| # @using-api   no
 | |
| # @results     HTML
 | |
| # @stable      yes
 | |
| # @parse       (general)    url, title, content
 | |
| 
 | |
| from lxml.html import fromstring
 | |
| from searx.engines.xpath import extract_text
 | |
| from searx.url_utils import urlencode
 | |
| 
 | |
# engine dependent config
categories = ['general']  # TODO: 'images', 'music', 'videos', 'files'
paging = False
language_support = False
number_of_results = 5

# search-url
# DokuWiki is OpenSearch compatible
# base_url is prepended to search_url when the request URL is built.
base_url = 'http://localhost:8090'
# {query} is replaced with the url-encoded ``id=<search terms>`` pair.
search_url = '/?do=search&{query}'
# TODO: '&startRecord={offset}'
# TODO: '&maximumRecords={limit}'
 | |
| 
 | |
| 
 | |
| # do search-request
 | |
def request(query, params):
    """Set ``params['url']`` to the search URL for *query*.

    The query is url-encoded as the ``id`` parameter, substituted into
    ``search_url`` and appended to ``base_url``.  The same ``params``
    dict is returned after being updated in place.
    """
    encoded_query = urlencode({'id': query})
    params['url'] = base_url + search_url.format(query=encoded_query)
    return params
 | |
| 
 | |
| 
 | |
| # get response from search-request
 | |
def _extract_wikilink(node):
    """Return ``(href, title)`` for the wiki link found under *node*.

    The href is the last ``a.wikilink1`` href below *node*; the title is
    the text extracted from the ``title`` attributes of those anchors.
    Returns ``None`` when no such anchor exists or its href is empty, so
    callers can skip the entry instead of relying on a raised IndexError.
    """
    hrefs = node.xpath('.//a[@class="wikilink1"]/@href')
    if not hrefs or not hrefs[-1]:
        return None

    title = extract_text(node.xpath('.//a[@class="wikilink1"]/@title'))
    return hrefs[-1], title


def response(resp):
    """Parse a search result page into a list of result dicts.

    Two sections of the page are read:

    * "Quickhits": every ``<li>`` under ``div.search_quickresult``
      becomes a result with empty content.
    * Full-text hits: children of ``dl.search_results``, where a ``<dt>``
      carries the link and each following ``<dd>`` carries the snippet.

    Each result is a dict with the keys ``title``, ``content`` and
    ``url``; ``url`` is ``base_url`` plus the href found in the page.
    Entries without a usable link are skipped.
    """
    results = []

    doc = fromstring(resp.text)

    # Quickhits
    for item in doc.xpath('//div[@class="search_quickresult"]/ul/li'):
        link = _extract_wikilink(item)
        if link is None:
            continue

        res_url, title = link
        results.append({'title': title,
                        'content': "",
                        'url': base_url + res_url})

    # Search results
    # Link of the most recent <dt>.  It starts as None and is reset when a
    # <dt> has no usable link, so a <dd> is never paired with a link that
    # belongs to a quick hit or to an earlier, unrelated <dt>.
    current_link = None
    for node in doc.xpath('//dl[@class="search_results"]/*'):
        if node.tag == "dt":
            current_link = _extract_wikilink(node)
        elif node.tag == "dd" and current_link is not None:
            res_url, title = current_link
            results.append({'title': title,
                            'content': extract_text(node.xpath('.')),
                            'url': base_url + res_url})

    return results
 |