mirror of
				https://github.com/searxng/searxng.git
				synced 2025-11-03 11:07:07 -05:00 
			
		
		
		
	- ValueError in duration: issue reported in #3799 - HTML in title: related to #3770 [#3799] https://github.com/searxng/searxng/issues/3799 [#3770] https://github.com/searxng/searxng/pull/3770 Signed-off-by: Markus Heiser <markus.heiser@darmarit.de>
		
			
				
	
	
		
			104 lines
		
	
	
		
			2.6 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			104 lines
		
	
	
		
			2.6 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
# SPDX-License-Identifier: AGPL-3.0-or-later
 | 
						|
"""Bilibili is a Chinese video sharing website.
 | 
						|
 | 
						|
.. _Bilibili: https://www.bilibili.com
 | 
						|
"""
 | 
						|
 | 
						|
import random
 | 
						|
import string
 | 
						|
from urllib.parse import urlencode
 | 
						|
from datetime import datetime, timedelta
 | 
						|
 | 
						|
from searx import utils
 | 
						|
 | 
						|
# Engine metadata
 | 
						|
about = {
 | 
						|
    "website": "https://www.bilibili.com",
 | 
						|
    "wikidata_id": "Q3077586",
 | 
						|
    "official_api_documentation": None,
 | 
						|
    "use_official_api": False,
 | 
						|
    "require_api_key": False,
 | 
						|
    "results": "JSON",
 | 
						|
}
 | 
						|
 | 
						|
# Engine configuration
 | 
						|
paging = True
 | 
						|
results_per_page = 20
 | 
						|
categories = ["videos"]
 | 
						|
 | 
						|
# Search URL
 | 
						|
base_url = "https://api.bilibili.com/x/web-interface/search/type"
 | 
						|
 | 
						|
cookie = {
 | 
						|
    "innersign": "0",
 | 
						|
    "buvid3": "".join(random.choice(string.hexdigits) for _ in range(16)) + "infoc",
 | 
						|
    "i-wanna-go-back": "-1",
 | 
						|
    "b_ut": "7",
 | 
						|
    "FEED_LIVE_VERSION": "V8",
 | 
						|
    "header_theme_version": "undefined",
 | 
						|
    "home_feed_column": "4",
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
def request(query, params):
 | 
						|
    query_params = {
 | 
						|
        "__refresh__": "true",
 | 
						|
        "page": params["pageno"],
 | 
						|
        "page_size": results_per_page,
 | 
						|
        "single_column": "0",
 | 
						|
        "keyword": query,
 | 
						|
        "search_type": "video",
 | 
						|
    }
 | 
						|
 | 
						|
    params["url"] = f"{base_url}?{urlencode(query_params)}"
 | 
						|
    params["cookies"] = cookie
 | 
						|
 | 
						|
    return params
 | 
						|
 | 
						|
 | 
						|
# Format the video duration
 | 
						|
def format_duration(duration):
 | 
						|
    if not ":" in duration:
 | 
						|
        return None
 | 
						|
    minutes, seconds = map(int, duration.split(":"))
 | 
						|
    total_seconds = minutes * 60 + seconds
 | 
						|
 | 
						|
    formatted_duration = str(timedelta(seconds=total_seconds))[2:] if 0 <= total_seconds < 3600 else ""
 | 
						|
 | 
						|
    return formatted_duration
 | 
						|
 | 
						|
 | 
						|
def response(resp):
 | 
						|
    search_res = resp.json()
 | 
						|
 | 
						|
    results = []
 | 
						|
 | 
						|
    for item in search_res.get("data", {}).get("result", []):
 | 
						|
        title = utils.html_to_text(item["title"])
 | 
						|
        url = item["arcurl"]
 | 
						|
        thumbnail = item["pic"]
 | 
						|
        description = item["description"]
 | 
						|
        author = item["author"]
 | 
						|
        video_id = item["aid"]
 | 
						|
        unix_date = item["pubdate"]
 | 
						|
 | 
						|
        formatted_date = datetime.utcfromtimestamp(unix_date)
 | 
						|
        formatted_duration = format_duration(item["duration"])
 | 
						|
        iframe_url = f"https://player.bilibili.com/player.html?aid={video_id}&high_quality=1&autoplay=false&danmaku=0"
 | 
						|
 | 
						|
        results.append(
 | 
						|
            {
 | 
						|
                "title": title,
 | 
						|
                "url": url,
 | 
						|
                "content": description,
 | 
						|
                "author": author,
 | 
						|
                "publishedDate": formatted_date,
 | 
						|
                "length": formatted_duration,
 | 
						|
                "thumbnail": thumbnail,
 | 
						|
                "iframe_src": iframe_url,
 | 
						|
                "template": "videos.html",
 | 
						|
            }
 | 
						|
        )
 | 
						|
 | 
						|
    return results
 |