[feat] engine: brave - support for videos (cae06f27) · Commits · e / infra / spot

searx/engines/brave.py

+45 −23

Original line number	Diff line number	Diff line
		@@ -4,10 +4,8 @@
		"""

		from urllib.parse import urlencode
		from lxml import html
		from searx.utils import extract_text, eval_xpath, eval_xpath_list
		import chompjs, json
		import re
		import chompjs
		import json

		about = {
		"website": 'https://search.brave.com/',
		@@ -21,6 +19,7 @@ base_url = "https://search.brave.com/"
		paging = False
		categories = ['images', 'videos', 'news'] # images, videos, news


		def request(query, params):
		args = {
		'q': query,
		@@ -28,38 +27,61 @@ def request(query, params):
		}
		params["url"] = f"{base_url}{categories[0]}?{urlencode(args)}"

		def get_image_results(text):
		results = []

		datastr = ""
		for line in text.split("\n"):
		if "const data = " in line:
		datastr = line.replace("const data = ", "").strip()[:-1]
		break

		json_data = chompjs.parse_js_object(datastr)
		def get_video_results(json_data):
		results = []

		for result in json_data[1]["data"]["body"]["response"]["results"]:
		for result in json_data:
		results.append(
		{
		'template': 'images.html',
		'template': 'videos.html',
		'url': result['url'],
		'thumbnail_src': result['thumbnail']['src'],
		'img_src': result['properties']['url'],
		'content': result['description'],
		'title': result['title'],
		'source': result['source'],
		'img_format': result['properties']['format'],
		'duration': result['video']['duration'],
		}
		)

		return results


		def response(resp):
		dom = html.fromstring(resp.text)
		results = []

		datastr = ""
		for line in resp.text.split("\n"):
		if "const data = " in line:
		datastr = line.replace("const data = ", "").strip()[:-1]
		break

		json_data = chompjs.parse_js_object(datastr)
		json_results = json_data[1]["data"]["body"]["response"]["results"]

		with open("outfile.json", "w") as f:
		json.dump(json_data, f)

		for result in json_results:
		item = {
		'url': result['url'],
		'title': result['title'],
		'content': result['description'],
		}
		if result['thumbnail'] != "null":
		item['thumbnail'] = result['thumbnail']['src']

		match categories[0]:
		case 'images':
		return get_image_results(resp.text)
		case _:
		return []
		No newline at end of file
		item['template'] = 'images.html'
		item['img_format'] = result['properties']['format']
		item['source'] = result['source']
		item['img_src'] = result['properties']['url']
		case 'videos':
		item['template'] = 'videos.html'
		item['length'] = result['video']['duration']

		results.append(item)

		return results

searx/settings.yml

+6 −0

Original line number	Diff line number	Diff line
		@@ -1849,6 +1849,12 @@ engines:
		categories: images
		disabled: false

		- name: brave.videos
		shortcut: bravevid
		engine: brave
		categories: videos
		disabled: false

		- name: petalsearch
		shortcut: pts
		engine: xpath