Loading searx/engines/brave.py +45 −23 Original line number Diff line number Diff line Loading @@ -4,10 +4,8 @@ """ from urllib.parse import urlencode from lxml import html from searx.utils import extract_text, eval_xpath, eval_xpath_list import chompjs, json import re import chompjs import json about = { "website": 'https://search.brave.com/', Loading @@ -21,6 +19,7 @@ base_url = "https://search.brave.com/" paging = False categories = ['images', 'videos', 'news'] # images, videos, news def request(query, params): args = { 'q': query, Loading @@ -28,38 +27,61 @@ def request(query, params): } params["url"] = f"{base_url}{categories[0]}?{urlencode(args)}" def get_image_results(text): results = [] datastr = "" for line in text.split("\n"): if "const data = " in line: datastr = line.replace("const data = ", "").strip()[:-1] break json_data = chompjs.parse_js_object(datastr) def get_video_results(json_data): results = [] for result in json_data[1]["data"]["body"]["response"]["results"]: for result in json_data: results.append( { 'template': 'images.html', 'template': 'videos.html', 'url': result['url'], 'thumbnail_src': result['thumbnail']['src'], 'img_src': result['properties']['url'], 'content': result['description'], 'title': result['title'], 'source': result['source'], 'img_format': result['properties']['format'], 'duration': result['video']['duration'], } ) return results def response(resp): dom = html.fromstring(resp.text) results = [] datastr = "" for line in resp.text.split("\n"): if "const data = " in line: datastr = line.replace("const data = ", "").strip()[:-1] break json_data = chompjs.parse_js_object(datastr) json_results = json_data[1]["data"]["body"]["response"]["results"] with open("outfile.json", "w") as f: json.dump(json_data, f) for result in json_results: item = { 'url': result['url'], 'title': result['title'], 'content': result['description'], } if result['thumbnail'] != "null": item['thumbnail'] = result['thumbnail']['src'] match categories[0]: case 'images': return get_image_results(resp.text) case _: return [] No newline at end of file item['template'] = 'images.html' item['img_format'] = result['properties']['format'] item['source'] = result['source'] item['img_src'] = result['properties']['url'] case 'videos': item['template'] = 'videos.html' item['length'] = result['video']['duration'] results.append(item) return results searx/settings.yml +6 −0 Original line number Diff line number Diff line Loading @@ -1849,6 +1849,12 @@ engines: categories: images disabled: false - name: brave.videos shortcut: bravevid engine: brave categories: videos disabled: false - name: petalsearch shortcut: pts engine: xpath Loading Loading
searx/engines/brave.py +45 −23 Original line number Diff line number Diff line Loading @@ -4,10 +4,8 @@ """ from urllib.parse import urlencode from lxml import html from searx.utils import extract_text, eval_xpath, eval_xpath_list import chompjs, json import re import chompjs import json about = { "website": 'https://search.brave.com/', Loading @@ -21,6 +19,7 @@ base_url = "https://search.brave.com/" paging = False categories = ['images', 'videos', 'news'] # images, videos, news def request(query, params): args = { 'q': query, Loading @@ -28,38 +27,61 @@ def request(query, params): } params["url"] = f"{base_url}{categories[0]}?{urlencode(args)}" def get_image_results(text): results = [] datastr = "" for line in text.split("\n"): if "const data = " in line: datastr = line.replace("const data = ", "").strip()[:-1] break json_data = chompjs.parse_js_object(datastr) def get_video_results(json_data): results = [] for result in json_data[1]["data"]["body"]["response"]["results"]: for result in json_data: results.append( { 'template': 'images.html', 'template': 'videos.html', 'url': result['url'], 'thumbnail_src': result['thumbnail']['src'], 'img_src': result['properties']['url'], 'content': result['description'], 'title': result['title'], 'source': result['source'], 'img_format': result['properties']['format'], 'duration': result['video']['duration'], } ) return results def response(resp): dom = html.fromstring(resp.text) results = [] datastr = "" for line in resp.text.split("\n"): if "const data = " in line: datastr = line.replace("const data = ", "").strip()[:-1] break json_data = chompjs.parse_js_object(datastr) json_results = json_data[1]["data"]["body"]["response"]["results"] with open("outfile.json", "w") as f: json.dump(json_data, f) for result in json_results: item = { 'url': result['url'], 'title': result['title'], 'content': result['description'], } if result['thumbnail'] != "null": item['thumbnail'] = result['thumbnail']['src'] match categories[0]: case 'images': return get_image_results(resp.text) case _: return [] No newline at end of file item['template'] = 'images.html' item['img_format'] = result['properties']['format'] item['source'] = result['source'] item['img_src'] = result['properties']['url'] case 'videos': item['template'] = 'videos.html' item['length'] = result['video']['duration'] results.append(item) return results
searx/settings.yml +6 −0 Original line number Diff line number Diff line Loading @@ -1849,6 +1849,12 @@ engines: categories: images disabled: false - name: brave.videos shortcut: bravevid engine: brave categories: videos disabled: false - name: petalsearch shortcut: pts engine: xpath Loading