[fix] indexing ++ url extraction

2024-11-23 11:21:00 +00:00 · 2014-03-21 16:36:13 +01:00 · 2014-03-21 16:36:13 +01:00 · 01c2eeb8ff
commit 01c2eeb8ff
parent 3854703d95
1 changed file with 5 additions and 2 deletions
--- a/searx/engines/yahoo.py
+++ b/searx/engines/yahoo.py
@@ -47,8 +47,11 @@ def response(resp):
    dom = html.fromstring(resp.text)

    for result in dom.xpath(results_xpath):
+        try:
            url = parse_url(extract_url(result.xpath(url_xpath), search_url))
            title = extract_text(result.xpath(title_xpath)[0])
+        except:
+            continue
        content = extract_text(result.xpath(content_xpath)[0])
        results.append({'url': url, 'title': title, 'content': content})