From 326a33fafeaade21cc97cea1fe5e50c0dbea40d5 Mon Sep 17 00:00:00 2001 From: asciimoo Date: Sat, 2 Nov 2013 18:07:48 +0100 Subject: [PATCH] [enh] better url comparison --- searx/engines/__init__.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/searx/engines/__init__.py b/searx/engines/__init__.py index a1205f6c3..29ec5af16 100644 --- a/searx/engines/__init__.py +++ b/searx/engines/__init__.py @@ -147,8 +147,10 @@ def search(query, request, selected_categories): score = int((flat_len - i)/engines_len)*settings.weights.get(res['engine'], 1)+1 duplicated = False for new_res in results: + p1 = res['parsed_url'].path[:-1] if res['parsed_url'].path.endswith('/') else res['parsed_url'].path + p2 = new_res['parsed_url'].path[:-1] if new_res['parsed_url'].path.endswith('/') else new_res['parsed_url'].path if res['parsed_url'].netloc == new_res['parsed_url'].netloc and\ - res['parsed_url'].path == new_res['parsed_url'].path and\ + p1 == p2 and\ res['parsed_url'].query == new_res['parsed_url'].query and\ res.get('template') == new_res.get('template'): duplicated = new_res