searxng/searx/search.py

115 lines
4.1 KiB
Python
Raw Normal View History

from searx.engines import (
categories, engines, engine_shortcuts
)
from searx.languages import language_codes
class Search(object):
    """Search information container.

    Built from an incoming HTTP request: reads the query, page number,
    language and engine/category selection from the request parameters
    and cookies, and stores them as attributes for the search run.
    """

    def __init__(self, request):
        """Populate the search settings from ``request``.

        ``request`` must expose ``cookies``, ``method`` and ``form`` /
        ``args`` (mapping-like objects).

        Raises:
            Exception('noquery'): the ``q`` parameter is missing or empty.
            Exception('wrong pagenumber'): ``pageno`` is not a positive
                integer.
        """
        super(Search, self).__init__()
        self.query = None
        self.engines = []
        self.categories = []
        self.paging = False
        self.pageno = 1
        self.lang = 'all'

        # Comma separated engine names the user disabled via cookie.
        blocked_cookie = request.cookies.get('blocked_engines')
        self.blocked_engines = blocked_cookie.split(',') if blocked_cookie else []  # noqa

        self.results = []
        self.suggestions = []
        self.request_data = {}

        # Only accept a cookie language that is a known language id.
        cookie_lang = request.cookies.get('language')
        if cookie_lang and any(cookie_lang == lc[0] for lc in language_codes):
            self.lang = cookie_lang

        if request.method == 'POST':
            self.request_data = request.form
        else:
            self.request_data = request.args

        # TODO better exceptions
        if not self.request_data.get('q'):
            raise Exception('noquery')
        self.query = self.request_data['q']

        pageno_param = self.request_data.get('pageno', '1')
        if not pageno_param.isdigit() or int(pageno_param) < 1:
            raise Exception('wrong pagenumber')
        self.pageno = int(pageno_param)

        # May set self.lang and fill self.engines from ":lang" / "!engine"
        # prefixes; also strips those prefixes from self.query.
        self.parse_query()

        if self.engines:
            # Engines were chosen explicitly in the query: the categories
            # are simply the ones those engines were tagged with.
            self.categories = list(set(engine['category']
                                       for engine in self.engines))
            return

        self.categories = self._requested_categories(request)
        for categ in self.categories:
            self.engines.extend({'category': categ,
                                 'name': engine.name}
                                for engine in categories[categ]
                                if engine.name not in self.blocked_engines)

    def _requested_categories(self, request):
        """Return the category names selected by the request.

        Precedence: ``category_<name>`` request parameters, then the
        ``categories`` cookie, then the ``'general'`` fallback. Unknown
        category names are ignored.
        """
        prefix = 'category_'
        selected = [pd_name[len(prefix):]
                    for pd_name in self.request_data
                    if pd_name.startswith(prefix)
                    and pd_name[len(prefix):] in categories]
        if not selected:
            cookie_categories = request.cookies.get('categories', '')
            selected = [ccateg
                        for ccateg in cookie_categories.split(',')
                        if ccateg in categories]
        if not selected:
            selected = ['general']
        return selected

    def parse_query(self):
        """Consume leading ``:language`` and ``!engine`` prefixes.

        Each recognised prefix token is removed from ``self.query`` and
        applied to ``self.lang`` or ``self.engines``; parsing repeats until
        the first token is not a recognised prefix or the query is empty.
        """
        while True:
            query_parts = self.query.split()
            if not query_parts:
                # Nothing (left) to parse, e.g. the query was only prefixes
                # or only whitespace.
                return

            token = query_parts[0]
            if token.startswith(':'):
                modified = self._apply_language_prefix(token[1:].lower())
            elif token.startswith('!'):
                modified = self._apply_engine_prefix(
                    token[1:].replace('_', ' '))
            else:
                modified = False

            if not modified:
                return
            self.query = self.query.replace(token, '', 1).strip()

    def _apply_language_prefix(self, lang):
        """Set ``self.lang`` from a lowercased ``:lang`` token.

        Returns True when ``lang`` matched an entry of ``language_codes``.
        """
        if not lang:
            # A bare ":" would otherwise prefix-match every language id.
            return False
        for lc in language_codes:
            lang_id, lang_name, country = (part.lower() for part in lc)
            if lang == lang_id\
               or lang_id.startswith(lang)\
               or lang == lang_name\
               or lang == country:
                # Store the canonical id, not the user's spelling, so the
                # value has the same form as the cookie-provided language.
                self.lang = lc[0]
                return True
        return False

    def _apply_engine_prefix(self, prefix):
        """Add the engine(s) named by a ``!prefix`` token to ``self.engines``.

        ``prefix`` is tried as an engine shortcut, then as an engine name,
        then as a category name. Blocked engines are skipped. Returns True
        when the prefix was recognised.
        """
        if prefix in engine_shortcuts\
           and engine_shortcuts[prefix] not in self.blocked_engines:
            self.engines.append({'category': 'none',
                                 'name': engine_shortcuts[prefix]})
            return True
        if prefix in engines and prefix not in self.blocked_engines:
            self.engines.append({'category': 'none',
                                 'name': prefix})
            return True
        if prefix in categories:
            # blocked_engines holds names, so compare by engine.name.
            self.engines.extend({'category': prefix,
                                 'name': engine.name}
                                for engine in categories[prefix]
                                if engine.name not in self.blocked_engines)
            return True
        return False