#!/usr/bin/env python

'''
searx is free software: you can redistribute it and/or modify
it under the terms of the GNU Affero General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.

searx is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU Affero General Public License for more details.

You should have received a copy of the GNU Affero General Public License
along with searx. If not, see < http://www.gnu.org/licenses/ >.

(C) 2013- by Adam Tauber,
'''

import os
if __name__ == "__main__":
    # When run as a script, make the parent directory importable so that the
    # `searx` package imports below resolve.
    from sys import path
    path.append(os.path.realpath(os.path.dirname(os.path.realpath(__file__))+'/../'))

from flask import Flask, request, render_template, url_for, Response, make_response, redirect
from searx.engines import search, categories, engines, get_engines_stats
from searx import settings
import json
import cStringIO
from searx.utils import UnicodeWriter
from flask import send_from_directory


app = Flask(__name__)
app.secret_key = settings.secret_key

# Form/query fields named "category_<name>" select the category <name>.
CATEGORY_FIELD_PREFIX = 'category_'

# Category used when neither the request nor the cookie selects a known one.
DEFAULT_CATEGORIES = ['general']

# Template for /opensearch.xml; `{method}` and `{host}` are filled in by
# opensearch().  Literal braces for the OpenSearch `{searchTerms}` placeholder
# are doubled so that str.format() leaves them intact.
# NOTE(review): the element markup of this template was missing from the copy
# under review (only the text values were left, so format() had nothing to
# substitute).  It is rebuilt here as an OpenSearch 1.1 description using the
# same text values -- confirm against the upstream template.
opensearch_xml = '''<?xml version="1.0" encoding="utf-8"?>
<OpenSearchDescription xmlns="http://a9.com/-/spec/opensearch/1.1/">
  <ShortName>searx</ShortName>
  <Description>Search searx</Description>
  <InputEncoding>UTF-8</InputEncoding>
  <LongName>searx meta search engine</LongName>
  <Url type="text/html" method="{method}" template="{host}">
    <Param name="q" value="{{searchTerms}}" />
  </Url>
</OpenSearchDescription>
'''


def _categories_from_fields(field_names):
    '''Return the known categories selected by ``category_<name>`` fields.

    `field_names` is an iterable of form/query field names.  Names without
    the prefix, and names whose suffix is not a key of `categories`, are
    ignored.  The order of `field_names` is preserved.
    '''
    prefix_len = len(CATEGORY_FIELD_PREFIX)
    selected = []
    for name in field_names:
        if not name.startswith(CATEGORY_FIELD_PREFIX):
            continue
        category = name[prefix_len:]
        if category in categories:
            selected.append(category)
    return selected


def _categories_from_cookie():
    '''Return the known categories stored in the ``categories`` cookie.

    The cookie holds a comma separated list (written by preferences());
    entries that are not keys of `categories` are dropped.
    '''
    stored = request.cookies.get('categories', '').split(',')
    return [name for name in stored if name in categories]


def _pretty_url(url):
    '''Shorten URLs longer than 74 characters to ``first 35 + [..] + last 35``.'''
    if len(url) > 74:
        return url[:35] + '[..]' + url[-35:]
    return url


def render(template_name, **kwargs):
    '''Render `template_name` with the category context every page needs.

    Always sets ``categories`` to the sorted category names.  When the caller
    does not pass ``selected_categories``, it is taken from the cookie and
    falls back to ``['general']``; a value passed by the caller is used as is.
    '''
    kwargs['categories'] = sorted(categories.keys())
    if 'selected_categories' not in kwargs:
        # NOTE(review): the default is applied only when the caller supplied
        # no selection; the flattened source did not show the nesting of this
        # fallback unambiguously -- confirm.
        kwargs['selected_categories'] = (_categories_from_cookie()
                                         or list(DEFAULT_CATEGORIES))
    return render_template(template_name, **kwargs)


def parse_query(query):
    '''Split a leading ``-<engine>`` selector off `query`.

    Returns ``(query, query_engines)``.  If the first whitespace separated
    word is ``-<name>`` and ``<name>`` is a key of `engines`, that word is
    removed from the returned query and ``query_engines`` holds one entry for
    the engine; otherwise the query is returned unchanged with an empty list.
    '''
    query_engines = []
    query_parts = query.split()
    # An empty or whitespace-only query has no first word to inspect.
    if not query_parts:
        return query, query_engines
    first = query_parts[0]
    if first.startswith('-') and first[1:] in engines:
        query_engines.append({'category': 'TODO', 'name': first[1:]})
        query = query.replace(first, '', 1).strip()
    return query, query_engines


@app.route('/', methods=['GET', 'POST'])
def index():
    '''Start page and search endpoint.

    Reads ``q`` from the form (POST) or the query string (GET).  Without a
    query the start page is rendered.  Otherwise the engines are chosen --
    from a ``-<engine>`` prefix in the query, else from ``category_*``
    fields, else from the cookie, else ``general`` -- the search is run and
    the results are returned as JSON (``format=json``), as a CSV download
    (``format=csv``) or as the rendered results page.
    '''
    if request.method == 'POST':
        request_data = request.form
    else:
        request_data = request.args

    # A missing, empty or whitespace-only query shows the start page.
    if not request_data.get('q', '').strip():
        return render('index.html')

    selected_categories = []
    query, selected_engines = parse_query(request_data['q'].encode('utf-8'))

    if not selected_engines:
        selected_categories = (_categories_from_fields(request_data.keys())
                               or _categories_from_cookie()
                               or list(DEFAULT_CATEGORIES))
        for categ in selected_categories:
            selected_engines.extend({'category': categ, 'name': x.name}
                                    for x in categories[categ])

    results, suggestions = search(query, request, selected_engines)

    for result in results:
        result['pretty_url'] = _pretty_url(result['url'])

    output_format = request_data.get('format')
    if output_format == 'json':
        return Response(json.dumps({'query': query, 'results': results}),
                        mimetype='application/json')
    elif output_format == 'csv':
        csv = UnicodeWriter(cStringIO.StringIO())
        keys = ('title', 'url', 'content', 'host', 'engine', 'score')
        if results:
            csv.writerow(keys)
            for row in results:
                row['host'] = row['parsed_url'].netloc
                csv.writerow([row.get(key, '') for key in keys])
        csv.stream.seek(0)
        response = Response(csv.stream.read(), mimetype='application/csv')
        # Whitespace in the query is collapsed to underscores for the
        # suggested file name.
        response.headers.add(
            'Content-Disposition',
            'attachment;Filename=searx_-_{0}.csv'.format('_'.join(query.split())))
        return response

    return render('results.html',
                  results=results,
                  q=request_data['q'],
                  selected_categories=selected_categories,
                  number_of_results=len(results),
                  suggestions=suggestions)


@app.route('/about', methods=['GET'])
def about():
    '''Render the about page, passing the (name, value) pairs of `categories`.'''
    return render('about.html', categs=categories.items())


@app.route('/preferences', methods=['GET', 'POST'])
def preferences():
    '''Show the preferences page or store the chosen categories.

    On POST, the known categories among the ``category_*`` fields are written
    to the ``categories`` cookie as a comma separated list and the client is
    redirected to ``/``.  On GET, or when the POST selects no known category,
    the preferences page is rendered.
    '''
    if request.method == 'POST':
        selected_categories = _categories_from_fields(request.form.keys())
        if selected_categories:
            resp = make_response(redirect('/'))
            resp.set_cookie('categories', ','.join(selected_categories))
            return resp
    return render('preferences.html')


@app.route('/stats', methods=['GET'])
def stats():
    '''Render the stats page with the value of get_engines_stats().'''
    stats = get_engines_stats()
    return render('stats.html', stats=stats)


@app.route('/robots.txt', methods=['GET'])
def robots():
    '''Serve robots.txt: allow ``/`` and ``/about``, disallow ``/stats``.'''
    return Response("""User-agent: *
Allow: /
Allow: /about
Disallow: /stats
""", mimetype='text/plain')


@app.route('/opensearch.xml', methods=['GET'])
def opensearch():
    '''Serve the OpenSearch description built from `opensearch_xml`.

    The search URL is ``settings.base_url`` when set, otherwise the external
    URL of the index route using the scheme of the current request.  The
    method is ``post`` except for WebKit based user agents, which get ``get``.
    '''
    method = 'post'
    scheme = 'http'
    # chrome/chromium only supports HTTP GET....
    if request.headers.get('User-Agent', '').lower().find('webkit') >= 0:
        method = 'get'
    if request.is_secure:
        scheme = 'https'
    if settings.base_url:
        hostname = settings.base_url
    else:
        hostname = url_for('index', _external=True, _scheme=scheme)
    ret = opensearch_xml.format(method=method, host=hostname)
    resp = Response(response=ret, status=200, mimetype="application/xml")
    return resp


@app.route('/favicon.ico')
def favicon():
    '''Serve ``static/img/favicon.png`` under the icon MIME type.'''
    return send_from_directory(os.path.join(app.root_path, 'static/img'),
                               'favicon.png',
                               mimetype='image/vnd.microsoft.icon')


if __name__ == "__main__":
    # Patch the standard library with gevent before the server starts.
    from gevent import monkey
    monkey.patch_all()

    app.run(debug=settings.debug,
            use_debugger=settings.debug,
            port=settings.port)