瀏覽代碼

Merge branch 'master' into flask_perimeter

Adam Tauber 8 年之前
父節點
當前提交
627962ce40

+ 32
- 0
manage.sh 查看文件

@@ -14,6 +14,36 @@ update_dev_packages() {
14 14
     pip install --upgrade -r "$BASE_DIR/requirements-dev.txt"
15 15
 }
16 16
 
17
+check_geckodriver() {
18
+    echo '[!] Checking geckodriver'
19
+    set -e
20
+    geckodriver -V 2>1 > /dev/null || NOTFOUND=1
21
+    set +e
22
+    if [ -z $NOTFOUND ]; then
23
+	return
24
+    fi
25
+    GECKODRIVER_VERSION="v0.11.1"
26
+    PLATFORM=`python -c "import platform; print platform.system().lower(), platform.architecture()[0]"`
27
+    case $PLATFORM in
28
+	"linux 32bit" | "linux2 32bit") ARCH="linux32";;
29
+	"linux 64bit" | "linux2 64bit") ARCH="linux64";;
30
+	"windows 32 bit") ARCH="win32";;
31
+	"windows 64 bit") ARCH="win64";;
32
+	"mac 64bit") ARCH="macos";;
33
+    esac
34
+    GECKODRIVER_URL="https://github.com/mozilla/geckodriver/releases/download/$GECKODRIVER_VERSION/geckodriver-$GECKODRIVER_VERSION-$ARCH.tar.gz";
35
+    if [ -z "$VIRTUAL_ENV" ]; then
36
+	echo "geckodriver can't be installed because VIRTUAL_ENV is not set, you should download it from\n  $GECKODRIVER_URL"
37
+	exit
38
+    else
39
+	echo "Installing $VIRTUAL_ENV from\n  $GECKODRIVER_URL"
40
+	FILE=`mktemp`
41
+	wget "$GECKODRIVER_URL" -qO $FILE && tar xz -C $VIRTUAL_ENV/bin/ -f $FILE geckodriver
42
+	rm $FILE
43
+	chmod 777 $VIRTUAL_ENV/bin/geckodriver
44
+    fi
45
+}
46
+
17 47
 pep8_check() {
18 48
     echo '[!] Running pep8 check'
19 49
     # ignored rules:
@@ -43,6 +73,7 @@ tests() {
43 73
     set -e
44 74
     pep8_check
45 75
     unit_tests
76
+    check_geckodriver
46 77
     robot_tests
47 78
     set +e
48 79
 }
@@ -88,6 +119,7 @@ Commands
88 119
     unit_tests           - Run unit tests
89 120
     update_dev_packages  - Check & update development and production dependency changes
90 121
     update_packages      - Check & update dependency changes
122
+    check_geckodriver    - Check & download geckodriver (required for robot_tests)
91 123
 "
92 124
 }
93 125
 

+ 5
- 5
requirements.txt 查看文件

@@ -1,12 +1,12 @@
1 1
 certifi==2016.9.26
2
-flask==0.11.1
2
+flask==0.12
3 3
 flask-babel==0.11.1
4
-lxml==3.6.0
5
-ndg-httpsclient==0.4.1
4
+lxml==3.7.1
5
+ndg-httpsclient==0.4.2
6 6
 pyasn1==0.1.9
7 7
 pyasn1-modules==0.0.8
8 8
 pygments==2.1.3
9
-pyopenssl==0.15.1
9
+pyopenssl==16.2.0
10 10
 python-dateutil==2.5.3
11 11
 pyyaml==3.11
12
-requests[socks]==2.10.0
12
+requests[socks]==2.12.4

+ 5
- 5
searx/autocomplete.py 查看文件

@@ -81,22 +81,22 @@ def searx_bang(full_query):
81 81
             engine_query = full_query.getSearchQuery()[1:]
82 82
 
83 83
             for lc in language_codes:
84
-                lang_id, lang_name, country, english_name = map(str.lower, lc)
84
+                lang_id, lang_name, country, english_name = map(unicode.lower, lc)
85 85
 
86 86
                 # check if query starts with language-id
87 87
                 if lang_id.startswith(engine_query):
88 88
                     if len(engine_query) <= 2:
89
-                        results.append(':{lang_id}'.format(lang_id=lang_id.split('-')[0]))
89
+                        results.append(u':{lang_id}'.format(lang_id=lang_id.split('-')[0]))
90 90
                     else:
91
-                        results.append(':{lang_id}'.format(lang_id=lang_id))
91
+                        results.append(u':{lang_id}'.format(lang_id=lang_id))
92 92
 
93 93
                 # check if query starts with language name
94 94
                 if lang_name.startswith(engine_query) or english_name.startswith(engine_query):
95
-                    results.append(':{lang_name}'.format(lang_name=lang_name))
95
+                    results.append(u':{lang_name}'.format(lang_name=lang_name))
96 96
 
97 97
                 # check if query starts with country
98 98
                 if country.startswith(engine_query.replace('_', ' ')):
99
-                    results.append(':{country}'.format(country=country.replace(' ', '_')))
99
+                    results.append(u':{country}'.format(country=country.replace(' ', '_')))
100 100
 
101 101
     # remove duplicates
102 102
     result_set = set(results)

+ 3
- 1
searx/engines/xpath.py 查看文件

@@ -42,7 +42,9 @@ def extract_text(xpath_results):
42 42
         return ''.join(xpath_results)
43 43
     else:
44 44
         # it's a element
45
-        return html_to_text(xpath_results.text_content()).strip()
45
+        text = html.tostring(xpath_results, encoding='unicode', method='text', with_tail=False)
46
+        text = text.strip().replace('\n', ' ')
47
+        return ' '.join(text.split())
46 48
 
47 49
 
48 50
 def extract_url(xpath_results, search_url):

+ 0
- 4
searx/static/plugins/js/infinite_scroll.js 查看文件

@@ -4,13 +4,9 @@ $(document).ready(function() {
4 4
         if ($(document).height() - win.height() == win.scrollTop()) {
5 5
             var formData = $('#pagination form:last').serialize();
6 6
             if (formData) {
7
-                var pageno = $('#pagination input[name=pageno]:last').attr('value');
8 7
                 $('#pagination').html('<div class="loading-spinner"></div>');
9 8
                 $.post('./', formData, function (data) {
10
-                    var lastImageHref = $('.result-images:last a').attr('href');
11 9
                     var body = $(data);
12
-                    $('a[href^="#open-modal"]:last').attr('href', '#open-modal-1-' + pageno);
13
-                    body.find('.modal-image a:first').attr('href', lastImageHref);
14 10
                     $('#pagination').remove();
15 11
                     $('#main_results').append('<hr/>');
16 12
                     $('#main_results').append(body.find('.result'));

+ 1
- 1
searx/static/themes/oscar/css/logicodev.min.css
文件差異過大導致無法顯示
查看文件


+ 1
- 1
searx/static/themes/oscar/css/pointhi.min.css
文件差異過大導致無法顯示
查看文件


+ 0
- 77
searx/static/themes/oscar/less/logicodev/modal-pic.less 查看文件

@@ -1,77 +0,0 @@
1
-.modal-image {
2
-    position: fixed;
3
-    top: 0;
4
-    right: 0;
5
-    bottom: 0;
6
-    left: 0;
7
-    background: rgba(0,0,0,0.8);
8
-    z-index: 1000000001;
9
-    opacity:0 !important;
10
-    pointer-events: none;
11
-
12
-    button {
13
-        display: none;
14
-    }
15
-
16
-    &:target {
17
-        opacity: 1 !important;
18
-        pointer-events: auto;
19
-    }
20
-
21
-    & > div {
22
-        margin: 2% auto;
23
-        width: 97%;
24
-        background: @dim-gray;
25
-        border: @gray 0.1rem solid;
26
-    }
27
-
28
-    @media (min-width: 769px) {
29
-        & > div {
30
-            max-width: 60.0rem;
31
-        }
32
-    }
33
-
34
-    .image-paging-left {
35
-        margin-right: 1.0rem;
36
-        margin-top: 0.5rem;
37
-        width:15px;
38
-        height:15px;
39
-        background: url(data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAA8AAAAPCAYAAAA71pVKAAAABmJLR0QA/wD/AP+gvaeTAAAACXBI
40
-WXMAAAsTAAALEwEAmpwYAAAAB3RJTUUH4AweDQoOuikqUQAAAB1pVFh0Q29tbWVudAAAAAAAQ3Jl
41
-YXRlZCB3aXRoIEdJTVBkLmUHAAAAiElEQVQoz6XTrQ0CQRCG4SesQHI5g6EAqIEewNLSVUACzfAT
42
-BApDDSgSBAaJORKyauf2czOZdybzl5SpxR5j3H/OUQHYoMMMNwE1fcUT5hFwUgPuenAxBDxHwRZb
43
-HKMgbPDCuiQ4ZfYDU6xwxTNafXDP1dOu3nP1heUJDnmCVAB/cMES7/+v+gIq0Bs3k6NL9AAAAABJ
44
-RU5ErkJggg==) 96% no-repeat;
45
-    }
46
-
47
-    .image-paging-right {
48
-        margin-left: 1.2rem;
49
-        margin-top: 0.5rem;
50
-        width:15px;
51
-        height:15px;
52
-        background: url(data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAA8AAAAPCAYAAAA71pVKAAAABmJLR0QA/wD/AP+gvaeTAAAACXBI
53
-        WXMAAAsTAAALEwEAmpwYAAAAB3RJTUUH4AweDQon+JuyPQAAAB1pVFh0Q29tbWVudAAAAAAAQ3Jl
54
-        YXRlZCB3aXRoIEdJTVBkLmUHAAAAaklEQVQoz73TsQ2DUAxF0SMWAFEzwGcaWhgpEyAlbQYJMACj
55
-        sAINTaiIf8Tt3FzL9jPfDHijdoHiVK9o8EAlQMKM1z8EZUTQHoJnjmDJFUwYr17hTIcN/W2dwzOH
56
-        tx2+czhhCZ9oNH/6qh1F2RaYgWxrQwAAAABJRU5ErkJggg==);
57
-
58
-    }
59
-
60
-    .image-container::before {
61
-        display: block;
62
-        min-width: 1.0rem;
63
-        max-width: 60.0rem;
64
-        min-height: 10.0rem;
65
-        height: 30.0rem;
66
-        content: "";
67
-    }
68
-}
69
-
70
-.modal-close {
71
-    position:fixed;
72
-    top: 0;
73
-    left: 0;
74
-    height: 100% !important;
75
-    width: 100% !important;
76
-    z-index: -1;
77
-}

+ 0
- 2
searx/static/themes/oscar/less/logicodev/oscar.less 查看文件

@@ -19,5 +19,3 @@
19 19
 @import "cursor.less";
20 20
 
21 21
 @import "code.less";
22
-
23
-@import "modal-pic.less";

+ 0
- 4
searx/static/themes/oscar/less/pointhi/oscar.less 查看文件

@@ -17,7 +17,3 @@
17 17
 @import "code.less";
18 18
 
19 19
 @import "navbar.less";
20
-
21
-@import "../logicodev/variables.less";
22
-
23
-@import "../logicodev/modal-pic.less";

+ 29
- 44
searx/templates/oscar/result_templates/images.html 查看文件

@@ -1,54 +1,39 @@
1
-<a href="#open-modal-{{ index }}-{{ pageno }}">
2
-    <img src="{% if result.thumbnail_src %}{{ image_proxify(result.thumbnail_src) }}{% else %}{{ image_proxify(result.img_src) }}{% endif %}" alt="{{ result.title|striptags }}" title="{{ result.title|striptags }}" class="img-thumbnail" id="img-result-thumb-{{ index }}" />
3
-</a>
1
+{% from 'oscar/macros.html' import draw_favicon %}
4 2
 
5
-<style type="text/css" media="screen">
6
-#open-modal-{{ index }}-{{ pageno }}:target .image-container::before {
7
-    background: url({{ image_proxify(result.img_src)|safe }}) no-repeat center/contain;
8
-}
9
-</style>
3
+<a href="{{ result.img_src }}" {% if results_on_new_tab %}target="_blank" rel="noopener noreferrer"{% else %}rel="noreferrer"{% endif %} data-toggle="modal" data-target="#modal-{{ index }}-{{pageno}}">
4
+    <img src="{% if result.thumbnail_src %}{{ image_proxify(result.thumbnail_src) }}{% else %}{{ image_proxify(result.img_src) }}{% endif %}" alt="{{ result.title|striptags }}" title="{{ result.title|striptags }}" class="img-thumbnail">
5
+</a>
10 6
 
11
-<div id="open-modal-{{ index }}-{{ pageno }}" class="modal-image">
12
-    <div class="container modal-dialog">
13
-        <div class="row">
14
-            <div class="col-md-12 col-sm-12 col-xs-12 modal-header">
15
-                <a {% if index != 1 %}href="#open-modal-{{ index-1 }}-{{ pageno }}"{% endif %}>
16
-                    <span class="pull-left image-paging-left"></span>
17
-                 </a>
18
-                <a href="#open-modal-{{ index+1 }}-{{ pageno }}">
19
-                    <span class="pull-right image-paging-right"></span>
20
-                </a>
21
-                <h4 class="modal-title image-title">{{ result.title|striptags }}</h4>
22
-            </div>
23
-        </div>
24
-        <div class="row">
25
-            <div class="col-md-12 col-sm-12 col-xs-12 modal-body">
26
-                <a href="{{ result.img_src }}" {% if results_on_new_tab %}target="_blank" rel="noopener noreferrer"{% else %}rel="noreferrer"{% endif %}><div class="image-container"></div></a>
7
+<div class="modal fade" id="modal-{{ index }}-{{ pageno }}" tabindex="-1" role="dialog" aria-hidden="true">
8
+    <div class="modal-dialog">
9
+        <div class="modal-wrapper">
10
+            <div class="modal-header">
11
+                <button type="button" class="close" data-dismiss="modal"><span aria-hidden="true">&times;</span><span class="sr-only">Close</span></button>
12
+                <h4 class="modal-title">{% if result.engine~".png" in favicons %}{{ draw_favicon(result.engine) }} {% endif %}{{ result.title|striptags }}</h4>
27 13
             </div>
28
-        </div>
29
-        {% if result.content %}
30
-        <div class="row">
31
-            <div class="col-md-12 hidden-sm hidden-xs modal-body">
32
-                <p class="result-content">{{ result.content|safe }}</p>
14
+            <div class="modal-body">
15
+                <img class="img-responsive center-block" src="{% if result.thumbnail_src %}{{ image_proxify(result.thumbnail_src) }}{% else %}{{ image_proxify(result.img_src) }}{% endif %}" alt="{{ result.title|striptags }}">
33 16
                 {% if result.author %}<span class="photo-author">{{ result.author }}</span><br />{% endif %}
17
+                {% if result.content %}
18
+                    <p class="result-content">
19
+                        {{ result.content }}
20
+                    </p>
21
+                {% endif %}
34 22
             </div>
35
-        </div>
36
-        {% endif %}
37
-        <div class="modal-footer">
38
-            <div class="row">
39
-                <div class="col-md-10 col-xs-12">
40
-                    <p class="text-muted pull-left">{{ result.pretty_url }}</p>
23
+            <div class="modal-footer">
24
+                <div class="clearfix"></div>
25
+                <span class="label label-default pull-right">{{ result.engine }}</span>
26
+                <p class="text-muted pull-left">{{ result.pretty_url }}</p>
27
+                <div class="clearfix"></div>
28
+				<div class="row">
29
+                    <div class="col-md-6">
30
+                        <a href="{{ result.img_src }}" {% if results_on_new_tab %}target="_blank" rel="noopener noreferrer"{% else %}rel="noreferrer"{% endif %} class="btn btn-default">{{ _('Get image') }}</a>
31
+                    </div>
32
+                    <div class="col-md-6">
33
+                        <a href="{{ result.url }}" {% if results_on_new_tab %}target="_blank" rel="noopener noreferrer"{% else %}rel="noreferrer"{% endif %} class="btn btn-default">{{ _('View source') }}</a>
34
+                    </div>
41 35
                 </div>
42
-                <div class="col-md-2 hidden-sm hidden-xs">
43
-                    <span class="label label-default pull-right">{{ result.engine }}</span>
44
-                </div>
45
-            </div>
46
-            <div class="row">
47
-                <a href="{{ result.url }}" class="btn btn-default">
48
-                    {{ _('View source') }}
49
-                </a>
50 36
             </div>
51 37
         </div>
52 38
     </div>
53
-    <a href="#img-result-thumb-{{ index }}-{{ pageno }}" class="modal-close"></a>
54 39
 </div>

utils/standalone_search.py → utils/google_search.py 查看文件

@@ -13,10 +13,9 @@ request_params = default_request_params()
13 13
 # Possible params
14 14
 # request_params['headers']['User-Agent'] = ''
15 15
 # request_params['category'] = ''
16
-# request_params['started'] = ''
17
-
18 16
 request_params['pageno'] = 1
19 17
 request_params['language'] = 'en_us'
18
+request_params['time_range'] = ''
20 19
 
21 20
 params = google.request(argv[1], request_params)
22 21
 
@@ -32,5 +31,5 @@ else:
32 31
     request_args['data'] = request_params['data']
33 32
 
34 33
 resp = req(request_params['url'], **request_args)
35
-
34
+resp.search_params = request_params
36 35
 print(dumps(google.response(resp)))

+ 101
- 0
utils/standalone_searx.py 查看文件

@@ -0,0 +1,101 @@
1
+#!/usr/bin/env python
2
+
3
+'''
4
+searx is free software: you can redistribute it and/or modify
5
+it under the terms of the GNU Affero General Public License as published by
6
+the Free Software Foundation, either version 3 of the License, or
7
+(at your option) any later version.
8
+
9
+searx is distributed in the hope that it will be useful,
10
+but WITHOUT ANY WARRANTY; without even the implied warranty of
11
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12
+GNU Affero General Public License for more details.
13
+
14
+You should have received a copy of the GNU Affero General Public License
15
+along with searx. If not, see < http://www.gnu.org/licenses/ >.
16
+
17
+(C) 2016- by Alexandre Flament, <alex@al-f.net>
18
+'''
19
+
20
+# set path
21
+from sys import path
22
+from os.path import realpath, dirname
23
+path.append(realpath(dirname(realpath(__file__)) + '/../'))
24
+
25
+# initialization
26
+from json import dumps
27
+from searx import settings
28
+import searx.query
29
+import searx.search
30
+import searx.engines
31
+import searx.preferences
32
+import argparse
33
+
34
+searx.engines.initialize_engines(settings['engines'])
35
+
36
+# command line parsing
37
+parser = argparse.ArgumentParser(description='Standalone searx.')
38
+parser.add_argument('query', type=str,
39
+                    help='Text query')
40
+parser.add_argument('--category', type=str, nargs='?',
41
+                    choices=searx.engines.categories.keys(),
42
+                    default='general',
43
+                    help='Search category')
44
+parser.add_argument('--lang', type=str, nargs='?',default='all',
45
+                    help='Search language')
46
+parser.add_argument('--pageno', type=int, nargs='?', default=1,
47
+                    help='Page number starting from 1')
48
+parser.add_argument('--safesearch', type=str, nargs='?', choices=['0', '1', '2'], default='0',
49
+                    help='Safe content filter from none to strict')
50
+parser.add_argument('--timerange', type=str, nargs='?', choices=['day', 'week', 'month', 'year'],
51
+                    help='Filter by time range')
52
+args = parser.parse_args()
53
+
54
+# search results for the query
55
+form = {
56
+    "q":args.query,
57
+    "categories":args.category.decode('utf-8'),
58
+    "pageno":str(args.pageno),
59
+    "language":args.lang,
60
+    "time_range":args.timerange
61
+}
62
+preferences = searx.preferences.Preferences(['oscar'], searx.engines.categories.keys(), searx.engines.engines, [])
63
+preferences.key_value_settings['safesearch'].parse(args.safesearch)
64
+
65
+search_query = searx.search.get_search_query_from_webapp(preferences, form)
66
+search = searx.search.Search(search_query)
67
+result_container = search.search()
68
+
69
+# output
70
+from datetime import datetime
71
+
72
+def no_parsed_url(results):
73
+    for result in results:
74
+        del result['parsed_url']
75
+    return results
76
+
77
+def json_serial(obj):
78
+    """JSON serializer for objects not serializable by default json code"""
79
+    if isinstance(obj, datetime):
80
+        serial = obj.isoformat()
81
+        return serial
82
+    raise TypeError ("Type not serializable")
83
+
84
+result_container_json = {
85
+    "search": {
86
+        "q": search_query.query,
87
+        "pageno": search_query.pageno,
88
+        "lang": search_query.lang,
89
+        "safesearch": search_query.safesearch,
90
+        "timerange": search_query.time_range,
91
+        "engines": search_query.engines  
92
+    },
93
+    "results": no_parsed_url(result_container.get_ordered_results()),
94
+    "infoboxes": result_container.infoboxes,
95
+    "suggestions": list(result_container.suggestions),
96
+    "answers": list(result_container.answers),
97
+    "paging": result_container.paging,
98
+    "results_number": result_container.results_number()
99
+}
100
+
101
+print(dumps(result_container_json, sort_keys=True, indent=4, ensure_ascii=False, encoding="utf-8", default=json_serial))