summaryrefslogtreecommitdiff
path: root/service/pixelated/search_query.py
blob: 278e1f2f05409756458bee6c4a98c1caf455da15 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
#
# Copyright (c) 2014 ThoughtWorks, Inc.
#
# Pixelated is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# Pixelated is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with Pixelated. If not, see <http://www.gnu.org/licenses/>.
from scanner import StringScanner, StringRegexp
import re


def compile(query):
    """Compile a search query string into a dict of search criteria.

    Single and double quotes are stripped from the query, which is then
    scanned one whitespace-delimited token at a time:

    * a token containing ":" is passed to ``_compile_tag``, which files it
      under ``"tags"`` or ``"not_tags"``;
    * any other token is stored under ``"general"``, replacing whatever was
      stored there before, so the last such token wins.

    :param query: the raw query text; it is encoded to UTF-8 before scanning.
    :return: a dict with the list entries ``"tags"`` and ``"not_tags"``, plus
        a ``"general"`` entry when at least one token without ":" was found.
    """
    compiled = {"tags": [], "not_tags": []}
    # NOTE(review): applying a text pattern to the UTF-8 encoded query relies
    # on Python 2 string semantics -- confirm the target runtime.
    sanitized_query = re.sub(r"['\"]", "", query.encode('utf8'))
    scanner = StringScanner(sanitized_query)

    while not scanner.is_eos:
        token = scanner.scan(_next_token())

        if not token:
            # No token at the current position: step over the separator run.
            scanner.skip(_separators())
            continue

        if ":" in token:
            compiled = _compile_tag(compiled, token)
        else:
            # NOTE(review): every plain token overwrites "general"; confirm
            # that last-wins (rather than first-wins or joining) is intended.
            compiled["general"] = token

    return compiled


def _next_token():
    """Return the pattern for one token: a run of non-whitespace characters."""
    # Raw string so that ``\s`` reaches the regex engine without being an
    # invalid string escape; the resulting pattern text is unchanged.
    return StringRegexp(r'[^\s]+')


def _separators():
    """Return the pattern for a separator run: whitespace and/or "&"."""
    # Raw string so that ``\s`` reaches the regex engine without being an
    # invalid string escape; the resulting pattern text is unchanged.
    return StringRegexp(r'[\s&]+')


def _compile_tag(compiled, token):
    tag = token.split(":").pop()
    if token[0] == "-":
        compiled["not_tags"].append(tag)
    else:
        compiled["tags"].append(tag)
    return compiled