summaryrefslogtreecommitdiff
path: root/service/pixelated/adapter/search/contacts.py
blob: 733489b0edf0be9e0a1b3e30e89c51e1083dafd2 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#
# Copyright (c) 2014 ThoughtWorks, Inc.
#
# Pixelated is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# Pixelated is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with Pixelated. If not, see <http://www.gnu.org/licenses/>.
from email.utils import parseaddr
from pixelated.support.functional import flatten
from whoosh.qparser import QueryParser
from whoosh import sorting
from whoosh.query import Term


def address_duplication_filter(contacts):
    """Collapse contacts that share a mail address into one entry each.

    Contacts are grouped by the address returned from
    ``extract_mail_address``. For every address the longest contact string
    is kept; on a tie in length the contact seen first wins.

    :param contacts: iterable of contact strings
    :return: a list holding one contact string per distinct mail address
    """
    contacts_by_mail = dict()

    for contact in contacts:
        mail_address = extract_mail_address(contact)
        current = contacts_by_mail.get(mail_address, '')
        # Strict comparison: an equally long later contact does not replace
        # the one already stored.
        current = contact if len(contact) > len(current) else current
        contacts_by_mail[mail_address] = current

    # Materialise the values so callers always receive a real list; on
    # Python 3 ``dict.values()`` is only a view object.
    return list(contacts_by_mail.values())


def extract_mail_address(text):
    """Return the address part of ``text`` as parsed by ``parseaddr``.

    ``parseaddr`` yields a ``(realname, address)`` pair; only the address
    is handed back to the caller.
    """
    _realname, mail_address = parseaddr(text)
    return mail_address


def contacts_suggestions(query, searcher):
    """Return de-duplicated contact suggestions for ``query``.

    A falsy query (empty string, ``None``) yields an empty list without
    touching the searcher. Otherwise the addresses found by
    ``search_addresses`` are passed through ``address_duplication_filter``.
    """
    if not query:
        return []

    found_addresses = search_addresses(searcher, query)
    return address_duplication_filter(found_addresses)


def search_addresses(searcher, query):
    """Collect the terms matched by ``query`` in the address fields.

    One search is run for each of the ``to``, ``cc``, ``bcc`` and ``sender``
    fields. The query text is wrapped in wildcards, once title-cased and
    once as given, and the two forms are OR-ed together. A query matching
    the ``drafts`` or ``trash`` tag is passed as the search ``mask``.

    :param searcher: searcher object providing ``schema`` and ``search``
    :param query: text to look for
    :return: list with the second element of every matched term, taken
        from the flattened per-field results
    """
    drafts_or_trash = Term("tag", "drafts") | Term("tag", "trash")

    def matched_terms_in(field):
        # Each field gets its own parser so the query targets that field.
        parser = QueryParser(field, searcher.schema)
        parsed_query = parser.parse("*%s* OR *%s*" % (query.title(), query))
        facet = sorting.FieldFacet(field, allow_overlap=True)
        hits = searcher.search(
            parsed_query,
            limit=None,
            mask=drafts_or_trash,
            groupedby=facet,
            terms=True)
        return hits.matched_terms()

    terms_per_field = [
        matched_terms_in(field) for field in ('to', 'cc', 'bcc', 'sender')
    ]
    return [term[1] for term in flatten(terms_per_field)]