# cgit page residue (navigation: summary | refs | log | tree | commit | diff)
# path: root/service/pixelated/adapter/search/contacts.py
# blob: 0dfeb15ba60995565ded18ebf6a1ec4e7ad7fe31 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
#
# Copyright (c) 2014 ThoughtWorks, Inc.
#
# Pixelated is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# Pixelated is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with Pixelated. If not, see <http://www.gnu.org/licenses/>.
from email.utils import parseaddr
from pixelated.support.functional import flatten
from whoosh.qparser import QueryParser
from whoosh import sorting
from whoosh.query import Term


def address_duplication_filter(contacts):
    """Collapse contacts that share a mail address into a single entry.

    Each contact string is keyed by the address returned from
    ``extract_mail_address``. When several contacts map to the same
    address, the longest string is kept; on equal length the one seen
    first wins.

    :param contacts: iterable of contact strings.
    :return: the values of the address -> contact mapping.
    """
    longest_by_address = {}

    for entry in contacts:
        address = extract_mail_address(entry)
        known = longest_by_address.get(address, '')
        # Strictly longer replaces; ties keep what is already stored.
        if len(entry) > len(known):
            longest_by_address[address] = entry
        else:
            longest_by_address[address] = known
    return longest_by_address.values()


def bounced_addresses_filter(searcher, contacts):
    """Remove contacts that show up in the index's ``bounced`` field.

    Searches the ``bounced`` field with a ``*`` wildcard, groups the hits
    by that same field and subtracts the flattened grouping from the
    given contacts.

    :param searcher: object exposing ``schema`` and ``search`` (a whoosh
        searcher, judging by the imports).
    :param contacts: iterable of hashable contact values.
    :return: a ``set`` of the contacts not found among the bounced ones.
    """
    any_bounced = QueryParser('bounced', searcher.schema).parse('*')
    by_bounced_value = sorting.FieldFacet('bounced', allow_overlap=True)
    hits = searcher.search(any_bounced, limit=None, groupedby=by_bounced_value)
    grouped = hits.groups()

    candidates = set(contacts)
    # NOTE(review): flatten() over a one-element list presumably yields the
    # group keys (the bounced addresses) -- confirm against flatten().
    bounced = set(flatten([grouped]))
    return candidates - bounced


def extract_mail_address(text):
    """Return the address component of ``text`` as parsed by ``parseaddr``.

    :param text: an address string such as ``'Name <user@host>'``.
    :return: the second element of the ``parseaddr`` result.
    """
    _display_name, address = parseaddr(text)
    return address


def contacts_suggestions(query, searcher):
    """Build the contact suggestions for ``query``.

    A falsy query yields an empty list without touching the searcher.
    Otherwise the matching addresses are looked up, bounced addresses are
    filtered out and duplicates of the same mail address are collapsed.

    :param query: text to look for in the address fields.
    :param searcher: searcher handed on to the lookup and bounce filter.
    :return: ``[]`` for a falsy query, else the de-duplicated contacts.
    """
    if not query:
        return []

    matches = search_addresses(searcher, query)
    not_bounced = bounced_addresses_filter(searcher, matches)
    return address_duplication_filter(not_bounced)


def search_addresses(searcher, query):
    """Look up ``query`` as a substring in the address fields of the index.

    The ``to``, ``cc``, ``bcc`` and ``sender`` fields are searched one after
    another with the pattern ``*<query>*``. Every search is grouped by the
    field being searched, and the per-field groupings are flattened into
    one result.

    :param searcher: object exposing ``schema`` and ``search`` (a whoosh
        searcher, judging by the imports).
    :param query: text interpolated between two ``*`` wildcards.
    :return: whatever ``flatten`` produces from the four groupings.
    """
    # Handed to search() as ``mask``; per the whoosh docs, documents matching
    # the mask (here: tagged drafts or trash) are left out of the results.
    drafts_or_trash = Term("tag", "drafts") | Term("tag", "trash")

    def grouped_hits(field):
        parsed = QueryParser(field, searcher.schema).parse("*%s*" % query)
        by_field_value = sorting.FieldFacet(field, allow_overlap=True)
        hits = searcher.search(parsed,
                               limit=None,
                               mask=drafts_or_trash,
                               groupedby=by_field_value)
        return hits.groups()

    return flatten([grouped_hits(field) for field in ('to', 'cc', 'bcc', 'sender')])