1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
|
# Copyright (C) 2008-2012 by the Free Software Foundation, Inc.
#
# This file is part of GNU Mailman.
#
# GNU Mailman is free software: you can redistribute it and/or modify it under
# the terms of the GNU General Public License as published by the Free
# Software Foundation, either version 3 of the License, or (at your option)
# any later version.
#
# GNU Mailman is distributed in the hope that it will be useful, but WITHOUT
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
# more details.
#
# You should have received a copy of the GNU General Public License along with
# GNU Mailman. If not, see <http://www.gnu.org/licenses/>.
#
# Authors: Toshio Kuratomi <toshio@fedoraproject.org>
# Authors: Pierre-Yves Chibon <pingou@fedoraproject.org>
#
"""Integration with HyperKitty Archiver."""
from __future__ import absolute_import, unicode_literals
__metaclass__ = type
__all__ = [
'HyperKitty',
]
from base64 import b32encode
import hashlib
import pymongo
import datetime
import email.Utils
from urllib import quote
from urlparse import urljoin
from zope.interface import implements
from mailman.config import config
from mailman.interfaces.archiver import IArchiver
from mailman.interfaces.mailinglist import IMailingList
def convert_date(date_string):
    """Convert an RFC 2822 style date string to a naive datetime object.

    The string is parsed with `email.utils.parsedate`, which ignores the
    timezone offset; the returned datetime therefore carries the wall-clock
    fields of the header as written, round-tripped through local time.

    :param date_string: The value of a `Date` header.
    :return: A `datetime.datetime` instance.
    :raises ValueError: if the string cannot be parsed as a date.
    """
    # Imported locally so this function does not depend on a module-level
    # `import time`, which the file does not have.
    import time
    from email.utils import parsedate

    date_string = date_string.strip()
    time_tuple = parsedate(date_string)
    if time_tuple is None:
        # parsedate() signals an unparseable date by returning None; fail
        # with a clear message instead of a TypeError inside mktime().
        raise ValueError('Unparseable date header: %r' % (date_string,))
    # Convert the time tuple to a datetime via seconds since the epoch.
    epoch_seconds = time.mktime(time_tuple)
    return datetime.datetime.fromtimestamp(epoch_seconds)
class HyperKitty(object):
    """An archiver for Mailman implementing tagging, rating, and a forum-ish
    interface.

    Mailman proposes a draft specification for interoperability between list
    servers and archivers: <http://wiki.list.org/display/DEV/Stable+URLs>.
    """

    implements(IArchiver)

    name = 'hyperkitty'

    @staticmethod
    def list_url(mlist):
        """See `IArchiver`.

        :param mlist: The mailing list whose archive URL is wanted.
        :return: The archive URL of the list, or None when the list's
            archive is private.
        """
        if mlist.archive_private:
            return None
        base_url = config.archiver.hyperkitty.base_url
        if not base_url:
            # Pick a default
            base_url = mlist.domain.base_url
        # TODO: I see that some lists use mlist.posting_address -- is there a
        # difference with fqdn_listname?
        return urljoin(base_url, quote(mlist.fqdn_listname))

    @staticmethod
    def stable_url_id(msg):
        """Compute the stable id hash of a message from its Message-ID.

        The hash is the base32 encoding of the SHA-1 digest of the
        Message-ID.  As a side effect, any existing `X-Message-ID-Hash`
        header on `msg` is replaced with the computed value.

        :param msg: The message to hash.
        :return: The base32-encoded hash, or None when the message has no
            Message-ID header.
        """
        # Should this be a method or attribute on mailman.email.message
        # instead?
        message_id = msg.get('message-id')
        # It is not the archiver's job to ensure the message has a
        # Message-ID.  If this header is missing, there is no permalink.
        if message_id is None:
            return None
        # The angle brackets are not part of the Message-ID.  See RFC 2822.
        if message_id.startswith('<') and message_id.endswith('>'):
            message_id = message_id[1:-1]
        else:
            message_id = message_id.strip()
        # hashlib works on bytes; encode text explicitly so that a
        # non-ASCII Message-ID does not fail on an implicit ASCII encode.
        if not isinstance(message_id, bytes):
            message_id = message_id.encode('utf-8')
        digest = hashlib.sha1(message_id).digest()
        message_id_hash = b32encode(digest)
        del msg['x-message-id-hash']
        msg['X-Message-ID-Hash'] = message_id_hash
        return message_id_hash

    @classmethod
    def permalink(cls, mlist, message):
        """See `IArchiver`.

        :param mlist: The mailing list the message was posted to.
        :param message: The message to link to.
        :return: The URL of the message in the archive, or None when the
            list has no public archive URL or the message has no
            Message-ID.
        """
        base_url = cls.list_url(mlist)
        message_id_hash = cls.stable_url_id(message)
        if not base_url or not message_id_hash:
            return None
        return urljoin(base_url, 'messages/%s/%s' % (mlist.fqdn_listname,
                                                     message_id_hash))

    @classmethod
    def archive_message(cls, mlist, message):
        """See `IArchiver`.

        Store the headers and payload of `message` in the `mails`
        collection of the MongoDB database named after the list.

        :param mlist: The mailing list the message was posted to.
        :param message: The message to archive.
        :return: The permalink of the archived message (may be None, see
            `permalink`).
        :raises Exception: if the message has no headers at all, or if a
            message with the same MessageID is already stored.
        :raises KeyError: if no `MessageID` or `Date` key could be derived
            from the message headers.
        """
        # Side effect: stable_id_hash is saved in msg['X-Message-ID-Hash']
        # -- used by HyperKitty archiver
        cls.stable_url_id(message)
        # NOTE(review): a new connection is opened for every message and is
        # never explicitly closed here -- consider sharing or closing it.
        connection = pymongo.Connection('localhost', 27017)
        # TODO: We have to adjust the client for this, use the full list
        # name (with domain name) as table instead of just the list name
        db = connection[mlist.fqdn_listname]
        # Make sure the fields used for lookups are indexed.
        for field in ('MessageID', 'InReplyTo', 'ThreadID'):
            db.mails.ensure_index(field)
        # Dashes are dropped from the header names to avoid problems when
        # the stored keys are used in a template.
        # NOTE(review): header names keep their original case, so a header
        # spelled 'Message-Id' yields 'MessageId', not 'MessageID' --
        # confirm this is acceptable for the stored schema.
        infos = {}
        for header in message.keys():
            infos[header.replace('-', '')] = message[header]
        # There seems to be a problem parsing some messages.
        # Will we still need this ?
        if not infos:
            raise Exception('Message could not be parsed correctly')
        # TODO: Should we replace Message-ID by X-Message-ID-Hash ?
        message_id = infos['MessageID']
        if db.mails.find({'MessageID': message_id}).count() != 0:
            raise Exception(
                'MessageID %s already exists in the database' % message_id)
        # Do we need this conversion or has the module already done that?
        infos['Date'] = convert_date(infos['Date'])
        infos['Content'] = message.get_payload()
        # A message starts its own thread unless the first id listed in
        # References belongs to a stored message that has a thread.
        thread_id = message_id
        # References holds whitespace-separated ids; take the first token
        # so several ids on the first line still match a stored MessageID.
        references = infos.get('References', '').split()
        if references:
            parent = db.mails.find_one({'MessageID': references[0]})
            if parent and 'ThreadID' in parent:
                thread_id = parent['ThreadID']
        infos['ThreadID'] = thread_id
        # Categorise on the subject; a missing Subject counts as empty.
        subject = infos.get('Subject', '').lower()
        if 'agenda' in subject or 'reminder' in subject:
            infos['Category'] = 'Agenda'
        else:
            infos['Category'] = 'Question'
        db.mails.insert(infos)
        # TODO: Should we save the message on the hard-disk as well?
        return cls.permalink(mlist, message)
|