60
def _parse_message(message):
61
"""Get a date and dict of an RFC822 message."""
62
parsed = email.parser.Parser().parsestr(message)
65
for key in ('from', 'to', 'subject', 'message-id'):
66
value = parsed.get(key, None)
68
message_dict[key] = value
70
date = parsed.get('date')
73
pdate = parsedate_tz(date)
74
date = datetime.datetime(
76
tzinfo=dateutil.tz.tzoffset('', pdate[9]))
79
message_dict['date'] = date.isoformat() if date is not None else None
81
return date, message_dict
84
def _utc_datetime(dt):
    """Return ``dt`` expressed in the UTC time zone.

    :param dt: object whose ``astimezone`` method is called; presumably a
        timezone-aware ``datetime.datetime`` (confirm against callers).
    :return: whatever ``dt.astimezone`` returns for a dateutil UTC tzinfo.
    """
    utc_zone = dateutil.tz.tzutc()
    return dt.astimezone(utc_zone)
88
def _utc_timestamp(dt):
    """Return a numeric timestamp for ``dt`` after converting it to UTC.

    :param dt: value accepted by ``_utc_datetime``.
    :return: ``time.mktime`` of the UTC time tuple, minus ``time.timezone``.
    """
    utc_fields = _utc_datetime(dt).timetuple()
    # time.mktime reads the tuple as local time, so the local zone's
    # offset (time.timezone) is subtracted from the result afterwards.
    local_seconds = time.mktime(utc_fields)
    return local_seconds - time.timezone
92
def _utc_timeuuid(dt, lowest_val=True):
    """Convert ``dt`` to a UUID via its UTC timestamp.

    :param dt: value accepted by ``_utc_timestamp``.
    :param lowest_val: passed through unchanged as the second argument of
        ``convert_time_to_uuid``; presumably selects the lowest or highest
        UUID for that instant (confirm against that helper).
    :return: the result of ``convert_time_to_uuid``.
    """
    timestamp = _utc_timestamp(dt)
    return convert_time_to_uuid(timestamp, lowest_val)
96
def _cmp_timeuuid(a, b):
98
return cmp(a.time, b.time)
102
def _bound_timeuuid(a, b, max=False):
103
if a == '' or _cmp_timeuuid(b, a) == (1 if max else -1):
108
def _make_bounds(memo, range_start, range_finish, backward):
111
memo = uuid.UUID(memo)
116
if range_start is not None:
117
start = _bound_timeuuid(
118
start, _utc_timeuuid(range_start), max=True)
119
if range_finish is not None:
120
finish = _bound_timeuuid(
121
finish, _utc_timeuuid(range_finish, lowest_val=False))
122
return memo, start, finish
125
LEGAL_HEADERS = set([
126
'date', 'from', 'subject', 'message-id',
130
def _format_message(want, message):
133
data[key] = message.get(key)
137
def _format_all(headers):
    """Build the wanted-column list and formatter for ``headers``.

    :param headers: iterable of header names; every name must be a member
        of ``LEGAL_HEADERS``.
    :return: a ``(want, formatter)`` tuple. ``want`` is the list of
        requested headers followed by ``'content'``; ``formatter`` is
        ``_format_message`` with ``want`` bound as its first argument.
    :raises AssertionError: if any requested header is not in
        ``LEGAL_HEADERS``.
    """
    # Materialise once so a one-shot iterable is not exhausted by the
    # validation step before the column list is built.
    want = list(headers)
    illegal = set(want).difference(LEGAL_HEADERS)
    if illegal:
        # Raised explicitly (not via ``assert``) so the check still runs
        # when Python is started with -O.
        raise AssertionError(
            'Illegal headers: %r' % (sorted(illegal, key=repr),))
    want.append('content')
    return want, functools.partial(_format_message, want)
148
54
class CassandraConnection(object):
150
56
def __init__(self, keyspace, host):
163
69
def add_message(self, archive_uuid, message):
164
70
message_uuid = uuid.uuid4()
165
message_date, message_dict = _parse_message(message)
166
message_dict['content'] = message
167
message_dict['date_created'] = (
168
datetime.datetime.utcnow().isoformat() + 'Z')
169
self.messages.insert(message_uuid, message_dict)
71
parsed = email.parser.Parser().parsestr(message)
72
date = parsed.get('date')
75
pdate = parsedate_tz(date)
76
date = datetime.datetime(
78
tzinfo=dateutil.tz.tzoffset('', pdate[9]))
83
{'date_created': datetime.datetime.utcnow().isoformat() + 'Z',
85
'from': parsed.get('From'),
86
'to': parsed.get('To'),
87
'subject': parsed.get('Subject'),
88
'date': date.isoformat() if date is not None else None,
89
'message_id': parsed.get('Message-ID'),
170
91
self.archive_messages.insert(
172
{_utc_timestamp(message_date): message_uuid})
93
{date.astimezone(dateutil.tz.tzutc()): message_uuid})
174
'Imported %s into %s'
175
% (message_dict.get('message-id', None), archive_uuid))
95
'Imported %s into %s' % (parsed.get('Message-ID'), archive_uuid))
176
96
return message_uuid
178
def _trim(self, sequence, end):
179
"""Return the sequence with one of the ends trimmed.
181
:param end: if true, remove the last element. otherwise remove
189
def get_messages(self, archive_uuid, order, count, memo, backward=False,
190
start_date=None, finish_date=None, format='all',
191
headers=['from', 'date', 'subject', 'message-id']):
98
def _format_message(self, message):
100
'date': message['date'],
101
'from': message['from'],
102
'subject': message['subject'],
105
def get_messages(self, archive_uuid, order, count, start):
192
106
if order in ("date", "-date"):
193
107
reversed = order[0] == '-'
195
109
raise AssertionError("Unsupported order.")
197
memo, start, finish = _make_bounds(
198
memo, start_date, finish_date, backward)
200
# Get up to n+1 messages from the memo: the last item of the
201
# previous batch (because that's where the memo starts) + this
203
110
pairs = self.archive_messages.get(
204
archive_uuid, column_count=count + 1, column_start=start,
205
column_finish=finish, column_reversed=reversed).items()
207
if len(pairs) and memo and pairs[0][0] <= memo:
208
# The memo (from the previous batch) was included in the result.
210
pairs = self._trim(pairs, False ^ backward)
211
elif len(pairs) > count:
212
# There was no memo in the result, so the n+1th element is
213
# unnecessary. Kill it.
214
pairs = self._trim(pairs, True ^ backward)
217
return (None, [], None)
219
assert 0 < len(pairs) <= count
221
# We've narrowed down the message references. Fetch the messages.
111
archive_uuid, column_count=count + 1,
112
column_start=start, column_reversed=reversed).items()
222
113
ids = [v for k, v in pairs]
224
wanted_cols, func = FORMATS[format](headers)
226
# XXX: No need to get all columns. Restrict based on format.
227
messages = self.messages.multiget(ids)
114
messages = self.messages.multiget(
115
ids, columns=['date', 'from', 'subject'])
116
actual_count = len(pairs)
117
if len(pairs) > count:
118
assert len(pairs) == count + 1
120
next_memo = str(pairs[count][0])
231
[func(messages[id]) for id in ids],
124
[self._format_message(messages[id]) for id in ids[:actual_count]],