forked from polo2ro/imapbox
-
Notifications
You must be signed in to change notification settings - Fork 0
/
mailboxresource.py
147 lines (112 loc) · 5.01 KB
/
mailboxresource.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
#!/usr/bin/env python
#-*- coding:utf-8 -*-
from __future__ import print_function
import imaplib, email
import re
import os
import hashlib
from message import Message
import datetime
from utilities import errorHandler
class MailboxClient:
"""Operations on a mailbox"""
def __init__(self, host, port, username, password, remote_folder, ssl):
if not ssl:
self.mailbox = imaplib.IMAP4(host, port)
else:
self.mailbox = imaplib.IMAP4_SSL(host, port)
self.mailbox.login(username, password)
typ, data = self.mailbox.select(remote_folder, readonly=True)
if typ != 'OK':
# Handle case where Exchange/Outlook uses '.' path separator when
# reporting subfolders. Adjust to use '/' on remote.
adjust_remote_folder = re.sub(r'\.', '/', remote_folder)
typ, data = self.mailbox.select(adjust_remote_folder, readonly=True)
if typ != 'OK':
errorHandler(remote_folder, 'MailboxClient: Could not select remote folder', exitCode=None)
def copy_emails(self, days, local_folder, wkhtmltopdf):
n_saved = 0
n_exists = 0
self.local_folder = local_folder
self.wkhtmltopdf = wkhtmltopdf
criterion = 'ALL'
if days:
date = (datetime.date.today() - datetime.timedelta(days)).strftime("%d-%b-%Y")
criterion = '(SENTSINCE {date})'.format(date=date)
typ, data = self.mailbox.search(None, criterion)
for num in data[0].split():
typ, data = self.mailbox.fetch(num, '(RFC822)')
if self.saveEmail(data):
n_saved += 1
else:
n_exists += 1
return (n_saved, n_exists)
def cleanup(self):
self.mailbox.close()
self.mailbox.logout()
def getEmailFolder(self, msg, data):
# 255is the max filename length on all systems
if msg['Message-Id'] and len(msg['Message-Id']) < 255:
foldername = re.sub(r'[^a-zA-Z0-9_\-\.() ]+', '', msg['Message-Id'])
else:
foldername = hashlib.sha224(data).hexdigest()
year = 'None'
if msg['Date']:
match = re.search(r'\d{1,2}\s\w{3}\s(\d{4})', msg['Date'])
if match:
year = match.group(1)
return os.path.join(self.local_folder, year, foldername)
def saveEmail(self, data):
for response_part in data:
if isinstance(response_part, tuple):
msg = ""
# Handle Python version differences:
# Python 2 imaplib returns bytearray, Python 3 imaplib
# returns str.
if isinstance(response_part[1], str):
msg = email.message_from_string(response_part[1])
else:
try:
msg = email.message_from_string(response_part[1].decode("utf-8"))
except:
print("couldn't decode message with utf-8 - trying 'ISO-8859-1'")
msg = email.message_from_string(response_part[1].decode("ISO-8859-1"))
directory = self.getEmailFolder(msg, data[0][1])
if os.path.exists(directory):
return False
os.makedirs(directory)
try:
message = Message(directory, msg)
message.createRawFile(data[0][1])
message.createMetaFile()
message.extractAttachments()
if self.wkhtmltopdf:
message.createPdfFile(self.wkhtmltopdf)
except Exception as e:
# ex: Unsupported charset on decode
print(directory)
errorHandler(e, 'MailboxClient.saveEmail() failed', exitCode=None)
return True
def save_emails(account, options):
mailbox = MailboxClient(account['host'], account['port'], account['username'], account['password'], account['remote_folder'], account['ssl'])
stats = mailbox.copy_emails(options['days'], options['local_folder'], options['wkhtmltopdf'])
mailbox.cleanup()
print('{} emails created, {} emails already exists'.format(stats[0], stats[1]))
def get_folder_fist(account):
if not account['ssl']:
mailbox = imaplib.IMAP4(account['host'], account['port'])
else:
mailbox = imaplib.IMAP4_SSL(account['host'], account['port'])
mailbox.login(account['username'], account['password'])
folder_list = mailbox.list()[1]
mailbox.logout()
return folder_list
def get_folders(account):
folders = []
for folder_entry in get_folder_fist(account):
folders.append(folder_entry.decode().replace("/",".").split(' "." ')[1])
# Remove Gmail parent folder from array otherwise the script fails:
if '"[Gmail]"' in folders: folders.remove('"[Gmail]"')
# Remove Gmail "All Mail" folder which just duplicates emails:
if '"[Gmail].All Mail"' in folders: folders.remove('"[Gmail].All Mail"')
return folders