-
Notifications
You must be signed in to change notification settings - Fork 104
/
email_client.py
83 lines (60 loc) · 1.97 KB
/
email_client.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
#pip install beautifulsoup4
import email
import imaplib #imap pop
from bs4 import BeautifulSoup
import os
import mimetypes
# Download every message in the Gmail inbox over IMAP and write each
# non-multipart part to ./emails/<date>/<subject>/<filename>.


def _safe_path_component(value, fallback):
    """Return *value* as text that is usable as a single path component.

    Path separators and control characters (for example the line breaks of
    a folded header) are replaced with underscores so that a header or an
    attachment name cannot create extra directory levels or point outside
    the target directory.  *fallback* is returned when *value* is None or
    nothing usable is left after cleaning.
    """
    text = '' if value is None else str(value)
    cleaned = ''.join(
        '_' if ch in '/\\' or ord(ch) < 32 else ch for ch in text
    ).strip()
    if cleaned in ('', '.', '..'):
        return fallback
    return cleaned


def _default_filename(content_type, counter):
    """Build a file name for a message part that does not carry its own."""
    # 'html' has to be tested before 'text': "text/html" contains both, and
    # testing 'text' first made the '.html' branch unreachable for it.
    if 'html' in content_type:
        ext = '.html'
    elif 'text' in content_type:
        ext = '.txt'
    else:
        ext = mimetypes.guess_extension(content_type) or '.bin'
    return 'msg-part-%08d%s' % (counter, ext)


# NOTE(review): credentials are hard-coded in source. They are kept only as
# defaults so existing behaviour is unchanged; set EMAIL_USERNAME and
# EMAIL_PASSWORD in the environment and remove the literals.
username = os.environ.get('EMAIL_USERNAME', '[email protected]')
password = os.environ.get('EMAIL_PASSWORD', 'iamhungry2016day19')

mail = imaplib.IMAP4_SSL("imap.gmail.com") # https://www.google.com/settings/security/lesssecureapps
try:
    mail.login(username, password)
    mail.select("inbox")
    #Create new folder
    # mail.create("Item2")
    #list Folders
    #mail.list()
    result, data = mail.uid('search', None, "ALL")
    # An unsuccessful or empty search yields nothing to iterate over.
    if result == 'OK' and data and data[0]:
        inbox_item_list = data[0].split()
    else:
        inbox_item_list = []

    for item in inbox_item_list:
        result2, email_data = mail.uid('fetch', item, '(RFC822)')
        # Skip responses that do not carry a (header, body) tuple first;
        # indexing them with [0][1] would raise.
        if result2 != 'OK' or not email_data or not isinstance(email_data[0], tuple):
            continue
        # Parse the raw bytes directly: decoding the whole message as UTF-8
        # first fails on messages that contain other 8-bit encodings.
        raw_email = email_data[0][1]
        email_message = email.message_from_bytes(raw_email)
        to_ = email_message['To']
        from_ = email_message['From']
        subject_ = email_message['Subject']
        date_ = email_message['date']

        # Headers may be missing or contain separators, so clean them before
        # they become directory names.
        save_path = os.path.join(
            os.getcwd(),
            "emails",
            _safe_path_component(date_, 'unknown-date'),
            _safe_path_component(subject_, 'no-subject'),
        )

        counter = 1
        for part in email_message.walk():
            # Multipart containers only group other parts; nothing to save.
            if part.get_content_maintype() == "multipart":
                continue
            content_type = part.get_content_type()
            # The attachment name comes from the message, so it is cleaned
            # the same way as the headers; an empty result selects the
            # generated name.
            filename = _safe_path_component(part.get_filename(), '')
            if not filename:
                filename = _default_filename(content_type, counter)
            counter += 1

            payload = part.get_payload(decode=True)
            if payload is None:
                # No decodable body for this part; writing None would raise.
                continue

            #save file
            os.makedirs(save_path, exist_ok=True)
            with open(os.path.join(save_path, filename), 'wb') as fp:
                fp.write(payload)
finally:
    # Always end the IMAP session, even when a fetch or a write fails.
    mail.logout()
# if "plain" in content_type:
# #print(part.get_payload())
# pass
# elif "html" in content_type:
# html_ = part.get_payload()
# soup = BeautifulSoup(html_, "html.parser")
# text = soup.get_text()
# print(subject_)
# print(text)
# else:
# pass
# #print(content_type)
# #email_message.get_payload()