Python-imaplib-fetch-body-emails-gmail
我写了这个脚本,用来获取某个邮箱中由特定发件人发送、主题以“$”开头的电子邮件的正文。Python-imaplib-fetch-body-emails-gmail,python,email,request,imap,imaplib,Python,Email,Request,Imap,Imaplib。我写了这个脚本,用来获取某个邮箱中由特定发件人发送、主题以“$”开头的电子邮件的正文: import email, getpass, imaplib, os detach_dir = "F:\PYTHONPROJECTS" # where you will save attachments user = raw_input("Enter your GMail username --> ") pwd = getpass.getpass("Enter your password -->
import email, getpass, imaplib, os
detach_dir = "F:\PYTHONPROJECTS" # where you will save attachments
user = raw_input("Enter your GMail username --> ")
pwd = getpass.getpass("Enter your password --> ")
# connect to the gmail imap server
m = imaplib.IMAP4_SSL("imap.gmail.com")
m.login(user, pwd)
m.select("PETROLEUM") # here you a can choose a mail box like INBOX instead
# use m.list() to get all the mailboxes
resp, items = m.search(None, '(FROM "EIA_eLists@eia.gov")')
items = items[0].split() # getting the mails id
my_msg = [] # store relevant msgs here in please
msg_cnt = 0
break_ = False
for emailid in items[::-1]:
resp, data = m.fetch(emailid, "(RFC822)")
if ( break_ ):
break
for response_part in data:
if isinstance(response_part, tuple):
msg = email.message_from_string(response_part[1])
varSubject = msg['subject']
if varSubject[0] == '$':
msg_cnt += 1
my_msg.append(msg)
print msg_cnt
print email.message_from_string(response_part[1])
if ( msg_cnt == 5 ):
break_ = True
如果我打印 email.message_from_string(response_part[1]),
我可以看到它包含头部信息(主题、发件人、收件人、日期……)以及完整的正文。但是,我无法单独取出正文本身。email.message_from_string(response_part[0]) 打印的是邮件 ID,而 email.message_from_string(response_part[2])
超出了范围;email.message_from_string(response_part[1][0]) 也同样不行。
谢谢和问候
更新
现在,我几乎可以取得正文了。不过,正文开头仍然多出一行信息。我得到的结果是:
From nobody Tue Dec 25 11:42:58 2012
US=3D$4.030
EastCst=3D$4.036
NewEng=3D$4.205
CenAtl=3D$4.149
LwrAtl=3D$3.921
Midwst=3D$3.984
GulfCst=3D$3.945
RkyMt=3D$4.195
WCst=3D$4.187
CA=3D$4.268
我想去掉 “From nobody Tue Dec 25 11:42:58 2012” 这一行。我知道可以解析文本、查找第一行相关内容……
实现这一点的代码(插入到我的第一个示例中)是
你有更好的方法(不带这行信息字符串)吗?另外:现在获取日期的命令是什么?我知道可以在上面合适的位置写
varDate=msg['date']
,但是如何只获取日、月、年?谢谢。
您可以通过执行以下任一操作来获取正文内容:
msg.as_string()
str(msg)
repr(msg)
我使用Gmail成功地实现了这一点,它提取有用的信息并将其输出到文本文件:
import datetime
import email
import imaplib
import mailbox
# Save every unread Gmail message (decoded headers plus plain-text body) to
# email_<n>.txt in the current working directory.
EMAIL_ACCOUNT = "your@gmail.com"
PASSWORD = "your password"


def _header_text(raw_value):
    """Return a MIME-decoded header as text, or "" when the header is absent."""
    if raw_value is None:
        return ""
    return str(email.header.make_header(email.header.decode_header(raw_value)))


# The context manager logs out of the server even if processing fails.
with imaplib.IMAP4_SSL('imap.gmail.com') as mail:
    mail.login(EMAIL_ACCOUNT, PASSWORD)
    mail.list()
    mail.select('inbox')
    result, data = mail.uid('search', None, "UNSEEN")  # (ALL/UNSEEN)

    # Split the UID list once instead of re-splitting it on every iteration.
    for x, latest_email_uid in enumerate(data[0].split()):
        result, email_data = mail.uid('fetch', latest_email_uid, '(RFC822)')
        # result, email_data = conn.store(num,'-FLAGS','\\Seen')
        # this might work to set flag to seen, if it doesn't already
        if not email_data or not isinstance(email_data[0], tuple):
            # Nothing usable came back for this UID; skip it.
            continue
        raw_email = email_data[0][1]
        # Parse the raw bytes directly: a message is not guaranteed to be
        # UTF-8, so decoding it wholesale first can raise UnicodeDecodeError.
        email_message = email.message_from_bytes(raw_email)

        # Header Details
        # Reset the date for each message so a missing or unparsable Date
        # header neither raises NameError nor reuses the previous value.
        local_message_date = ""
        date_header = email_message['Date']
        date_tuple = email.utils.parsedate_tz(str(date_header)) if date_header else None
        if date_tuple:
            local_date = datetime.datetime.fromtimestamp(email.utils.mktime_tz(date_tuple))
            local_message_date = local_date.strftime("%a, %d %b %Y %H:%M:%S")
        email_from = _header_text(email_message['From'])
        email_to = _header_text(email_message['To'])
        subject = _header_text(email_message['Subject'])

        # Body details
        # Each text/plain part rewrites the same file, so when a message has
        # several such parts the last one is what remains on disk.
        for part in email_message.walk():
            if part.get_content_type() != "text/plain":
                continue
            body = part.get_payload(decode=True)
            if body is None:
                continue
            # Honour the part's declared charset and fall back to UTF-8 when
            # it is missing or names a codec Python does not know.
            charset = part.get_content_charset() or 'utf-8'
            try:
                body_text = body.decode(charset, errors='replace')
            except LookupError:
                body_text = body.decode('utf-8', errors='replace')
            file_name = "email_" + str(x) + ".txt"
            with open(file_name, 'w', encoding='utf-8') as output_file:
                output_file.write("From: %s\nTo: %s\nDate: %s\nSubject: %s\n\nBody: \n\n%s" % (email_from, email_to, local_message_date, subject, body_text))
这将需要外部库,但要简单得多
import datetime
import email
import imaplib
import mailbox
# Save every unread Gmail message (decoded headers plus plain-text body) to
# email_<n>.txt in the current working directory.
EMAIL_ACCOUNT = "your@gmail.com"
PASSWORD = "your password"


def _header_text(raw_value):
    """Return a MIME-decoded header as text, or "" when the header is absent."""
    if raw_value is None:
        return ""
    return str(email.header.make_header(email.header.decode_header(raw_value)))


# The context manager logs out of the server even if processing fails.
with imaplib.IMAP4_SSL('imap.gmail.com') as mail:
    mail.login(EMAIL_ACCOUNT, PASSWORD)
    mail.list()
    mail.select('inbox')
    result, data = mail.uid('search', None, "UNSEEN")  # (ALL/UNSEEN)

    # Split the UID list once instead of re-splitting it on every iteration.
    for x, latest_email_uid in enumerate(data[0].split()):
        result, email_data = mail.uid('fetch', latest_email_uid, '(RFC822)')
        # result, email_data = conn.store(num,'-FLAGS','\\Seen')
        # this might work to set flag to seen, if it doesn't already
        if not email_data or not isinstance(email_data[0], tuple):
            # Nothing usable came back for this UID; skip it.
            continue
        raw_email = email_data[0][1]
        # Parse the raw bytes directly: a message is not guaranteed to be
        # UTF-8, so decoding it wholesale first can raise UnicodeDecodeError.
        email_message = email.message_from_bytes(raw_email)

        # Header Details
        # Reset the date for each message so a missing or unparsable Date
        # header neither raises NameError nor reuses the previous value.
        local_message_date = ""
        date_header = email_message['Date']
        date_tuple = email.utils.parsedate_tz(str(date_header)) if date_header else None
        if date_tuple:
            local_date = datetime.datetime.fromtimestamp(email.utils.mktime_tz(date_tuple))
            local_message_date = local_date.strftime("%a, %d %b %Y %H:%M:%S")
        email_from = _header_text(email_message['From'])
        email_to = _header_text(email_message['To'])
        subject = _header_text(email_message['Subject'])

        # Body details
        # Each text/plain part rewrites the same file, so when a message has
        # several such parts the last one is what remains on disk.
        for part in email_message.walk():
            if part.get_content_type() != "text/plain":
                continue
            body = part.get_payload(decode=True)
            if body is None:
                continue
            # Honour the part's declared charset and fall back to UTF-8 when
            # it is missing or names a codec Python does not know.
            charset = part.get_content_charset() or 'utf-8'
            try:
                body_text = body.decode(charset, errors='replace')
            except LookupError:
                body_text = body.decode('utf-8', errors='replace')
            file_name = "email_" + str(x) + ".txt"
            with open(file_name, 'w', encoding='utf-8') as output_file:
                output_file.write("From: %s\nTo: %s\nDate: %s\nSubject: %s\n\nBody: \n\n%s" % (email_from, email_to, local_message_date, subject, body_text))
import datetime
import email
import imaplib
import mailbox
import re
# Print the text/plain part(s) of the one Yahoo Mail message that matches
# both the sender filter and the subject filter.
EMAIL_ACCOUNT = "yourmail@yahoo.com"
PASSWORD = "password"

# The context manager logs out of the server even if processing fails.
with imaplib.IMAP4_SSL('imap.mail.yahoo.com') as mail:
    mail.login(EMAIL_ACCOUNT, PASSWORD)
    mail.select('INBOX')

    # One search carrying both criteria (IMAP ANDs them); previously the
    # FROM search result was overwritten by the SUBJECT search and never
    # used. It is issued as a UID search because the ids are fed to
    # UID FETCH below; plain SEARCH returns sequence numbers, which are not
    # interchangeable with UIDs.
    result, data = mail.uid('search', None, '(FROM "Sender Email" SUBJECT "Message")')
    matching_uids = data[0].split()

    # Only an unambiguous single match is processed.
    if len(matching_uids) == 1:
        latest_email_uid = matching_uids[0]
        result, email_data = mail.uid('fetch', latest_email_uid, '(RFC822)')
        if email_data and isinstance(email_data[0], tuple):
            raw_email = email_data[0][1]
            # Parse the raw bytes directly; the message may not be UTF-8.
            email_message = email.message_from_bytes(raw_email)
            for part in email_message.walk():
                if part.get_content_type() == "text/plain":
                    # Transfer-decoded payload, printed as bytes.
                    emailBody = part.get_payload(decode=True)
                    print(emailBody)
    else:
        print('Email NOT ' + EMAIL_ACCOUNT)
from imap_tools import MailBox
# Log in to the INBOX folder and print the text and html attributes of every
# fetched message. The handle is named mbox so it does not rebind the
# standard-library `mailbox` module imported earlier in this file.
with MailBox('imap.my.ru').login('acc', 'pwd', 'INBOX') as mbox:
    for msg in mbox.fetch():
        print(msg.text)
        print(msg.html)