python imaplib获取gmail收件箱主题标题和发件人姓名

sad*_*ave 22 python gmail email-headers imaplib

我正在使用pythons imaplib连接到我的Gmail帐户.我想检索前15条消息(未读或读取,无关紧要)并仅显示主题和发件人姓名(或地址),但不知道如何显示收件箱的内容.

这是我到目前为止的代码(成功连接)

import imaplib

mail = imaplib.IMAP4_SSL('imap.gmail.com')
mail.login('mygmail@gmail.com', 'somecrazypassword')
mail.list()
mail.select('inbox')

#need to add some stuff in here

mail.logout()
Run Code Online (Sandbox Code Playgroud)

我相信这应该很简单,我对imaplib库的命令还不够熟悉.任何帮助都必须得到赞赏......

更新 感谢Julian我可以遍历每条消息并检索整个内容:

typ, data = mail.search(None, 'ALL')
for num in data[0].split():
   typ, data = mail.fetch(num, '(RFC822)')
   print 'Message %s\n%s\n' % (num, data[0][1])
mail.close()
Run Code Online (Sandbox Code Playgroud)

但我只想要主题和发送者.是否有针对这些项目的imaplib命令,或者我是否必须解析文本的全部内容[0] [1]:主题和发件人?

更新 确定,让主题和发件人部分工作,但迭代(1,15)由desc命令完成,显然首先显示最旧的消息.我怎么能改变这个?我试过这样做:

for i in range( len(data[0])-15, len(data[0]) ):
     print data
Run Code Online (Sandbox Code Playgroud)

但这只是给了我None所有15次迭代......任何想法?我也试过mail.sort('REVERSE DATE', 'UTF-8', 'ALL')但是gmail不支持.sort()函数

更新 找出一种方法:

#....^other code is the same as above except need to import email module
mail.select('inbox')
typ, data = mail.search(None, 'ALL')
ids = data[0]
id_list = ids.split()
#get the most recent email id
latest_email_id = int( id_list[-1] )

#iterate through 15 messages in decending order starting with latest_email_id
#the '-1' dictates reverse looping order
for i in range( latest_email_id, latest_email_id-15, -1 ):
   typ, data = mail.fetch( i, '(RFC822)' )

   for response_part in data:
      if isinstance(response_part, tuple):
          msg = email.message_from_string(response_part[1])
          varSubject = msg['subject']
          varFrom = msg['from']

   #remove the brackets around the sender email address
   varFrom = varFrom.replace('<', '')
   varFrom = varFrom.replace('>', '')

   #add ellipsis (...) if subject length is greater than 35 characters
   if len( varSubject ) > 35:
      varSubject = varSubject[0:32] + '...'

   print '[' + varFrom.split()[-1] + '] ' + varSubject
Run Code Online (Sandbox Code Playgroud)

这给了我最新的15个邮件主题和发件人地址按要求降序!感谢所有帮助过的人!

Tor*_*xed 14

    c.select('INBOX', readonly=True)

    for i in range(1, 30):
        typ, msg_data = c.fetch(str(i), '(RFC822)')
        for response_part in msg_data:
            if isinstance(response_part, tuple):
                msg = email.message_from_string(response_part[1])
                for header in [ 'subject', 'to', 'from' ]:
                    print '%-8s: %s' % (header.upper(), msg[header])
Run Code Online (Sandbox Code Playgroud)

这应该让您了解如何检索主题和从?

  • 什么是电子邮件?你指的是我的'邮件'变量吗?什么是message_from_string()组成的?我收到一条错误,指出`AttributeError("未知的IMAP4命令:'%s'"%attr)AttributeError:未知的IMAP4命令:'message_from_string' (2认同)
  • 没关系,想通了,我没有包含电子邮件模块.谢谢 (2认同)

小智 5

对于那些寻找如何检查邮件和解析标头的人,这是我所使用的:

def parse_header(str_after, checkli_name, mailbox) :
    #typ, data = m.search(None,'SENTON', str_after)
    print mailbox
    m.SELECT(mailbox)
    date = (datetime.date.today() - datetime.timedelta(1)).strftime("%d-%b-%Y")
    #date = (datetime.date.today().strftime("%d-%b-%Y"))
    #date = "23-Jul-2012"

    print date
    result, data = m.uid('search', None, '(SENTON %s)' % date)
    print data

    doneli = []
    for latest_email_uid in data[0].split():
        print latest_email_uid
        result, data = m.uid('fetch', latest_email_uid, '(RFC822)')
        raw_email = data[0][1]

        import email
        email_message = email.message_from_string(raw_email)
        print email_message['To']
        print email_message['Subject']
        print email.utils.parseaddr(email_message['From'])
        print email_message.items() # print all headers
Run Code Online (Sandbox Code Playgroud)


Edw*_*man 5

这是我从电子邮件中获取有用信息的解决方案:

import datetime
import email
import imaplib
import mailbox


EMAIL_ACCOUNT = "your@gmail.com"
PASSWORD = "your password"

mail = imaplib.IMAP4_SSL('imap.gmail.com')
mail.login(EMAIL_ACCOUNT, PASSWORD)
mail.list()
mail.select('inbox')
result, data = mail.uid('search', None, "UNSEEN") # (ALL/UNSEEN)
i = len(data[0].split())

for x in range(i):
    latest_email_uid = data[0].split()[x]
    result, email_data = mail.uid('fetch', latest_email_uid, '(RFC822)')
    # result, email_data = conn.store(num,'-FLAGS','\\Seen') 
    # this might work to set flag to seen, if it doesn't already
    raw_email = email_data[0][1]
    raw_email_string = raw_email.decode('utf-8')
    email_message = email.message_from_string(raw_email_string)

    # Header Details
    date_tuple = email.utils.parsedate_tz(email_message['Date'])
    if date_tuple:
        local_date = datetime.datetime.fromtimestamp(email.utils.mktime_tz(date_tuple))
        local_message_date = "%s" %(str(local_date.strftime("%a, %d %b %Y %H:%M:%S")))
    email_from = str(email.header.make_header(email.header.decode_header(email_message['From'])))
    email_to = str(email.header.make_header(email.header.decode_header(email_message['To'])))
    subject = str(email.header.make_header(email.header.decode_header(email_message['Subject'])))

    # Body details
    for part in email_message.walk():
        if part.get_content_type() == "text/plain":
            body = part.get_payload(decode=True)
            file_name = "email_" + str(x) + ".txt"
            output_file = open(file_name, 'w')
            output_file.write("From: %s\nTo: %s\nDate: %s\nSubject: %s\n\nBody: \n\n%s" %(email_from, email_to,local_message_date, subject, body.decode('utf-8')))
            output_file.close()
        else:
            continue
Run Code Online (Sandbox Code Playgroud)