I wrote something a couple of weeks ago that might help.
It works with POP3 mailboxes and it handles messages with
body text and/or attachments, but you could easily change
it.
Hope it helps.
Larry Bates
Syscon, Inc.
import poplib
import email
import email.Parser
import os
import sys
class email_attachment:
def __init__(self, messagenum, attachmentnum, filename, contents):
'''
arguments:
messagenum - message number of this message in the Inbox
attachmentnum - attachment number for this attachment
filename - filename for this attachment
contents - attachment's contents
'''
self.messagenum=messagenum
self.attachmentnum=attachmentnum
self.filename=filename
self.contents=contents
return
def save(self, savepath, savefilename=None):
'''
Method to save the contents of an attachment to a file
arguments:
savepath - path where file is to be saved
safefilename - optional name (if None will use filename of
attachment
'''
savefilename=savefilename or self.filename
f=open(os.path.join(savepath, savefilename),"wb")
f.write(self.contents)
f.close()
return
class email_msg:
def __init__(self, messagenum, contents):
self.messagenum=messagenum
self.contents=contents
self.attachments_index=0 # Index of attachments for next method
self.ATTACHMENTS=[] # List of attachment objects
self.msglines='\n'.join(contents[1])
#
# See if I can parse the message lines with email.Parser
#
self.msg=email.Parser.Parser().parsestr(self.msgli nes)
if self.msg.is_multipart():
attachmentnum=0
for part in self.msg.walk():
# multipart/* are just containers
mptype=part.get_content_maintype()
filename = part.get_filename()
if mptype == "multipart": continue
if filename: # Attached object with filename
attachmentnum+=1
self.ATTACHMENTS.append(email_attachment(messagenu m,
attachmentnum,
filename,
part.get_payload(decode=1)))
print "Attachment filename=%s" % filename
else: # Must be body portion of multipart
self.body=part.get_payload()
else: # Not multipart, only body portion exists
self.body=self.msg.get_payload()
return
def get(self, key):
try: return self.msg.get(key)
except:
emsg="email_msg-Unable to get email key=%s information" % key
print emsg
sys.exit(emsg)
def has_attachments(self):
return (len(self.ATTACHMENTS) > 0)
def __iter__(self):
return self
def next(self):
#
# Try to get the next attachment
#
try: ATTACHMENT=self.ATTACHMENTS[self.attachments_index]
except:
self.attachments_index=0
raise StopIteration
#
# Increment the index pointer for the next call
#
self.attachments_index+=1
return ATTACHMENT
class pop3_inbox:
def __init__(self, server, userid, password):
self._trace=0
if self._trace: print "pop3_inbox.__init__-Entering"
self.result=0 # Result of server communication
self.MESSAGES=[] # List for storing message objects
self.messages_index=0 # Index of message for next method
#
# See if I can connect using information provided
#
try:
if self._trace: print "pop3_inbox.__init__-Calling
poplib.POP3(server)"
self.connection=poplib.POP3(server)
if self._trace: print "pop3_inbox.__init__-Calling
connection.user(userid)"
self.connection.user(userid)
if self._trace: print "pop3_inbox.__init__-Calling
connection.pass_(password)"
self.connection.pass_(password)
except:
if self._trace: print "pop3_inbox.__init__-Login failure,
closing connection"
self.result=1
self.connection.quit()
#
# Get count of messages and size of mailbox
#
if self._trace: print "pop3_inbox.__init__-Calling
connection.stat()"
self.msgcount, self.size=self.connection.stat()
#
# Loop over all the messages processing each one in turn
#
for msgnum in range(1, self.msgcount+1):
self.MESSAGES.append(email_msg(msgnum,
self.connection.retr(msgnum)))
if self._trace: print "pop3_inbox.__init__-Leaving"
return
def close(self):
self.connection.quit()
return
def remove(self, msgnumorlist):
if isinstance(msgnumorlist, int): self.connection.dele(msgnumorlist)
elif isinstance(msgnumorlist, (list, tuple)):
map(self.connection.dele, msgnumorlist)
else:
emsg="pop3_inbox.remove-msgnumorlist must be type int, list, or
tuple, not %s" % type(msgnumorlist)
print emsg
sys.exit(emsg)
self.msgcount-=1
return
def __len__(self):
return self.msgcount
def __iter__(self):
return self
def next(self):
#
# Try to get the next attachment
#
try: MESSAGE=self.MESSAGES[self.messages_index]
except:
self.messages_index=0
raise StopIteration
#
# Increment the index pointer for the next call
#
self.messages_index+=1
return MESSAGE
if __name__=="__main__":
server="www.domain.com" # set server here
userid="userid" # set userid here
password="password" # set password here
inbox=pop3_inbox(server, userid, password)
if inbox.result:
emsg="Failure connecting to pop3_inbox"
print emsg
sys.exit(emsg)
print "Message count=%i, Inbox size=%i" % (inbox.msgcount, inbox.size)
counter=0
for m in inbox:
counter+=1
print "Subject: %s" % m.get('subject')
print "-------------Message (%i) body lines---------------" %
counter
print m.body
print "-------------End message (%i) body lines-----------" %
counter
if m.has_attachments():
acounter=0
for a in m:
acounter+=1
print "-------------Message (%i) attachments-------------" %
counter
print "%i: %s" % (acounter, a.filename)
print "-------------End message (%i) attachments---------" %
counter
a.save(r"C:\temp")
else: print "-------------Message has no attachments----------"
#
# See if I can delete all messages
#
#if inbox.msgcount: inbox.remove(range(1, inbox.msgcount+1))
inbox.close()
"chuck amadi" <ch*********@ntlworld.com> wrote in message
news:ma*************************************@pytho n.org...
By the way list is there a better way than using the readlines() to >parse the mail data into a file , because Im using
>email.message_from_file it returns
>all the data i.e reads one entire line from the file , headers as well >as just the desired body messages .
>
>fp = file("/home/chuck/pythonScript/testbox")
>mb = mailbox.UnixMailbox(fp,
>email.message_from_file)
>
>
>mailout = file("/home/chuck/pythonScript/SurveyResults.txt","w")
>for mail in fp.readlines():
> mailout.write(mail)
>
>Something like this>
>
>for mail in mb:
> body = mail.get_payload()
> mailout.write(body) # write only the body messages to SurveyResults.txt >
>Cheers if the is a better way I can't get my head round how I can print >mail (
>only the body messages) to screen and the entire mail headers and body >to the new file.
>
>Hi have any one got any suggstions to my script I can parse the email >body messages to screen but I want the same desired effect to save to a >new file.I have tried a few things to no effect.
.
.
.
There's a lot going on in your message. I *think* what you want
is the suggestion to replace
for mail in fp.readlines():
mailout.write(mail)
with
mailout.write(fp.read())
--
Hi again where I print mail.get_payload()
I want to write this to the file. Bu uisng readlinds() function I
obviously get the entire contents including the headers thus I want to
do something like this
for bdymsg in mb:
bdymsg = mail.get_payload()
print mail.get_payload()# prints body msg's to screen
mailout.write(bdymsg)
# mailout.write(mail.get_payload()) # Something along these lines.
mailout.close()