How to extract all email addresses in the body from an eml file

145 Views Asked by At

I am working on a project that looks in a mailbox and extract data from mails.

I want to extract all email addressess found in the mail body.

Extract email addresses:

# Python script to extract email addresses from email messages / eml
# Comment from JNevill solved the final bit
import os
import re
from email import policy
from email.parser import BytesParser

emaillocation = os.chdir(r"\\10.21.1.236\websites\vaccinatieplanner\mail\stroomz\onbezorgd")
emaillist = []

for emailmessage in os.listdir(emaillocation):
    with open(f'{emailmessage}', 'rb') as em:
        msg = BytesParser(policy=policy.default).parse(em)
    emailmsgraw = msg.get_body(preferencelist=('plain', 'html'))
    emailmsg = emailmsgraw.get_content()
    emaillist.extend(re.findall(r'[\w.+-]+@[\w-]+\.[\w.-]+', emailmsg))

print(emaillist)
1

There are 1 best solutions below

0
On

Answered and solved with the help of the comment of JNevill

# Python script to extract email addresses from email messages / eml
# Comment from JNevill solved the final bit
import os
import re
from email import policy
from email.parser import BytesParser

emaillocation = os.chdir(r"\\10.21.1.236\websites\vaccinatieplanner\mail\stroomz\onbezorgd")
emaillist = []

for emailmessage in os.listdir(emaillocation):
    with open(f'{emailmessage}', 'rb') as em:
        msg = BytesParser(policy=policy.default).parse(em)
    emailmsgraw = msg.get_body(preferencelist=('plain', 'html'))
    emailmsg = emailmsgraw.get_content()
    emaillist.extend(re.findall(r'[\w.+-]+@[\w-]+\.[\w.-]+', emailmsg))

print(emaillist)