#!/usr/bin/python import os, argparse, hashlib, email, glob, sqlite3 print sqlite3.version parser = argparse.ArgumentParser(description='Parses emails into an SQLite database, and optionally renders static HTML files.') parser.add_argument('-p', '--pattern', dest='pattern', action='store', default='*', help='glob pattern (including path) that has to be matched for a file to be parsed') parser.add_argument('-r', '--render', dest='render', action='store_true', help='render static HTML files using the template files in templates/') args = parser.parse_args() options = vars(args) database = sqlite3.connect('emails.db') cursor = database.cursor() try: # Try to create the table cursor.execute("CREATE TABLE emails (`message_id`, `from`, `to`, `subject`, `date`, `body`, `html`, `hash`)") except sqlite3.OperationalError: # Table already exists pass file_list = glob.glob(options['pattern']) for email_file in file_list: message = email.message_from_file(open(email_file)) if message['message-id'] is None: print "%s is not a valid e-mail file." % email_file else: if 'subject' not in message or message['subject'] is None: subject = "" else: subject = message['subject'] sha1_hash = hashlib.sha1("%s/%s/%s/%s" % (message['from'], message['to'], message['message-id'], subject)).hexdigest() timestamp = 0 textbody = "" htmlbody = "" new_row = (message['message-id'], message['from'], message['to'], subject, timestamp, textbody, htmlbody, sha1_hash) cursor.execute("INSERT INTO emails VALUES (?, ?, ?, ?, ?, ?, ?, ?)", new_row) print "Successfully parsed and inserted e-mail with SHA1 hash %s." % sha1_hash database.commit() print "Changes successfully committed to database, exiting..."