2 fix_imap_internaldate.py - Fix the INTERNALDATE field on IMAP servers
4 Copyright (c) 2012 Intra2net AG
5 Author: Plamen Dimitrov and Thomas Jarosch
7 This program is free software: you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation, either version 3 of the License, or
10 (at your option) any later version.
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
25 import ConfigParser as configparser
28 from mail_date_parser import MailDateParser
29 from mail_iterator import MailIterator
30 from caching_data import CachingData
32 CONFIG_FILENAME = "fix_imap_internaldate.cfg"
33 LOG_FILENAME = "fix_imap_internaldate.log"
34 CSV_FILENAME = "userdata.csv"
37 """Interprets command arguments and initializes configuration and logger.
38 Then begins mail synchronization."""
41 parser = argparse.ArgumentParser(description="Fix the INTERNALDATE field on IMAP servers. "
42 "Small tool to fix the IMAP internaldate "
43 "in case it's too much off compared to the last date "
44 "stored in the received lines.")
45 parser.add_argument('-u', '--update', dest='test_mode', action='store_false',
46 default=True, help='update all e-mails and exit test mode')
48 # config and logging setup
49 config = load_configuration()
50 prepare_logger(config)
51 args = parser.parse_args()
53 # check for update mode in the config
54 if config.getboolean('basic_settings', 'update_mode_i_know_what_i_am_doing'):
55 args.test_mode = False
58 logging.info("Testing mode initiated. No message will be modified on the server.")
60 logging.info("Update mode initiated. Messages will be modified.")
62 # proceed to main functionality
64 synchronize_csv(config, args.test_mode)
65 except KeyboardInterrupt:
66 logging.info("Script was interrupted by the user.")
68 logging.info("All done. Exiting.")
71 def load_configuration():
72 """Loads the script configuration from a file or creates such."""
73 config = configparser.RawConfigParser()
74 success = config.read(CONFIG_FILENAME)
76 # if no file is found create a default one
78 if(not config.has_section('basic_settings')):
79 config.add_section('basic_settings')
80 config.set('basic_settings', 'file_log_level', logging.INFO)
81 config.set('basic_settings', 'console_log_level', logging.INFO)
82 config.set('basic_settings', 'imap_server', 'imap.company.com')
83 config.set('basic_settings', 'tolerance_mins', 30)
84 config.set('basic_settings', 'skip_shared_folders', "True")
85 config.set('basic_settings', 'fallback_to_date_header', "False")
86 config.set('basic_settings', 'update_mode_i_know_what_i_am_doing', "False")
87 with open(CONFIG_FILENAME, 'w') as configfile:
88 config.write(configfile)
89 configfile.write("# 0 NOTSET, 10 DEBUG, 20 INFO, 30 WARNING, 40 ERROR, 50 CRITICAL\n")
90 print("Created initial config %s" % CONFIG_FILENAME)
93 config.get('basic_settings', 'file_log_level')
94 config.get('basic_settings', 'console_log_level')
95 config.get('basic_settings', 'imap_server')
96 config.getint('basic_settings', 'tolerance_mins')
97 config.getboolean('basic_settings', 'skip_shared_folders')
98 config.getboolean('basic_settings', 'fallback_to_date_header')
99 config.getboolean('basic_settings', 'update_mode_i_know_what_i_am_doing')
100 except (configparser.NoSectionError, configparser.NoOptionError, ValueError) as ex:
101 print("Could not read config file '%s': %s." % (CONFIG_FILENAME, ex))
102 print("Please change or remove the config file.")
107 def prepare_logger(config):
108 """Sets up the logging functionality"""
111 with open(LOG_FILENAME, 'w'):
114 # add basic configuration
115 logging.basicConfig(filename=LOG_FILENAME,
116 format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
117 level=config.getint('basic_settings', 'file_log_level'))
119 # add a handler for a console output
120 console = logging.StreamHandler()
121 console.setLevel(config.getint('basic_settings', 'console_log_level'))
122 formatter = logging.Formatter('%(asctime)s - %(name)s - %(levelname)s - %(message)s')
123 console.setFormatter(formatter)
124 logging.getLogger('').addHandler(console)
127 def synchronize_csv(config, test_mode):
128 """Iterates through csv list of users and synchronizes their messages."""
130 # initialize loop permanent data
131 caching_data = CachingData(config.getboolean('basic_settings', 'fallback_to_date_header'))
132 date_parser = MailDateParser()
133 server = config.get('basic_settings', 'imap_server')
134 tolerance = config.getint('basic_settings', 'tolerance_mins') * 60
135 skip_shared_folders = config.getboolean('basic_settings', 'skip_shared_folders')
137 # iterate through the users in the csv data
138 user_reader = csv.DictReader(open(CSV_FILENAME, "r"), delimiter=',')
139 for user in user_reader:
141 session = MailIterator(server, user['username'], user['password'], skip_shared_folders)
142 except UserWarning as ex:
145 for mailbox in session:
147 box = caching_data.retrieve_cached_mailbox(mailbox[0], mailbox[1], user['username'])
148 mail_ids = session.fetch_messages()
149 new_ids = box.synchronize(mail_ids, tolerance)
150 logging.info("%s new messages out of %s found in %s.", len(new_ids), len(mail_ids), box.name)
151 except UserWarning as ex:
156 fetched_internal_date = session.fetch_internal_date(mid)
157 internal_date = date_parser.extract_internal_date(fetched_internal_date)
158 fetched_correct_date = session.fetch_received_date(mid)
159 correct_date = date_parser.extract_received_date(fetched_correct_date)
160 # check for empty received headers
161 if(correct_date == ""):
162 logging.debug("No received date could be found in message uid: %s - mailbox: %s - user: %s.",
163 mid.decode('iso-8859-1'), box.name, box.owner)
164 box.no_received_field += 1
165 # correct these messages if required and override received_date from basic date
166 if(config.getboolean('basic_settings', 'fallback_to_date_header')):
167 fetched_correct_date = session.fetch_basic_date(mid)
168 correct_date = date_parser.extract_received_date(fetched_correct_date)
169 if(correct_date == ""):
170 logging.debug("No fallback date header could be found in message uid: %s - mailbox: %s - user: %s.",
171 mid.decode('iso-8859-1'), box.name, box.owner)
173 if(correct_date == ""):
174 # skip synchronization for this message
177 # preserve only the first received line as fetched if everything is ok
178 fetched_correct_date = fetched_correct_date.split("Received:")[1]
179 except UserWarning as ex:
182 if(date_parser.compare_dates(correct_date, internal_date, tolerance)):
183 logging.warning("Date conflict found in message uid: %s - mailbox: %s - user: %s.\nInternal date %s is different from extracted date %s from header:\n%s.",
184 mid.decode('iso-8859-1'), box.name, box.owner,
185 internal_date.strftime("%d %b %Y %H:%M:%S"),
186 correct_date.strftime("%d %b %Y %H:%M:%S"),
187 fetched_correct_date)
190 session.update_message(mid, box.name, correct_date)
191 except UserWarning as ex:
195 # count total emails for every user and mailbox
196 box.date_conflicts += 1
198 # if all messages were successfully fixed confirm caching
202 # final report on date conflicts
203 caching_data.report_conflicts()
206 if(__name__ == "__main__"):