Commit | Line | Data |
---|---|---|
c9da760a PD |
1 | ''' |
2 | fix_imap_internaldate.py - Fix the INTERNALDATE field on IMAP servers | |
3 | ||
4 | Copyright (c) 2012 Intra2net AG | |
5 | Author: Plamen Dimitrov | |
6 | ||
7 | This program is free software: you can redistribute it and/or modify | |
8 | it under the terms of the GNU General Public License as published by | |
9 | the Free Software Foundation, either version 3 of the License, or | |
10 | (at your option) any later version. | |
11 | ||
12 | This program is distributed in the hope that it will be useful, | |
13 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
14 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
15 | GNU General Public License for more details. | |
c9da760a PD |
16 | ''' |
17 | ||
d0cfa9d0 | 18 | import sys |
c9da760a | 19 | import csv |
d0cfa9d0 PD |
20 | import argparse |
21 | # python version handling | |
22 | try: | |
23 | import configparser | |
24 | except ImportError: | |
25 | print("This module needs python version 3 or later.") | |
26 | sys.exit() | |
8fe4e3ff | 27 | import logging |
8a9d4c89 | 28 | from mail_date_parser import MailDateParser |
c9da760a | 29 | from mail_iterator import MailIterator |
8301e589 | 30 | from caching_data import CachingData |
c9da760a | 31 | |
6177b21d TJ |
# File names used by the script; all are relative paths.
# Settings file read (and created with defaults when missing) by load_configuration().
CONFIG_FILENAME = "fix_imap_internaldate.cfg"
# Log file that prepare_logger() empties and then writes to.
LOG_FILENAME = "fix_imap_internaldate.log"
# User list iterated by synchronize_csv(); it reads the columns 'username' and 'password'.
CSV_FILENAME = "userdata.csv"
35 | ||
def main():
    """Parse the command line, set up configuration and logging, then run the fix.

    The script runs in test mode by default. Passing ``-u``/``--update``
    switches ``test_mode`` off, and that flag is handed to synchronize_csv().

    A KeyboardInterrupt raised during the synchronization is logged and not
    propagated, so the final "All done" message is still written.
    """
    parser = argparse.ArgumentParser(description="Fix the INTERNALDATE field on IMAP servers. "
                                     "Small tool to fix the IMAP internaldate "
                                     "in case it's too much off compared to the last date "
                                     "stored in the received lines.")
    parser.add_argument('-u', '--update', dest='test_mode', action='store_false',
                        default=True, help='update all e-mails and exit test mode')

    # Parse the command line before anything touches the disk: parse_args()
    # exits on --help or on invalid arguments, and such a run must neither
    # create the configuration file nor empty the log of a previous run.
    args = parser.parse_args()

    # config and logging setup
    config = load_configuration()
    prepare_logger(config)
    if args.test_mode:
        logging.info("Testing mode initiated. No message will be modified on the server.")
    else:
        logging.info("Update mode initiated. Messages will be modified.")

    # proceed to main functionality
    try:
        synchronize_csv(config, args.test_mode)
    except KeyboardInterrupt:
        logging.info("Script was interrupted by the user.")

    logging.info("All done. Exiting.")
65 | ||
def load_configuration():
    """Load the script configuration, creating a default file when none is readable.

    CONFIG_FILENAME is read first. If it could not be read, a
    ``basic_settings`` section with default values is built in memory and
    written to CONFIG_FILENAME, followed by a comment line listing the numeric
    logging levels.

    Returns:
        configparser.RawConfigParser: the loaded or newly created configuration.
    """
    config = configparser.RawConfigParser()
    files_read = config.read(CONFIG_FILENAME)
    if not files_read:
        # Every default is stored as a string. The written file is the same as
        # with raw ints, but get() now returns the same type for a freshly
        # created configuration as for one parsed from the file.
        defaults = (
            ('file_log_level', str(logging.INFO)),
            ('console_log_level', str(logging.INFO)),
            ('imap_server', 'imap.company.com'),
            ('tolerance_mins', '30'),
            ('skip_shared_folders', 'ON'),
            ('fallback_to_date_header', 'OFF'),
        )
        config.add_section('basic_settings')
        for option, value in defaults:
            config.set('basic_settings', option, value)
        with open(CONFIG_FILENAME, 'w') as configfile:
            config.write(configfile)
            # legend for the two *_log_level options
            configfile.write("# 0 NOTSET, 10 DEBUG, 20 INFO, 30 WARNING, 40 ERROR, 50 CRITICAL")
    return config
82 | ||
def prepare_logger(config):
    """Set up logging to LOG_FILENAME and to a console stream handler.

    The log file is emptied first. The file level and the console level are
    read as integers from the ``file_log_level`` and ``console_log_level``
    options of the ``basic_settings`` section of ``config``.
    """
    record_layout = '%(asctime)s - %(name)s - %(levelname)s - %(message)s'

    # start every run with an empty log file
    open(LOG_FILENAME, 'w').close()

    # basic configuration: records go to the log file
    file_level = config.getint('basic_settings', 'file_log_level')
    logging.basicConfig(filename=LOG_FILENAME, format=record_layout, level=file_level)

    # additional handler with its own level for console output
    console_level = config.getint('basic_settings', 'console_log_level')
    console_handler = logging.StreamHandler()
    console_handler.setLevel(console_level)
    console_handler.setFormatter(logging.Formatter(record_layout))
    logging.getLogger().addHandler(console_handler)
102 | ||
def synchronize_csv(config, test_mode):
    """Iterate through the csv list of users and synchronize their messages.

    For every row of CSV_FILENAME (columns ``username`` and ``password``) a
    MailIterator session is opened on the configured server and each mailbox
    it yields is processed. For every message id returned by the cached
    mailbox's ``synchronize()``, the fetched internal date is compared with
    the date extracted from the received header. A conflict is logged as a
    warning and counted in ``box.date_conflicts``.

    UserWarning raised at the session, mailbox or message step is logged as an
    error and only that user, mailbox or message is skipped.

    Args:
        config: configuration providing ``get``/``getint`` for the options
            ``imap_server``, ``tolerance_mins`` and ``fallback_to_date_header``
            of the ``basic_settings`` section.
        test_mode: when true, no message is updated and the mailbox cache is
            not confirmed; conflicts are still logged and counted.
    """
    # initialize loop permanent data
    caching_data = CachingData()
    date_parser = MailDateParser()
    server = config.get('basic_settings', 'imap_server')
    # configured in minutes; the factor 60 presumably converts to seconds (confirm against compare_dates)
    tolerance = config.getint('basic_settings', 'tolerance_mins') * 60

    # The context manager closes the user list once it has been processed, and
    # newline='' is what the csv module asks for on files handed to a reader.
    with open(CSV_FILENAME, "r", newline='') as csv_file:
        # iterate through the users in the csv data
        user_reader = csv.DictReader(csv_file, delimiter=',')
        for user in user_reader:
            try:
                session = MailIterator(server, user['username'], user['password'])
            except UserWarning as ex:
                logging.error(ex)
                continue
            for mailbox in session:
                try:
                    box = caching_data.retrieve_cached_mailbox(mailbox[0], mailbox[1], user['username'])
                    mail_ids = session.fetch_messages()
                    new_ids = box.synchronize(mail_ids, tolerance)
                    logging.info("%s new messages out of %s found in %s.", len(new_ids), len(mail_ids), box.name)
                except UserWarning as ex:
                    logging.error(ex)
                    continue
                for mid in new_ids:
                    try:
                        fetched_internal_date = session.fetch_internal_date(mid)
                        internal_date = date_parser.extract_internal_date(fetched_internal_date)
                        fetched_correct_date = session.fetch_received_date(mid)
                        correct_date = date_parser.extract_received_date(fetched_correct_date)
                        # check for empty received headers
                        if correct_date == "":
                            logging.debug("No received date could be found in message uid: %s - mailbox: %s - user: %s.",
                                          mid.decode('iso-8859-1'), box.name, box.owner)
                            box.no_received_field += 1
                            # correct these messages if required and override received_date from basic date
                            if config.get('basic_settings', 'fallback_to_date_header') == "ON":
                                fetched_correct_date = session.fetch_basic_date(mid)
                                # NOTE(review): the result is not re-checked for "" here - confirm
                                # that extract_received_date cannot return an empty value for it.
                                correct_date = date_parser.extract_received_date(fetched_correct_date)
                            else:
                                # skip synchronization for this message
                                continue
                        else:
                            # preserve only the first received line as fetched if everything is ok
                            fetched_correct_date = fetched_correct_date.split("Received:")[1]
                    except UserWarning as ex:
                        logging.error(ex)
                        continue
                    if date_parser.compare_dates(correct_date, internal_date, tolerance):
                        logging.warning("Date conflict found in message uid: %s - mailbox: %s - user: %s.\nInternal date %s is different from extracted date %s from header:\n%s.",
                                        mid.decode('iso-8859-1'), box.name, box.owner,
                                        internal_date.strftime("%d %b %Y %H:%M:%S"),
                                        correct_date.strftime("%d %b %Y %H:%M:%S"),
                                        fetched_correct_date)
                        if not test_mode:
                            try:
                                session.update_message(mid, box.name, correct_date)
                            except UserWarning as ex:
                                # a failed update is logged and the message is not counted
                                logging.error(ex)
                                continue

                        # count total emails for every user and mailbox
                        box.date_conflicts += 1

                # confirm caching for this mailbox once its messages were processed (update mode only)
                if not test_mode:
                    box.confirm_change()

    # final report on date conflicts
    caching_data.report_conflicts()
176 | ||
c9da760a PD |
# Start the tool only when this file is executed as a script.
if __name__ == "__main__":
    main()