Handle difference in pickle protocol between python 2.x and 3.x
[imap-fix-internaldate] / src / caching_data.py
CommitLineData
8301e589
PD
'''
caching_data.py - The module contains the CachingData class.

Copyright (c) 2012 Intra2net AG
Author: Plamen Dimitrov

This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
'''
import os, platform, tempfile
import pickle
import logging

from mailbox_state import MailboxState

# Name of the pickle file holding the cached mailbox states
# (a relative path, so it is resolved against the current working directory).
CACHE_FILENAME = "message_cache.dat"
# Version tag stored in the cache file; a cache written with a different
# version is discarded when it is loaded.
CACHE_VERSION = "1"

class CachingData:
    """This class is responsible for the caching of data.

    The cache is stored in CACHE_FILENAME as a pickled tuple
    ``(cache_info, data)``. ``cache_info`` is the string
    "<version> <fallback mode>" and ``data`` maps user names to
    dictionaries of mailbox key -> mailbox object.
    """

    # class attributes
    # string with the version of the cache (compared against CACHE_VERSION)
    version = None
    # string form of the date header fallback mode the cache belongs to
    fallback_to_date_header = None
    # dictionary of usernames as keys and dictionaries as values
    # the second dictionaries have unique mailbox keys and mailboxes as values
    data = None

    def __init__(self, fallback_mode):
        """Load the cache file or create a new, empty one.

        fallback_mode -- current fallback setting; its str() form must match
                         the one stored in the cache file.

        A cache file that is missing, unreadable, written with another cache
        version or with another fallback mode is replaced by an empty cache.
        Errors while writing the replacement file are propagated.
        """
        current_mode = str(fallback_mode)
        try:
            # NOTE(security): pickle can execute arbitrary code while loading,
            # the cache file must never come from an untrusted source.
            with open(CACHE_FILENAME, 'rb') as cachefile:
                cache_info, self.data = pickle.load(cachefile)
            cache_info = cache_info.split(' ')
            self.version = cache_info[0]
            if self.version != CACHE_VERSION:
                raise IOError("Cache file has version %s and the script version is %s" % (self.version, CACHE_VERSION))
            self.fallback_to_date_header = cache_info[1]
            if self.fallback_to_date_header != current_mode:
                raise IOError("Cache file date fallback mode setting is different than current settings")
            logging.info("Cache file %s loaded", CACHE_FILENAME)
            logging.info("%s users found.", len(self.data))
        except (IOError, ValueError, EOFError, IndexError, TypeError,
                AttributeError, ImportError, pickle.UnpicklingError) as ex:
            # ValueError covers an unsupported pickle protocol (file written by
            # a newer python), EOFError an empty or truncated file; the other
            # types are raised for damaged or foreign pickle content.
            logging.warning("Couldn't load cache file %s: %s", CACHE_FILENAME, ex)
            logging.warning("DELETING CACHE")
            self.version = CACHE_VERSION
            # remember the current mode, __del__ needs it to write the header
            self.fallback_to_date_header = current_mode
            stored_cache_info = self.version + ' ' + current_mode
            self.data = {}
            with open(CACHE_FILENAME, 'wb') as cachefile:
                pickle.dump((stored_cache_info, self.data), cachefile)

    def __del__(self):
        """Store all mailboxes flagged with needs_save in the cache file.

        The data is written to a temporary file in the directory of the cache
        file which is then renamed over the cache file. Nothing is written
        if no mailbox needs saving.
        """
        # the constructor may have failed before any data was set up
        if self.data is None:
            return

        # prepare data based on a save flag
        saved_data = {}
        for user in self.data:
            saved_boxes = {}
            for box_key in self.data[user]:
                mailbox = self.data[user][box_key]
                if mailbox.needs_save:
                    saved_boxes[box_key] = mailbox
                    logging.debug("The mailbox %s will be saved.", mailbox.name)
            if saved_boxes:
                saved_data[user] = saved_boxes
            else:
                logging.debug("The user %s will not be saved.", user)
        self.data = saved_data

        # avoid test mode or cases where nothing needs saving
        if not saved_data:
            return

        stored_cache_info = self.version + ' ' + self.fallback_to_date_header

        # create temporary file next to the cache file so that the final
        # rename stays on the same file system
        location = os.path.dirname(os.path.abspath(CACHE_FILENAME))
        file_descriptor, tmpname = tempfile.mkstemp(dir=location)
        renamed = False
        try:
            # serialize in file; the file is closed (and flushed) before it
            # gets renamed, an open file cannot be renamed on windows
            with os.fdopen(file_descriptor, 'wb') as cachefile:
                pickle.dump((stored_cache_info, self.data), cachefile)
            logging.debug("%s users stored.", len(self.data))

            # handle windows non-atomic rename
            if platform.system() == 'Windows' and os.path.exists(CACHE_FILENAME):
                os.unlink(CACHE_FILENAME)

            os.rename(tmpname, CACHE_FILENAME)
            renamed = True
        finally:
            # clean up temporary file if anything went wrong
            if not renamed and os.path.exists(tmpname):
                os.unlink(tmpname)

        logging.info("Wrote cache file %s", CACHE_FILENAME)

    def retrieve_cached_mailbox(self, name, uidvalidity, user):
        """Retrieve a cached mailbox or create it.

        The mailbox key is the name without surrounding double quotes
        followed by the uidvalidity (both are expected to be strings).
        """
        box_key = name.strip('"') + uidvalidity
        if user not in self.data:
            self.data[user] = {}
            logging.debug("New user %s cached.", user)
        user_boxes = self.data[user]
        if box_key not in user_boxes:
            user_boxes[box_key] = MailboxState(name, uidvalidity, user)
            logging.debug("New mailbox %s cached.", box_key)
        return user_boxes[box_key]

    def report_conflicts(self):
        """Write a date conflicts report in a file.

        The report goes to "conflict_stats.txt" and contains one line per
        mailbox plus a TOTAL line per user.
        """
        with open("conflict_stats.txt", 'w') as statsfile:
            for user in self.data:
                statsfile.write("user: %s\n" % user)
                total_conflicts = 0
                total_missing = 0
                for box_key in self.data[user]:
                    mailbox = self.data[user][box_key]
                    total_conflicts += mailbox.date_conflicts
                    total_missing += mailbox.no_received_field
                    statsfile.write("date conflicts: %-15.15s missing header: %-15.15s mailbox: %s\n"
                                    % (mailbox.date_conflicts,
                                       mailbox.no_received_field,
                                       mailbox.name))
                statsfile.write("date conflicts: %-15.15s missing header: %-15.15s TOTAL \n\n"
                                % (total_conflicts, total_missing))
        return