Merge branch 'ss/maildir-simplify-save' into next

Conflicts:
	Changelog.draft.rst
This commit is contained in:
Nicolas Sebrecht 2011-06-13 16:30:06 +02:00
commit 543c7b2fb7
2 changed files with 59 additions and 55 deletions

@ -16,16 +16,19 @@ New Features
Changes Changes
------- -------
* Maildirs use less memory while syncing.
Bug Fixes Bug Fixes
--------- ---------
* Saving to Maildirs now checks for file existence without race conditions.
* A bug in the underlying imap library has been fixed that could * A bug in the underlying imap library has been fixed that could
potentially lead to data loss if the server interrupted responses with potentially lead to data loss if the server interrupted responses with
unexpected but legal server status responses. This would mainly occur unexpected but legal server status responses. This would mainly occur
in folders with many thousands of emails. Upgrading from the previous in folders with many thousands of emails. Upgrading from the previous
release is strongly recommended. release is strongly recommended.
Peanding for the next major release Pending for the next major release
================================== ==================================
* UIs get shorter and nicer names. (API changing) * UIs get shorter and nicer names. (API changing)

@ -28,6 +28,8 @@ try:
except ImportError: except ImportError:
from md5 import md5 from md5 import md5
from offlineimap import OfflineImapError
uidmatchre = re.compile(',U=(\d+)') uidmatchre = re.compile(',U=(\d+)')
flagmatchre = re.compile(':.*2,([A-Z]+)') flagmatchre = re.compile(':.*2,([A-Z]+)')
timestampmatchre = re.compile('(\d+)'); timestampmatchre = re.compile('(\d+)');
@ -63,12 +65,15 @@ class MaildirFolder(BaseFolder):
self.accountname = accountname self.accountname = accountname
BaseFolder.__init__(self) BaseFolder.__init__(self)
#self.ui is set in BaseFolder.init() #self.ui is set in BaseFolder.init()
# Cache the full folder path, as we use getfullname() very often
self._fullname = os.path.join(self.getroot(), self.getname())
def getaccountname(self): def getaccountname(self):
return self.accountname return self.accountname
def getfullname(self): def getfullname(self):
return os.path.join(self.getroot(), self.getname()) """Return the absolute file path to the Maildir folder (sans cur|new)"""
return self._fullname
def getuidvalidity(self): def getuidvalidity(self):
"""Maildirs have no notion of uidvalidity, so we just return a magic """Maildirs have no notion of uidvalidity, so we just return a magic
@ -182,81 +187,73 @@ class MaildirFolder(BaseFolder):
return self.messagelist return self.messagelist
def getmessage(self, uid): def getmessage(self, uid):
"""Return the content of the message"""
filename = self.messagelist[uid]['filename'] filename = self.messagelist[uid]['filename']
file = open(filename, 'rt') filepath = os.path.join(self.getfullname(), filename)
file = open(filepath, 'rt')
retval = file.read() retval = file.read()
file.close() file.close()
#TODO: WHY are we replacing \r\n with \n here? And why do we
# read it as text?
return retval.replace("\r\n", "\n") return retval.replace("\r\n", "\n")
def getmessagetime( self, uid ): def getmessagetime( self, uid ):
filename = self.messagelist[uid]['filename'] filename = self.messagelist[uid]['filename']
st = os.stat(filename) filepath = os.path.join(self.getfullname(), filename)
st = os.stat(filepath)
return st.st_mtime return st.st_mtime
def savemessage(self, uid, content, flags, rtime): def savemessage(self, uid, content, flags, rtime):
# This function only ever saves to tmp/, # This function only ever saves to tmp/,
# but it calls savemessageflags() to actually save to cur/ or new/. # but it calls savemessageflags() to actually save to cur/ or new/.
self.ui.debug('maildir', 'savemessage: called to write with flags %s and content %s' % \ self.ui.debug('maildir', 'savemessage: called to write with flags %s '
(repr(flags), repr(content))) 'and content %s' % (repr(flags), repr(content)))
if uid < 0: if uid < 0:
# We cannot assign a new uid. # We cannot assign a new uid.
return uid return uid
if uid in self.messagelist: if uid in self.messagelist:
# We already have it. # We already have it, just update flags.
self.savemessageflags(uid, flags) self.savemessageflags(uid, flags)
return uid return uid
# Otherwise, save the message in tmp/ and then call savemessageflags() # Otherwise, save the message in tmp/ and then call savemessageflags()
# to give it a permanent home. # to give it a permanent home.
tmpdir = os.path.join(self.getfullname(), 'tmp') tmpdir = os.path.join(self.getfullname(), 'tmp')
messagename = None timeval, timeseq = gettimeseq()
attempts = 0 messagename = '%d_%d.%d.%s,U=%d,FMD5=%s' % \
while 1: (timeval,
if attempts > 15: timeseq,
raise IOError, "Couldn't write to file %s" % messagename os.getpid(),
timeval, timeseq = gettimeseq() socket.gethostname(),
messagename = '%d_%d.%d.%s,U=%d,FMD5=%s' % \ uid,
(timeval, md5(self.getvisiblename()).hexdigest())
timeseq, # open file and write it out
os.getpid(), try:
socket.gethostname(), fd = os.open(os.path.join(tmpdir, messagename),
uid, os.O_EXCL|os.O_CREAT|os.O_WRONLY)
md5(self.getvisiblename()).hexdigest()) except OSError, e:
if os.path.exists(os.path.join(tmpdir, messagename)): if e.errno == 17:
time.sleep(2) #FILE EXISTS ALREADY
attempts += 1 severity = OfflineImapError.ERROR.MESSAGE
raise OfflineImapError("Unique filename %s already existing." %\
messagename, severity)
else: else:
break raise
tmpmessagename = messagename.split(',')[0]
self.ui.debug('maildir', 'savemessage: using temporary name %s' % tmpmessagename)
file = open(os.path.join(tmpdir, tmpmessagename), "wt")
file.write(content)
file = os.fdopen(fd, 'wt')
file.write(content)
# Make sure the data hits the disk # Make sure the data hits the disk
file.flush() file.flush()
if self.dofsync: if self.dofsync:
os.fsync(file.fileno()) os.fsync(fd)
file.close() file.close()
if rtime != None:
os.utime(os.path.join(tmpdir,tmpmessagename), (rtime,rtime))
self.ui.debug('maildir', 'savemessage: moving from %s to %s' % \
(tmpmessagename, messagename))
if tmpmessagename != messagename: # then rename it
os.rename(os.path.join(tmpdir, tmpmessagename),
os.path.join(tmpdir, messagename))
if self.dofsync: if rtime != None:
try: os.utime(os.path.join(tmpdir, messagename), (rtime, rtime))
# fsync the directory (safer semantics in Linux)
fd = os.open(tmpdir, os.O_RDONLY)
os.fsync(fd)
os.close(fd)
except:
pass
self.messagelist[uid] = {'uid': uid, 'flags': [], self.messagelist[uid] = {'uid': uid, 'flags': [],
'filename': os.path.join(tmpdir, messagename)} 'filename': os.path.join('tmp', messagename)}
# savemessageflags moves msg to 'cur' or 'new' as appropriate
self.savemessageflags(uid, flags) self.savemessageflags(uid, flags)
self.ui.debug('maildir', 'savemessage: returning uid %d' % uid) self.ui.debug('maildir', 'savemessage: returning uid %d' % uid)
return uid return uid
@ -266,14 +263,14 @@ class MaildirFolder(BaseFolder):
def savemessageflags(self, uid, flags): def savemessageflags(self, uid, flags):
oldfilename = self.messagelist[uid]['filename'] oldfilename = self.messagelist[uid]['filename']
newpath, newname = os.path.split(oldfilename) dir_prefix, newname = os.path.split(oldfilename)
tmpdir = os.path.join(self.getfullname(), 'tmp') tmpdir = os.path.join(self.getfullname(), 'tmp')
if 'S' in flags: if 'S' in flags:
# If a message has been seen, it goes into the cur # If a message has been seen, it goes into the cur
# directory. CR debian#152482, [complete.org #4] # directory. CR debian#152482
newpath = os.path.join(self.getfullname(), 'cur') dir_prefix = 'cur'
else: else:
newpath = os.path.join(self.getfullname(), 'new') dir_prefix = 'new'
infostr = ':' infostr = ':'
infomatch = re.search('(:.*)$', newname) infomatch = re.search('(:.*)$', newname)
if infomatch: # If the info string is present.. if infomatch: # If the info string is present..
@ -284,15 +281,16 @@ class MaildirFolder(BaseFolder):
infostr += '2,' + ''.join(flags) infostr += '2,' + ''.join(flags)
newname += infostr newname += infostr
newfilename = os.path.join(newpath, newname) newfilename = os.path.join(dir_prefix, newname)
if (newfilename != oldfilename): if (newfilename != oldfilename):
os.rename(oldfilename, newfilename) os.rename(os.path.join(self.getfullname(), oldfilename),
os.path.join(self.getfullname(), newfilename))
self.messagelist[uid]['flags'] = flags self.messagelist[uid]['flags'] = flags
self.messagelist[uid]['filename'] = newfilename self.messagelist[uid]['filename'] = newfilename
# By now, the message had better not be in tmp/ land! # By now, the message had better not be in tmp/ land!
final_dir, final_name = os.path.split(self.messagelist[uid]['filename']) final_dir, final_name = os.path.split(self.messagelist[uid]['filename'])
assert final_dir != tmpdir assert final_dir != 'tmp'
def deletemessage(self, uid): def deletemessage(self, uid):
"""Unlinks a message file from the Maildir. """Unlinks a message file from the Maildir.
@ -306,13 +304,16 @@ class MaildirFolder(BaseFolder):
return return
filename = self.messagelist[uid]['filename'] filename = self.messagelist[uid]['filename']
filepath = os.path.join(self.getfullname(), filename)
try: try:
os.unlink(filename) os.unlink(filepath)
except OSError: except OSError:
# Can't find the file -- maybe already deleted? # Can't find the file -- maybe already deleted?
newmsglist = self._scanfolder() newmsglist = self._scanfolder()
if uid in newmsglist: # Nope, try new filename. if uid in newmsglist: # Nope, try new filename.
os.unlink(newmsglist[uid]['filename']) filename = newmsglist[uid]['filename']
filepath = os.path.join(self.getfullname(), filename)
os.unlink(filepath)
# Yep -- return. # Yep -- return.
del(self.messagelist[uid]) del(self.messagelist[uid])