12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151 |
- """Read/write support for Maildir, mbox, MH, Babyl, and MMDF mailboxes."""
- # Notes for authors of new mailbox subclasses:
- #
- # Remember to fsync() changes to disk before closing a modified file
- # or returning from a flush() method. See functions _sync_flush() and
- # _sync_close().
- import os
- import time
- import calendar
- import socket
- import errno
- import copy
- import warnings
- import email
- import email.message
- import email.generator
- import io
- import contextlib
- from types import GenericAlias
- try:
- import fcntl
- except ImportError:
- fcntl = None
# Public names of this module: the mailbox classes, their message classes,
# and the exception types.
__all__ = ['Mailbox', 'Maildir', 'mbox', 'MH', 'Babyl', 'MMDF',
           'Message', 'MaildirMessage', 'mboxMessage', 'MHMessage',
           'BabylMessage', 'MMDFMessage', 'Error', 'NoSuchMailboxError',
           'NotEmptyError', 'ExternalClashError', 'FormatError']

# The platform's line separator as bytes.  Messages are written to disk with
# b'\n' replaced by this value and converted back to b'\n' when read.
linesep = os.linesep.encode('ascii')
class Mailbox:
    """A group of messages in a particular place.

    This is the abstract base for all mailbox formats.  It provides a
    dict-like interface keyed by opaque message keys; the storage
    primitives (add, remove, __setitem__, get_message, get_bytes, get_file,
    iterkeys, __contains__, __len__, flush, lock, unlock, close) raise
    NotImplementedError here and must be supplied by subclasses.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a Mailbox instance.

        path is user-expanded and made absolute.  factory, when set, is
        called with a file-like object by __getitem__ to build each
        returned message.  create is accepted for subclasses; it is not
        used by this base initializer.
        """
        self._path = os.path.abspath(os.path.expanduser(path))
        self._factory = factory

    def add(self, message):
        """Add message and return assigned key."""
        raise NotImplementedError('Method must be implemented by subclass')

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __delitem__(self, key):
        """Remove the keyed message (same as remove())."""
        self.remove(key)

    def discard(self, key):
        """If the keyed message exists, remove it."""
        try:
            self.remove(key)
        except KeyError:
            pass

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get(self, key, default=None):
        """Return the keyed message, or default if it doesn't exist."""
        try:
            return self.__getitem__(key)
        except KeyError:
            return default

    def __getitem__(self, key):
        """Return the keyed message; raise KeyError if it doesn't exist."""
        if not self._factory:
            return self.get_message(key)
        else:
            # The factory consumes the file; make sure it is closed afterwards.
            with contextlib.closing(self.get_file(key)) as file:
                return self._factory(file)

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_string(self, key):
        """Return a string representation or raise a KeyError.

        Uses email.message.Message to create a 7bit clean string
        representation of the message."""
        return email.message_from_bytes(self.get_bytes(key)).as_string()

    def get_bytes(self, key):
        """Return a byte string representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def iterkeys(self):
        """Return an iterator over keys."""
        raise NotImplementedError('Method must be implemented by subclass')

    def keys(self):
        """Return a list of keys."""
        return list(self.iterkeys())

    def itervalues(self):
        """Return an iterator over all messages."""
        for key in self.iterkeys():
            try:
                value = self[key]
            except KeyError:
                # The message vanished between listing and fetching; skip it.
                continue
            yield value

    def __iter__(self):
        """Iterate over the messages (not the keys)."""
        return self.itervalues()

    def values(self):
        """Return a list of messages. Memory intensive."""
        return list(self.itervalues())

    def iteritems(self):
        """Return an iterator over (key, message) tuples."""
        for key in self.iterkeys():
            try:
                value = self[key]
            except KeyError:
                # The message vanished between listing and fetching; skip it.
                continue
            yield (key, value)

    def items(self):
        """Return a list of (key, message) tuples. Memory intensive."""
        return list(self.iteritems())

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __len__(self):
        """Return a count of messages in the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def clear(self):
        """Delete all messages."""
        # keys() materializes a list, so removal during the loop is safe.
        for key in self.keys():
            self.discard(key)

    def pop(self, key, default=None):
        """Delete the keyed message and return it, or default."""
        try:
            result = self[key]
        except KeyError:
            return default
        self.discard(key)
        return result

    def popitem(self):
        """Delete an arbitrary (key, message) pair and return it.

        Raises KeyError if the mailbox has no messages.
        """
        for key in self.iterkeys():
            return (key, self.pop(key))     # This is only run once.
        else:
            raise KeyError('No messages in mailbox')

    def update(self, arg=None):
        """Change the messages that correspond to certain keys.

        arg may be a mapping (anything with iteritems() or items()) or an
        iterable of (key, message) pairs.  Calling update() with no
        argument, or with None, does nothing.  Every pair is attempted;
        if any key is unknown a single KeyError is raised at the end.
        """
        if arg is None:
            # The default must not be iterated: nothing to update.
            return
        if hasattr(arg, 'iteritems'):
            source = arg.iteritems()
        elif hasattr(arg, 'items'):
            source = arg.items()
        else:
            source = arg
        bad_key = False
        for key, message in source:
            try:
                self[key] = message
            except KeyError:
                bad_key = True
        if bad_key:
            raise KeyError('No message with key(s)')

    def flush(self):
        """Write any pending changes to the disk."""
        raise NotImplementedError('Method must be implemented by subclass')

    def lock(self):
        """Lock the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        raise NotImplementedError('Method must be implemented by subclass')

    def close(self):
        """Flush and close the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def _string_to_bytes(self, message):
        """Encode an ASCII-only str to bytes; raise ValueError otherwise."""
        # If a message is not 7bit clean, we refuse to handle it since it
        # likely came from reading invalid messages in text mode, and that way
        # lies mojibake.
        try:
            return message.encode('ascii')
        except UnicodeError:
            raise ValueError("String input must be ASCII-only; "
                "use bytes or a Message instead")

    # Whether each message must end in a newline
    _append_newline = False

    def _dump_message(self, message, target, mangle_from_=False):
        # This assumes the target file is open in binary mode.
        """Dump message contents to target file.

        message may be an email.message.Message, a str, bytes, an
        io.StringIO (deprecated), or an object with read()/readline()
        (text-mode files are deprecated).  Newlines are converted to the
        platform linesep.  When mangle_from_ is true, lines starting with
        'From ' are escaped as '>From '.  Any other type raises TypeError.
        """
        if isinstance(message, email.message.Message):
            buffer = io.BytesIO()
            gen = email.generator.BytesGenerator(buffer, mangle_from_, 0)
            gen.flatten(message)
            buffer.seek(0)
            data = buffer.read()
            data = data.replace(b'\n', linesep)
            target.write(data)
            if self._append_newline and not data.endswith(linesep):
                # Make sure the message ends with a newline
                target.write(linesep)
        elif isinstance(message, (str, bytes, io.StringIO)):
            if isinstance(message, io.StringIO):
                warnings.warn("Use of StringIO input is deprecated, "
                    "use BytesIO instead", DeprecationWarning, 3)
                message = message.getvalue()
            if isinstance(message, str):
                message = self._string_to_bytes(message)
            if mangle_from_:
                message = message.replace(b'\nFrom ', b'\n>From ')
            message = message.replace(b'\n', linesep)
            target.write(message)
            if self._append_newline and not message.endswith(linesep):
                # Make sure the message ends with a newline
                target.write(linesep)
        elif hasattr(message, 'read'):
            if hasattr(message, 'buffer'):
                warnings.warn("Use of text mode files is deprecated, "
                    "use a binary mode file instead", DeprecationWarning, 3)
                message = message.buffer
            lastline = None
            while True:
                line = message.readline()
                # Universal newline support.
                if line.endswith(b'\r\n'):
                    line = line[:-2] + b'\n'
                elif line.endswith(b'\r'):
                    line = line[:-1] + b'\n'
                if not line:
                    break
                if mangle_from_ and line.startswith(b'From '):
                    line = b'>From ' + line[5:]
                line = line.replace(b'\n', linesep)
                target.write(line)
                lastline = line
            if self._append_newline and lastline and not lastline.endswith(linesep):
                # Make sure the message ends with a newline
                target.write(linesep)
        else:
            raise TypeError('Invalid message type: %s' % type(message))

    # Allow subscripting the class, e.g. Mailbox[SomeMessageType].
    __class_getitem__ = classmethod(GenericAlias)
class Maildir(Mailbox):
    """A qmail-style Maildir mailbox.

    Messages live as individual files under the 'tmp', 'new' and 'cur'
    subdirectories.  A table of contents (self._toc) maps each message's
    unique name (the file name up to the first `colon`) to its path
    relative to the mailbox directory.
    """

    # Separator between a message's unique name and its info suffix.
    colon = ':'

    def __init__(self, dirname, factory=None, create=True):
        """Initialize a Maildir instance.

        If dirname does not exist it is created together with its tmp/new/cur
        subdirectories when create is true; otherwise NoSuchMailboxError is
        raised.
        """
        Mailbox.__init__(self, dirname, factory, create)
        self._paths = {
            'tmp': os.path.join(self._path, 'tmp'),
            'new': os.path.join(self._path, 'new'),
            'cur': os.path.join(self._path, 'cur'),
            }
        if not os.path.exists(self._path):
            if create:
                os.mkdir(self._path, 0o700)
                for path in self._paths.values():
                    os.mkdir(path, 0o700)
            else:
                raise NoSuchMailboxError(self._path)
        self._toc = {}
        self._toc_mtimes = {'cur': 0, 'new': 0}
        self._last_read = 0         # Records last time we read cur/new
        self._skewfactor = 0.1      # Adjust if os/fs clocks are skewing

    def add(self, message):
        """Add message and return assigned key.

        The message is first written to a file in 'tmp', then linked (or
        renamed) into its final subdirectory.  Raises ExternalClashError if
        the destination name already exists.
        """
        tmp_file = self._create_tmp()
        try:
            self._dump_message(message, tmp_file)
        except BaseException:
            # Do not leave a partially written file behind.
            tmp_file.close()
            os.remove(tmp_file.name)
            raise
        _sync_close(tmp_file)
        if isinstance(message, MaildirMessage):
            subdir = message.get_subdir()
            suffix = self.colon + message.get_info()
            if suffix == self.colon:
                suffix = ''
        else:
            subdir = 'new'
            suffix = ''
        uniq = os.path.basename(tmp_file.name).split(self.colon)[0]
        dest = os.path.join(self._path, subdir, uniq + suffix)
        if isinstance(message, MaildirMessage):
            os.utime(tmp_file.name,
                     (os.path.getatime(tmp_file.name), message.get_date()))
        # No file modification should be done after the file is moved to its
        # final position in order to prevent race conditions with changes
        # from other programs
        try:
            try:
                os.link(tmp_file.name, dest)
            except (AttributeError, PermissionError):
                # Hard links unavailable or not permitted: rename instead.
                os.rename(tmp_file.name, dest)
            else:
                os.remove(tmp_file.name)
        except OSError as e:
            os.remove(tmp_file.name)
            if e.errno == errno.EEXIST:
                raise ExternalClashError('Name clash with existing message: %s'
                                         % dest)
            else:
                raise
        return uniq

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        os.remove(os.path.join(self._path, self._lookup(key)))

    def discard(self, key):
        """If the keyed message exists, remove it."""
        # This overrides an inapplicable implementation in the superclass.
        try:
            self.remove(key)
        except (KeyError, FileNotFoundError):
            pass

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist.

        The replacement is added under a temporary key, the old file is
        discarded, and the new file is renamed to carry the original key.
        """
        old_subpath = self._lookup(key)
        temp_key = self.add(message)
        temp_subpath = self._lookup(temp_key)
        if isinstance(message, MaildirMessage):
            # temp's subdir and suffix were specified by message.
            dominant_subpath = temp_subpath
        else:
            # temp's subdir and suffix were defaults from add().
            dominant_subpath = old_subpath
        subdir = os.path.dirname(dominant_subpath)
        if self.colon in dominant_subpath:
            suffix = self.colon + dominant_subpath.split(self.colon)[-1]
        else:
            suffix = ''
        self.discard(key)
        tmp_path = os.path.join(self._path, temp_subpath)
        new_path = os.path.join(self._path, subdir, key + suffix)
        if isinstance(message, MaildirMessage):
            os.utime(tmp_path,
                     (os.path.getatime(tmp_path), message.get_date()))
        # No file modification should be done after the file is moved to its
        # final position in order to prevent race conditions with changes
        # from other programs
        os.rename(tmp_path, new_path)

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The message's subdir, info (if the file name has one) and date (the
        file's mtime) are set from the file on disk.
        """
        subpath = self._lookup(key)
        with open(os.path.join(self._path, subpath), 'rb') as f:
            if self._factory:
                msg = self._factory(f)
            else:
                msg = MaildirMessage(f)
        subdir, name = os.path.split(subpath)
        msg.set_subdir(subdir)
        if self.colon in name:
            msg.set_info(name.split(self.colon)[-1])
        msg.set_date(os.path.getmtime(os.path.join(self._path, subpath)))
        return msg

    def get_bytes(self, key):
        """Return a bytes representation or raise a KeyError."""
        with open(os.path.join(self._path, self._lookup(key)), 'rb') as f:
            return f.read().replace(linesep, b'\n')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        f = open(os.path.join(self._path, self._lookup(key)), 'rb')
        return _ProxyFile(f)

    def iterkeys(self):
        """Return an iterator over keys."""
        self._refresh()
        for key in self._toc:
            try:
                self._lookup(key)
            except KeyError:
                # Listed in the TOC but no longer resolvable; skip it.
                continue
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._refresh()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._refresh()
        return len(self._toc)

    def flush(self):
        """Write any pending changes to disk."""
        # Maildir changes are always written immediately, so there's nothing
        # to do.
        pass

    def lock(self):
        """Lock the mailbox (a no-op in this class)."""
        return

    def unlock(self):
        """Unlock the mailbox if it is locked (a no-op in this class)."""
        return

    def close(self):
        """Flush and close the mailbox (a no-op in this class)."""
        return

    def list_folders(self):
        """Return a list of folder names.

        A folder is a subdirectory whose name starts with '.' and is longer
        than one character; the leading dot is stripped from the result.
        """
        result = []
        for entry in os.listdir(self._path):
            if len(entry) > 1 and entry[0] == '.' and \
               os.path.isdir(os.path.join(self._path, entry)):
                result.append(entry[1:])
        return result

    def get_folder(self, folder):
        """Return a Maildir instance for the named folder."""
        return Maildir(os.path.join(self._path, '.' + folder),
                       factory=self._factory,
                       create=False)

    def add_folder(self, folder):
        """Create a folder and return a Maildir instance representing it."""
        path = os.path.join(self._path, '.' + folder)
        result = Maildir(path, factory=self._factory)
        maildirfolder_path = os.path.join(path, 'maildirfolder')
        if not os.path.exists(maildirfolder_path):
            # Create an empty 'maildirfolder' marker file.
            os.close(os.open(maildirfolder_path, os.O_CREAT | os.O_WRONLY,
                0o666))
        return result

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        Raises NotEmptyError if 'new' or 'cur' holds any entry not starting
        with '.', or if the folder contains a directory other than
        new/cur/tmp.
        """
        path = os.path.join(self._path, '.' + folder)
        for entry in os.listdir(os.path.join(path, 'new')) + \
                     os.listdir(os.path.join(path, 'cur')):
            if len(entry) < 1 or entry[0] != '.':
                raise NotEmptyError('Folder contains message(s): %s' % folder)
        for entry in os.listdir(path):
            if entry != 'new' and entry != 'cur' and entry != 'tmp' and \
               os.path.isdir(os.path.join(path, entry)):
                # Name the offending subdirectory first, then the folder.
                raise NotEmptyError("Folder contains subdirectory '%s': %s" %
                                    (entry, folder))
        # Bottom-up walk so directories are empty by the time they are removed.
        for root, dirs, files in os.walk(path, topdown=False):
            for entry in files:
                os.remove(os.path.join(root, entry))
            for entry in dirs:
                os.rmdir(os.path.join(root, entry))
        os.rmdir(path)

    def clean(self):
        """Delete old files in "tmp".

        A file is removed when its access time is more than 36 hours old.
        """
        now = time.time()
        for entry in os.listdir(os.path.join(self._path, 'tmp')):
            path = os.path.join(self._path, 'tmp', entry)
            if now - os.path.getatime(path) > 129600:   # 60 * 60 * 36
                os.remove(path)

    _count = 1  # This is used to generate unique file names.

    def _create_tmp(self):
        """Create a file in the tmp subdirectory and open and return it.

        Raises ExternalClashError if the generated name already exists.
        """
        now = time.time()
        hostname = socket.gethostname()
        # '/' and ':' are replaced by their octal escapes in the file name.
        if '/' in hostname:
            hostname = hostname.replace('/', r'\057')
        if ':' in hostname:
            hostname = hostname.replace(':', r'\072')
        uniq = "%s.M%sP%sQ%s.%s" % (int(now), int(now % 1 * 1e6), os.getpid(),
                                    Maildir._count, hostname)
        path = os.path.join(self._path, 'tmp', uniq)
        try:
            os.stat(path)
        except FileNotFoundError:
            Maildir._count += 1
            try:
                return _create_carefully(path)
            except FileExistsError:
                pass

        # Fall through to here if stat succeeded or open raised EEXIST.
        raise ExternalClashError('Name clash prevented file creation: %s' %
                                 path)

    def _refresh(self):
        """Update table of contents mapping."""
        # If it has been less than two seconds since the last _refresh() call,
        # we have to unconditionally re-read the mailbox just in case it has
        # been modified, because os.path.mtime() has a 2 sec resolution in the
        # most common worst case (FAT) and a 1 sec resolution typically.  This
        # results in a few unnecessary re-reads when _refresh() is called
        # multiple times in that interval, but once the clock ticks over, we
        # will only re-read as needed.  Because the filesystem might be being
        # served by an independent system with its own clock, we record and
        # compare with the mtimes from the filesystem.  Because the other
        # system's clock might be skewing relative to our clock, we add an
        # extra delta to our wait.  The default is one tenth second, but is an
        # instance variable and so can be adjusted if dealing with a
        # particularly skewed or irregular system.
        if time.time() - self._last_read > 2 + self._skewfactor:
            refresh = False
            for subdir in self._toc_mtimes:
                mtime = os.path.getmtime(self._paths[subdir])
                if mtime > self._toc_mtimes[subdir]:
                    refresh = True
                self._toc_mtimes[subdir] = mtime
            if not refresh:
                return
        # Refresh toc
        self._toc = {}
        for subdir in self._toc_mtimes:
            path = self._paths[subdir]
            for entry in os.listdir(path):
                p = os.path.join(path, entry)
                if os.path.isdir(p):
                    continue
                uniq = entry.split(self.colon)[0]
                self._toc[uniq] = os.path.join(subdir, entry)
        self._last_read = time.time()

    def _lookup(self, key):
        """Use TOC to return subpath for given key, or raise a KeyError."""
        try:
            # Fast path: the cached entry still exists on disk.
            if os.path.exists(os.path.join(self._path, self._toc[key])):
                return self._toc[key]
        except KeyError:
            pass
        self._refresh()
        try:
            return self._toc[key]
        except KeyError:
            raise KeyError('No message with key: %s' % key) from None

    # This method is for backward compatibility only.
    def next(self):
        """Return the next message in a one-time iteration.

        Returns None once the keys are exhausted.
        """
        if not hasattr(self, '_onetime_keys'):
            self._onetime_keys = self.iterkeys()
        while True:
            try:
                return self[next(self._onetime_keys)]
            except StopIteration:
                return None
            except KeyError:
                continue
class _singlefileMailbox(Mailbox):
    """A single-file mailbox.

    Messages are stored back to back in one file.  self._toc maps integer
    keys to (start, stop) byte offsets and is built on demand by the
    subclass's _generate_toc().  Subclasses also supply _install_message().
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a single-file mailbox.

        The file is opened read/write.  If it does not exist it is created
        when create is true, otherwise NoSuchMailboxError is raised.  On
        EACCES or EROFS the file is opened read-only instead.
        """
        Mailbox.__init__(self, path, factory, create)
        try:
            f = open(self._path, 'rb+')
        except OSError as e:
            if e.errno == errno.ENOENT:
                if create:
                    f = open(self._path, 'wb+')
                else:
                    raise NoSuchMailboxError(self._path)
            elif e.errno in (errno.EACCES, errno.EROFS):
                f = open(self._path, 'rb')
            else:
                raise
        self._file = f
        self._toc = None
        self._next_key = 0
        self._pending = False       # No changes require rewriting the file.
        self._pending_sync = False  # No need to sync the file
        self._locked = False
        self._file_length = None    # Used to record mailbox size

    def add(self, message):
        """Add message and return assigned key."""
        self._lookup()
        self._toc[self._next_key] = self._append_message(message)
        self._next_key += 1
        # _append_message appends the message to the mailbox file. We
        # don't need a full rewrite + rename, sync is enough.
        self._pending_sync = True
        return self._next_key - 1

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        del self._toc[key]
        self._pending = True

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        self._toc[key] = self._append_message(message)
        self._pending = True

    def iterkeys(self):
        """Return an iterator over keys."""
        self._lookup()
        yield from self._toc.keys()

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._lookup()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._lookup()
        return len(self._toc)

    def lock(self):
        """Lock the mailbox."""
        if not self._locked:
            _lock_file(self._file)
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            self._locked = False

    def flush(self):
        """Write any pending changes to disk.

        If messages were only appended, the file is just synced.  Otherwise
        the surviving messages are copied to a temporary file which then
        replaces the mailbox file.  Raises ExternalClashError if the mailbox
        file's size differs from the size recorded by this instance.
        """
        if not self._pending:
            if self._pending_sync:
                # Messages have only been added, so syncing the file
                # is enough.
                _sync_flush(self._file)
                self._pending_sync = False
            return

        # In order to be writing anything out at all, self._toc must
        # already have been generated (and presumably has been modified
        # by adding or deleting an item).
        assert self._toc is not None

        # Check length of self._file; if it's changed, some other process
        # has modified the mailbox since we scanned it.
        self._file.seek(0, 2)
        cur_len = self._file.tell()
        if cur_len != self._file_length:
            raise ExternalClashError('Size of mailbox file changed '
                                     '(expected %i, found %i)' %
                                     (self._file_length, cur_len))

        new_file = _create_temporary(self._path)
        try:
            new_toc = {}
            self._pre_mailbox_hook(new_file)
            for key in sorted(self._toc.keys()):
                start, stop = self._toc[key]
                self._file.seek(start)
                self._pre_message_hook(new_file)
                new_start = new_file.tell()
                # Copy the message in chunks of at most 4096 bytes.
                while True:
                    buffer = self._file.read(min(4096,
                                                 stop - self._file.tell()))
                    if not buffer:
                        break
                    new_file.write(buffer)
                new_toc[key] = (new_start, new_file.tell())
                self._post_message_hook(new_file)
            self._file_length = new_file.tell()
        except BaseException:
            # Clean up the temporary file on any failure, then re-raise.
            new_file.close()
            os.remove(new_file.name)
            raise
        _sync_close(new_file)
        # self._file is about to get replaced, so no need to sync.
        self._file.close()
        # Make sure the new file's mode is the same as the old file's
        mode = os.stat(self._path).st_mode
        os.chmod(new_file.name, mode)
        try:
            os.rename(new_file.name, self._path)
        except FileExistsError:
            # rename() refused to overwrite: remove the old file first.
            os.remove(self._path)
            os.rename(new_file.name, self._path)
        self._file = open(self._path, 'rb+')
        self._toc = new_toc
        self._pending = False
        self._pending_sync = False
        if self._locked:
            # Re-acquire the lock on the newly opened file object.
            _lock_file(self._file, dotlock=False)

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        return

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        return

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        return

    def close(self):
        """Flush and close the mailbox.

        The file is closed, and the lock released if held, even when
        flush() raises.
        """
        try:
            self.flush()
        finally:
            try:
                if self._locked:
                    self.unlock()
            finally:
                self._file.close()  # Sync has been done by self.flush() above.

    def _lookup(self, key=None):
        """Return (start, stop) or raise KeyError.

        Generates the table of contents first if needed.  With key=None,
        only that generation step is performed and None is returned.
        """
        if self._toc is None:
            self._generate_toc()
        if key is not None:
            try:
                return self._toc[key]
            except KeyError:
                raise KeyError('No message with key: %s' % key) from None

    def _append_message(self, message):
        """Append message to mailbox and return (start, stop) offsets.

        If writing fails, the file is truncated back to its previous length
        and the exception is re-raised.
        """
        self._file.seek(0, 2)
        before = self._file.tell()
        if len(self._toc) == 0 and not self._pending:
            # This is the first message, and the _pre_mailbox_hook
            # hasn't yet been called. If self._pending is True,
            # messages have been removed, so _pre_mailbox_hook must
            # have been called already.
            self._pre_mailbox_hook(self._file)
        try:
            self._pre_message_hook(self._file)
            offsets = self._install_message(message)
            self._post_message_hook(self._file)
        except BaseException:
            self._file.truncate(before)
            raise
        self._file.flush()
        self._file_length = self._file.tell()  # Record current length of mailbox
        return offsets
class _mboxMMDF(_singlefileMailbox):
    """An mbox or MMDF mailbox.

    Each stored message begins with a "From " envelope line followed by
    the message itself.
    """

    _mangle_from_ = True

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The envelope line (minus its leading "From ") becomes the message's
        "from" value.
        """
        begin, end = self._lookup(key)
        self._file.seek(begin)
        envelope = self._file.readline().replace(linesep, b'')
        body_length = end - self._file.tell()
        raw_body = self._file.read(body_length)
        msg = self._message_factory(raw_body.replace(linesep, b'\n'))
        sender = envelope[5:].decode('ascii')
        msg.set_from(sender)
        return msg

    def get_string(self, key, from_=False):
        """Return a string representation or raise a KeyError."""
        raw = self.get_bytes(key, from_)
        parsed = email.message_from_bytes(raw)
        return parsed.as_string(unixfrom=from_)

    def get_bytes(self, key, from_=False):
        """Return a bytes representation or raise a KeyError.

        The envelope line is included only when from_ is true.
        """
        begin, end = self._lookup(key)
        self._file.seek(begin)
        if not from_:
            # Skip over the envelope line.
            self._file.readline()
        remaining = end - self._file.tell()
        return self._file.read(remaining).replace(linesep, b'\n')

    def get_file(self, key, from_=False):
        """Return a file-like representation or raise a KeyError.

        The envelope line is included only when from_ is true.
        """
        begin, end = self._lookup(key)
        self._file.seek(begin)
        if not from_:
            # Skip over the envelope line.
            self._file.readline()
        position = self._file.tell()
        return _PartialFile(self._file, position, end)

    def _install_message(self, message):
        """Format a message and blindly write to self._file.

        Returns the (start, stop) offsets of what was written, envelope
        line included.
        """
        if isinstance(message, str):
            message = self._string_to_bytes(message)

        envelope = None
        if isinstance(message, bytes) and message.startswith(b'From '):
            # The first line is the envelope; the rest is the message.
            envelope, _, message = message.partition(b'\n')
        elif isinstance(message, _mboxMMDFMessage):
            envelope = b'From ' + message.get_from().encode('ascii')
        elif isinstance(message, email.message.Message):
            unixfrom = message.get_unixfrom()   # May be None.
            if unixfrom is not None:
                envelope = unixfrom.encode('ascii')

        if envelope is None:
            # No envelope available: synthesize one stamped with the
            # current UTC time.
            stamp = time.asctime(time.gmtime())
            envelope = b'From MAILER-DAEMON ' + stamp.encode()

        begin = self._file.tell()
        self._file.write(envelope + linesep)
        self._dump_message(message, self._file, self._mangle_from_)
        return (begin, self._file.tell())
class mbox(_mboxMMDF):
    """A classic mbox mailbox."""

    _mangle_from_ = True

    # All messages must end in a newline character, and
    # _post_message_hooks outputs an empty line between messages.
    _append_newline = True

    def __init__(self, path, factory=None, create=True):
        """Initialize an mbox mailbox."""
        # The factory must be in place before the base initializer runs.
        self._message_factory = mboxMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(linesep)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        begins, ends = [], []
        prev_blank = False
        sep_len = len(linesep)
        self._file.seek(0)
        while True:
            pos = self._file.tell()
            line = self._file.readline()
            if not line:
                # End of file: close the final entry, leaving out a trailing
                # blank separator line if there was one.
                ends.append(pos - sep_len if prev_blank else pos)
                break
            if line.startswith(b'From '):
                if len(ends) < len(begins):
                    # A "From " line that does not follow a blank line is
                    # still treated as the start of a new message.
                    ends.append(pos - sep_len if prev_blank else pos)
                begins.append(pos)
                prev_blank = False
            else:
                prev_blank = (line == linesep)
        self._toc = dict(enumerate(zip(begins, ends)))
        self._next_key = len(self._toc)
        self._file_length = self._file.tell()
class MMDF(_mboxMMDF):
    """An MMDF mailbox."""

    def __init__(self, path, factory=None, create=True):
        """Initialize an MMDF mailbox."""
        # The factory must be in place before the base initializer runs.
        self._message_factory = MMDFMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write(b'\001\001\001\001' + linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(linesep + b'\001\001\001\001' + linesep)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        marker = b'\001\001\001\001' + linesep
        sep_len = len(linesep)
        begins, ends = [], []
        self._file.seek(0)
        cursor = 0
        while True:
            line = self._file.readline()
            cursor = self._file.tell()
            if not line:
                break
            if not line.startswith(marker):
                continue
            # An opening marker: the message begins right after it.
            begins.append(cursor)
            while True:
                line_start = cursor
                line = self._file.readline()
                cursor = self._file.tell()
                if line == marker:
                    # Closing marker; leave out the line separator that
                    # precedes it.
                    ends.append(line_start - sep_len)
                    break
                if not line:
                    # File ended before a closing marker was seen.
                    ends.append(line_start)
                    break
        self._toc = dict(enumerate(zip(begins, ends)))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()
class MH(Mailbox):
    """An MH mailbox.

    Each message is a file named by its integer key inside the mailbox
    directory; sequences are kept in the '.mh_sequences' file there.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize an MH instance.

        Creates the directory and an empty '.mh_sequences' file when the
        path does not exist and create is true; raises NoSuchMailboxError
        when it does not exist and create is false.
        """
        Mailbox.__init__(self, path, factory, create)
        if not os.path.exists(self._path):
            if create:
                os.mkdir(self._path, 0o700)
                os.close(os.open(os.path.join(self._path, '.mh_sequences'),
                                 os.O_CREAT | os.O_EXCL | os.O_WRONLY, 0o600))
            else:
                raise NoSuchMailboxError(self._path)
        self._locked = False

    def _open_message(self, key, mode):
        """Open the file for message key; raise KeyError if it is missing."""
        try:
            return open(os.path.join(self._path, str(key)), mode)
        except OSError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise

    def add(self, message):
        """Add message and return assigned key."""
        keys = self.keys()
        # New keys continue after the largest existing one.
        if len(keys) == 0:
            new_key = 1
        else:
            new_key = max(keys) + 1
        new_path = os.path.join(self._path, str(new_key))
        f = _create_carefully(new_path)
        closed = False
        try:
            if self._locked:
                _lock_file(f)
            try:
                try:
                    self._dump_message(message, f)
                except BaseException:
                    # Unlock and close so it can be deleted on Windows
                    if self._locked:
                        _unlock_file(f)
                    _sync_close(f)
                    closed = True
                    os.remove(new_path)
                    raise
                if isinstance(message, MHMessage):
                    self._dump_sequences(message, new_key)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            if not closed:
                _sync_close(f)
        return new_key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        path = os.path.join(self._path, str(key))
        # Opening read/write first turns a missing file into KeyError.
        self._open_message(key, 'rb+').close()
        os.remove(path)

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        path = os.path.join(self._path, str(key))
        f = self._open_message(key, 'rb+')
        try:
            if self._locked:
                _lock_file(f)
            try:
                # Truncate through a second descriptor, then rewrite via f.
                os.close(os.open(path, os.O_WRONLY | os.O_TRUNC))
                self._dump_message(message, f)
                if isinstance(message, MHMessage):
                    self._dump_sequences(message, key)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            _sync_close(f)

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        # A locked mailbox opens the file read/write before locking it.
        f = self._open_message(key, 'rb+' if self._locked else 'rb')
        with f:
            if self._locked:
                _lock_file(f)
            try:
                msg = MHMessage(f)
            finally:
                if self._locked:
                    _unlock_file(f)
        for name, key_list in self.get_sequences().items():
            if key in key_list:
                msg.add_sequence(name)
        return msg

    def get_bytes(self, key):
        """Return a bytes representation or raise a KeyError."""
        # A locked mailbox opens the file read/write before locking it.
        f = self._open_message(key, 'rb+' if self._locked else 'rb')
        with f:
            if self._locked:
                _lock_file(f)
            try:
                return f.read().replace(linesep, b'\n')
            finally:
                if self._locked:
                    _unlock_file(f)

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        return _ProxyFile(self._open_message(key, 'rb'))

    def iterkeys(self):
        """Return an iterator over keys."""
        return iter(sorted(int(entry) for entry in os.listdir(self._path)
                           if entry.isdigit()))

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        return os.path.exists(os.path.join(self._path, str(key)))

    def __len__(self):
        """Return a count of messages in the mailbox."""
        return len(list(self.iterkeys()))

    def lock(self):
        """Lock the mailbox."""
        if not self._locked:
            f = open(os.path.join(self._path, '.mh_sequences'), 'rb+')
            try:
                _lock_file(f)
            except BaseException:
                # Do not leak the handle when the lock cannot be taken.
                f.close()
                raise
            self._file = f
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            _sync_close(self._file)
            del self._file
            self._locked = False

    def flush(self):
        """Write any pending changes to the disk."""
        return

    def close(self):
        """Flush and close the mailbox."""
        if self._locked:
            self.unlock()

    def list_folders(self):
        """Return a list of folder names."""
        return [entry for entry in os.listdir(self._path)
                if os.path.isdir(os.path.join(self._path, entry))]

    def get_folder(self, folder):
        """Return an MH instance for the named folder."""
        return MH(os.path.join(self._path, folder),
                  factory=self._factory, create=False)

    def add_folder(self, folder):
        """Create a folder and return an MH instance representing it."""
        return MH(os.path.join(self._path, folder),
                  factory=self._factory)

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        A folder holding only its '.mh_sequences' file counts as empty.
        Raises NotEmptyError otherwise.
        """
        path = os.path.join(self._path, folder)
        entries = os.listdir(path)
        if entries == ['.mh_sequences']:
            os.remove(os.path.join(path, '.mh_sequences'))
        elif entries == []:
            pass
        else:
            # Report the folder being removed, not the parent mailbox.
            raise NotEmptyError('Folder not empty: %s' % path)
        os.rmdir(path)

    def get_sequences(self):
        """Return a name-to-key-list dictionary to define each sequence.

        Keys with no message file are dropped, as are sequences left empty.
        Raises FormatError for a line that cannot be parsed.
        """
        results = {}
        with open(os.path.join(self._path, '.mh_sequences'), 'r', encoding='ASCII') as f:
            all_keys = set(self.keys())
            for line in f:
                try:
                    name, contents = line.split(':')
                    keys = set()
                    for spec in contents.split():
                        if spec.isdigit():
                            keys.add(int(spec))
                        else:
                            # Anything else must be a 'start-stop' range.
                            start, stop = (int(x) for x in spec.split('-'))
                            keys.update(range(start, stop + 1))
                    results[name] = [key for key in sorted(keys)
                                     if key in all_keys]
                    if len(results[name]) == 0:
                        del results[name]
                except ValueError:
                    raise FormatError('Invalid sequence specification: %s' %
                                      line.rstrip())
        return results

    def set_sequences(self, sequences):
        """Set sequences using the given name-to-key-list dictionary.

        Runs of consecutive keys are written as 'first-last'; sequences
        with no keys are omitted.
        """
        f = open(os.path.join(self._path, '.mh_sequences'), 'r+', encoding='ASCII')
        try:
            # Truncate through a second descriptor, then rewrite via f.
            os.close(os.open(f.name, os.O_WRONLY | os.O_TRUNC))
            for name, keys in sequences.items():
                if len(keys) == 0:
                    continue
                f.write(name + ':')
                prev = None
                completing = False  # True while inside an open 'a-' range.
                for key in sorted(set(keys)):
                    if key - 1 == prev:
                        if not completing:
                            completing = True
                            f.write('-')
                    elif completing:
                        # The run ended at prev; close it and emit key.
                        completing = False
                        f.write('%s %s' % (prev, key))
                    else:
                        f.write(' %s' % key)
                    prev = key
                if completing:
                    f.write(str(prev) + '\n')
                else:
                    f.write('\n')
        finally:
            _sync_close(f)

    def pack(self):
        """Re-name messages to eliminate numbering gaps.  Invalidates keys."""
        sequences = self.get_sequences()
        prev = 0
        changes = []
        for key in self.iterkeys():
            if key - 1 != prev:
                changes.append((key, prev + 1))
                try:
                    os.link(os.path.join(self._path, str(key)),
                            os.path.join(self._path, str(prev + 1)))
                except (AttributeError, PermissionError):
                    # Hard links unavailable or refused: rename instead.
                    os.rename(os.path.join(self._path, str(key)),
                              os.path.join(self._path, str(prev + 1)))
                else:
                    os.unlink(os.path.join(self._path, str(key)))
            prev += 1
        self._next_key = prev + 1
        if len(changes) == 0:
            return
        # Rewrite the sequences so they refer to the renumbered messages.
        for name, key_list in sequences.items():
            for old, new in changes:
                if old in key_list:
                    key_list[key_list.index(old)] = new
        self.set_sequences(sequences)

    def _dump_sequences(self, message, key):
        """Inspect a new MHMessage and update sequences appropriately."""
        pending_sequences = message.get_sequences()
        all_sequences = self.get_sequences()
        for name, key_list in all_sequences.items():
            if name in pending_sequences:
                key_list.append(key)
            elif key in key_list:
                # The message no longer belongs to this sequence.
                del key_list[key_list.index(key)]
        for sequence in pending_sequences:
            if sequence not in all_sequences:
                all_sequences[sequence] = [key]
        self.set_sequences(all_sequences)
class Babyl(_singlefileMailbox):
    """An Rmail-style Babyl mailbox."""

    _special_labels = frozenset({'unseen', 'deleted', 'filed', 'answered',
                                 'forwarded', 'edited', 'resent'})

    def __init__(self, path, factory=None, create=True):
        """Initialize a Babyl mailbox."""
        _singlefileMailbox.__init__(self, path, factory, create)
        # Maps message key -> list of labels for that message.
        self._labels = {}

    def add(self, message):
        """Add message and return assigned key."""
        key = _singlefileMailbox.add(self, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()
        return key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.remove(self, key)
        if key in self._labels:
            del self._labels[key]

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.__setitem__(self, key, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip b'1,' line specifying labels.
        # Original headers run up to the b'*** EOOH ***' line.
        original_headers = io.BytesIO()
        while True:
            line = self._file.readline()
            if line == b'*** EOOH ***' + linesep or not line:
                break
            original_headers.write(line.replace(linesep, b'\n'))
        # Visible headers follow and end at the first blank line.
        visible_headers = io.BytesIO()
        while True:
            line = self._file.readline()
            if line == linesep or not line:
                break
            visible_headers.write(line.replace(linesep, b'\n'))
        # Read up to the stop, or to the end
        n = stop - self._file.tell()
        assert n >= 0
        body = self._file.read(n)
        body = body.replace(linesep, b'\n')
        msg = BabylMessage(original_headers.getvalue() + body)
        msg.set_visible(visible_headers.getvalue())
        if key in self._labels:
            msg.set_labels(self._labels[key])
        return msg

    def get_bytes(self, key):
        """Return a bytes representation or raise a KeyError.

        The result is the original headers followed by the body; the
        visible-header section is skipped.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip b'1,' line specifying labels.
        original_headers = io.BytesIO()
        while True:
            line = self._file.readline()
            if line == b'*** EOOH ***' + linesep or not line:
                break
            original_headers.write(line.replace(linesep, b'\n'))
        # Discard the visible headers, up to the first blank line.
        while True:
            line = self._file.readline()
            if line == linesep or not line:
                break
        headers = original_headers.getvalue()
        n = stop - self._file.tell()
        assert n >= 0
        data = self._file.read(n)
        data = data.replace(linesep, b'\n')
        return headers + data

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        return io.BytesIO(self.get_bytes(key).replace(b'\n', linesep))

    def get_labels(self):
        """Return a list of user-defined labels in the mailbox."""
        self._lookup()
        labels = set()
        for label_list in self._labels.values():
            labels.update(label_list)
        # Special labels are not user-defined, so leave them out.
        labels.difference_update(self._special_labels)
        return list(labels)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        starts, stops = [], []
        self._file.seek(0)
        next_pos = 0
        label_lists = []
        while True:
            line_pos = next_pos
            line = self._file.readline()
            next_pos = self._file.tell()
            if line == b'\037\014' + linesep:
                # End of the previous message (if any) and start of a new
                # one; the line that follows carries the labels.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(linesep))
                starts.append(next_pos)
                labels = [label.strip() for label
                          in self._file.readline()[1:].split(b',')
                          if label.strip()]
                label_lists.append(labels)
            elif line == b'\037' or line == b'\037' + linesep:
                # Terminator with no following message.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(linesep))
            elif not line:
                stops.append(line_pos - len(linesep))
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._labels = dict(enumerate(label_lists))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        babyl = b'BABYL OPTIONS:' + linesep
        babyl += b'Version: 5' + linesep
        labels = self.get_labels()
        labels = (label.encode() for label in labels)
        babyl += b'Labels:' + b','.join(labels) + linesep
        babyl += b'\037'
        f.write(babyl)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write(b'\014' + linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(linesep + b'\037')

    def _install_message(self, message):
        """Write message contents and return (start, stop).

        Written in order: the label line, the original headers, the
        b'*** EOOH ***' marker, the visible headers, then the body.
        Raises TypeError for an unsupported message type.
        """
        start = self._file.tell()
        if isinstance(message, BabylMessage):
            special_labels = []
            labels = []
            for label in message.get_labels():
                if label in self._special_labels:
                    special_labels.append(label)
                else:
                    labels.append(label)
            # Label line: special labels, then ',,', then the other labels.
            self._file.write(b'1')
            for label in special_labels:
                self._file.write(b', ' + label.encode())
            self._file.write(b',,')
            for label in labels:
                self._file.write(b' ' + label.encode() + b',')
            self._file.write(linesep)
        else:
            self._file.write(b'1,,' + linesep)
        if isinstance(message, email.message.Message):
            orig_buffer = io.BytesIO()
            orig_generator = email.generator.BytesGenerator(orig_buffer, False, 0)
            orig_generator.flatten(message)
            orig_buffer.seek(0)
            # Original headers, through the blank line that ends them.
            while True:
                line = orig_buffer.readline()
                self._file.write(line.replace(b'\n', linesep))
                if line == b'\n' or not line:
                    break
            self._file.write(b'*** EOOH ***' + linesep)
            if isinstance(message, BabylMessage):
                vis_buffer = io.BytesIO()
                vis_generator = email.generator.BytesGenerator(vis_buffer, False, 0)
                vis_generator.flatten(message.get_visible())
                # Rewind before reading: flatten() leaves the position at
                # the end, so without this nothing would be copied and the
                # visible-header section would lack its blank terminator.
                vis_buffer.seek(0)
                while True:
                    line = vis_buffer.readline()
                    self._file.write(line.replace(b'\n', linesep))
                    if line == b'\n' or not line:
                        break
            else:
                # No separate visible headers: repeat the original ones.
                orig_buffer.seek(0)
                while True:
                    line = orig_buffer.readline()
                    self._file.write(line.replace(b'\n', linesep))
                    if line == b'\n' or not line:
                        break
            # Whatever is left in orig_buffer is the body.
            while True:
                buffer = orig_buffer.read(4096) # Buffer size is arbitrary.
                if not buffer:
                    break
                self._file.write(buffer.replace(b'\n', linesep))
        elif isinstance(message, (bytes, str, io.StringIO)):
            if isinstance(message, io.StringIO):
                warnings.warn("Use of StringIO input is deprecated, "
                    "use BytesIO instead", DeprecationWarning, 3)
                message = message.getvalue()
            if isinstance(message, str):
                message = self._string_to_bytes(message)
            body_start = message.find(b'\n\n') + 2
            if body_start - 2 != -1:
                # Headers are written twice: as original and as visible.
                self._file.write(message[:body_start].replace(b'\n', linesep))
                self._file.write(b'*** EOOH ***' + linesep)
                self._file.write(message[:body_start].replace(b'\n', linesep))
                self._file.write(message[body_start:].replace(b'\n', linesep))
            else:
                # No blank line found: treat the whole input as the body.
                self._file.write(b'*** EOOH ***' + linesep + linesep)
                self._file.write(message.replace(b'\n', linesep))
        elif hasattr(message, 'readline'):
            if hasattr(message, 'buffer'):
                warnings.warn("Use of text mode files is deprecated, "
                    "use a binary mode file instead", DeprecationWarning, 3)
                message = message.buffer
            original_pos = message.tell()
            first_pass = True
            # Two passes over the headers: original first, then visible.
            while True:
                line = message.readline()
                # Universal newline support.
                if line.endswith(b'\r\n'):
                    line = line[:-2] + b'\n'
                elif line.endswith(b'\r'):
                    line = line[:-1] + b'\n'
                self._file.write(line.replace(b'\n', linesep))
                if line == b'\n' or not line:
                    if first_pass:
                        first_pass = False
                        self._file.write(b'*** EOOH ***' + linesep)
                        message.seek(original_pos)
                    else:
                        break
            while True:
                line = message.readline()
                if not line:
                    break
                # Universal newline support.
                if line.endswith(b'\r\n'):
                    line = line[:-2] + linesep
                elif line.endswith(b'\r'):
                    line = line[:-1] + linesep
                elif line.endswith(b'\n'):
                    line = line[:-1] + linesep
                self._file.write(line)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        stop = self._file.tell()
        return (start, stop)
class Message(email.message.Message):
    """Message with mailbox-format-specific properties."""

    def __init__(self, message=None):
        """Initialize a Message instance.

        message may be None, another email message, bytes, str, or a text
        or binary file object; any other type raises TypeError.
        """
        if message is None:
            email.message.Message.__init__(self)
            return
        if isinstance(message, email.message.Message):
            # Work on a copy so the source message is never shared.
            self._become_message(copy.deepcopy(message))
            if isinstance(message, Message):
                # Let the source carry over its format-specific state.
                message._explain_to(self)
            return
        if isinstance(message, bytes):
            parsed = email.message_from_bytes(message)
        elif isinstance(message, str):
            parsed = email.message_from_string(message)
        elif isinstance(message, io.TextIOWrapper):
            parsed = email.message_from_file(message)
        elif hasattr(message, "read"):
            parsed = email.message_from_binary_file(message)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        self._become_message(parsed)

    def _become_message(self, message):
        """Assume the non-format-specific state of message."""
        excluded = getattr(message, '_type_specific_attributes', [])
        for name, value in message.__dict__.items():
            if name not in excluded:
                self.__dict__[name] = value

    def _explain_to(self, message):
        """Copy format-specific state to message insofar as possible."""
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type')
        # There's nothing format-specific to explain.
        return
class MaildirMessage(Message):
    """Message with Maildir-specific properties."""

    _type_specific_attributes = ['_subdir', '_info', '_date']

    def __init__(self, message=None):
        """Initialize a MaildirMessage instance."""
        # Defaults go in first; Message.__init__ may then replace them when
        # message is a format-specific Message that explains itself to us.
        self._subdir = 'new'
        self._info = ''
        self._date = time.time()
        Message.__init__(self, message)

    def get_subdir(self):
        """Return 'new' or 'cur'."""
        return self._subdir

    def set_subdir(self, subdir):
        """Set subdir to 'new' or 'cur'."""
        if subdir not in ('new', 'cur'):
            raise ValueError("subdir must be 'new' or 'cur': %s" % subdir)
        self._subdir = subdir

    def get_flags(self):
        """Return as a string the flags that are set."""
        # Flags are only present when the info string starts with '2,'.
        return self._info[2:] if self._info.startswith('2,') else ''

    def set_flags(self, flags):
        """Set the given flags and unset all others."""
        ordered = sorted(flags)
        self._info = '2,' + ''.join(ordered)

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        merged = set(self.get_flags())
        merged |= set(flag)
        self.set_flags(''.join(merged))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        current = self.get_flags()
        if not current:
            return
        self.set_flags(''.join(set(current) - set(flag)))

    def get_date(self):
        """Return delivery date of message, in seconds since the epoch."""
        return self._date

    def set_date(self, date):
        """Set delivery date of message, in seconds since the epoch."""
        try:
            stamp = float(date)
        except ValueError:
            raise TypeError("can't convert to float: %s" % date) from None
        self._date = stamp

    def get_info(self):
        """Get the message's "info" as a string."""
        return self._info

    def set_info(self, info):
        """Set the message's "info" string."""
        if not isinstance(info, str):
            raise TypeError('info must be a string: %s' % type(info))
        self._info = info

    def _explain_to(self, message):
        """Copy Maildir-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            message.set_flags(self.get_flags())
            message.set_subdir(self.get_subdir())
            message.set_date(self.get_date())
            return

        if isinstance(message, _mboxMMDFMessage):
            own = set(self.get_flags())
            if 'S' in own:
                message.add_flag('R')
            if self.get_subdir() == 'cur':
                message.add_flag('O')
            # Remaining Maildir flag -> mbox/MMDF flag translations.
            for maildir_flag, mbox_flag in (('T', 'D'), ('F', 'F'), ('R', 'A')):
                if maildir_flag in own:
                    message.add_flag(mbox_flag)
            message.set_from('MAILER-DAEMON', time.gmtime(self.get_date()))
            return

        if isinstance(message, MHMessage):
            own = set(self.get_flags())
            if 'S' not in own:
                message.add_sequence('unseen')
            for maildir_flag, sequence in (('R', 'replied'), ('F', 'flagged')):
                if maildir_flag in own:
                    message.add_sequence(sequence)
            return

        if isinstance(message, BabylMessage):
            own = set(self.get_flags())
            if 'S' not in own:
                message.add_label('unseen')
            for maildir_flag, label in (('T', 'deleted'), ('R', 'answered'),
                                        ('P', 'forwarded')):
                if maildir_flag in own:
                    message.add_label(label)
            return

        # A plain Message has no format-specific state to receive.
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
class _mboxMMDFMessage(Message):
    """Message with mbox- or MMDF-specific properties."""

    _type_specific_attributes = ['_from']

    def __init__(self, message=None):
        """Initialize an mboxMMDFMessage instance."""
        # Default envelope: MAILER-DAEMON stamped with the current time.
        self.set_from('MAILER-DAEMON', True)
        if isinstance(message, email.message.Message):
            envelope = message.get_unixfrom()
            if envelope is not None and envelope.startswith('From '):
                # Keep what follows the 5-character 'From ' prefix.
                self.set_from(envelope[5:])
        Message.__init__(self, message)

    def get_from(self):
        """Return contents of "From " line."""
        return self._from

    def set_from(self, from_, time_=None):
        """Set "From " line, formatting and appending time_ if specified."""
        if time_ is not None:
            # True means "use the current time".
            stamp = time.gmtime() if time_ is True else time_
            from_ += ' ' + time.asctime(stamp)
        self._from = from_

    def get_flags(self):
        """Return as a string the flags that are set."""
        status = self.get('Status', '')
        xstatus = self.get('X-Status', '')
        return status + xstatus

    def set_flags(self, flags):
        """Set the given flags and unset all others."""
        remaining = set(flags)
        # 'R' and 'O' go in Status; 'D', 'F' and 'A' lead X-Status, followed
        # by any other flags in sorted order.
        status_flags = ''.join(f for f in ('R', 'O') if f in remaining)
        xstatus_flags = ''.join(f for f in ('D', 'F', 'A') if f in remaining)
        remaining.difference_update(('R', 'O', 'D', 'F', 'A'))
        xstatus_flags += ''.join(sorted(remaining))
        for header, value in (('Status', status_flags),
                              ('X-Status', xstatus_flags)):
            try:
                self.replace_header(header, value)
            except KeyError:
                self.add_header(header, value)

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        merged = set(self.get_flags())
        merged |= set(flag)
        self.set_flags(''.join(merged))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        if not ('Status' in self or 'X-Status' in self):
            return
        kept = set(self.get_flags()) - set(flag)
        self.set_flags(''.join(kept))

    def _explain_to(self, message):
        """Copy mbox- or MMDF-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            own = set(self.get_flags())
            if 'O' in own:
                message.set_subdir('cur')
            # mbox/MMDF flag -> Maildir flag translations.
            for mbox_flag, maildir_flag in (('F', 'F'), ('A', 'R'),
                                            ('R', 'S'), ('D', 'T')):
                if mbox_flag in own:
                    message.add_flag(maildir_flag)
            del message['status']
            del message['x-status']
            # The last five fields of the "From " line may be a timestamp.
            maybe_date = ' '.join(self.get_from().split()[-5:])
            try:
                message.set_date(calendar.timegm(time.strptime(maybe_date,
                                                      '%a %b %d %H:%M:%S %Y')))
            except (ValueError, OverflowError):
                pass
            return

        if isinstance(message, _mboxMMDFMessage):
            message.set_flags(self.get_flags())
            message.set_from(self.get_from())
            return

        if isinstance(message, MHMessage):
            own = set(self.get_flags())
            if 'R' not in own:
                message.add_sequence('unseen')
            for mbox_flag, sequence in (('A', 'replied'), ('F', 'flagged')):
                if mbox_flag in own:
                    message.add_sequence(sequence)
            del message['status']
            del message['x-status']
            return

        if isinstance(message, BabylMessage):
            own = set(self.get_flags())
            if 'R' not in own:
                message.add_label('unseen')
            for mbox_flag, label in (('D', 'deleted'), ('A', 'answered')):
                if mbox_flag in own:
                    message.add_label(label)
            del message['status']
            del message['x-status']
            return

        # A plain Message has no format-specific state to receive.
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
class mboxMessage(_mboxMMDFMessage):
    """Message with mbox-specific properties.

    Defines nothing of its own; all behaviour comes from _mboxMMDFMessage.
    """
class MHMessage(Message):
    """Message with MH-specific properties."""

    _type_specific_attributes = ['_sequences']

    def __init__(self, message=None):
        """Initialize an MHMessage instance."""
        # Start empty; Message.__init__ may add sequences when message is a
        # format-specific Message that explains itself to us.
        self._sequences = []
        Message.__init__(self, message)

    def get_sequences(self):
        """Return a list of sequences that include the message."""
        return list(self._sequences)

    def set_sequences(self, sequences):
        """Set the list of sequences that include the message."""
        self._sequences = list(sequences)

    def add_sequence(self, sequence):
        """Add sequence to list of sequences including the message."""
        if not isinstance(sequence, str):
            raise TypeError('sequence type must be str: %s' % type(sequence))
        if sequence not in self._sequences:
            self._sequences.append(sequence)

    def remove_sequence(self, sequence):
        """Remove sequence from the list of sequences including the message."""
        try:
            self._sequences.remove(sequence)
        except ValueError:
            # Not a member: nothing to remove.
            pass

    def _explain_to(self, message):
        """Copy MH-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            names = set(self.get_sequences())
            # The subdir is 'cur' either way; only the 'S' flag depends on
            # whether the message is in 'unseen'.
            message.set_subdir('cur')
            if 'unseen' not in names:
                message.add_flag('S')
            if 'flagged' in names:
                message.add_flag('F')
            if 'replied' in names:
                message.add_flag('R')
            return

        if isinstance(message, _mboxMMDFMessage):
            names = set(self.get_sequences())
            message.add_flag('O' if 'unseen' in names else 'RO')
            if 'flagged' in names:
                message.add_flag('F')
            if 'replied' in names:
                message.add_flag('A')
            return

        if isinstance(message, MHMessage):
            for name in self.get_sequences():
                message.add_sequence(name)
            return

        if isinstance(message, BabylMessage):
            names = set(self.get_sequences())
            for sequence, label in (('unseen', 'unseen'),
                                    ('replied', 'answered')):
                if sequence in names:
                    message.add_label(label)
            return

        # A plain Message has no format-specific state to receive.
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
class BabylMessage(Message):
    """Message with Babyl-specific properties."""

    _type_specific_attributes = ['_labels', '_visible']

    def __init__(self, message=None):
        """Initialize a BabylMessage instance."""
        # Start with no labels and empty visible headers; Message.__init__
        # may fill them in when message is a format-specific Message.
        self._labels = []
        self._visible = Message()
        Message.__init__(self, message)

    def get_labels(self):
        """Return a list of labels on the message."""
        return list(self._labels)

    def set_labels(self, labels):
        """Set the list of labels on the message."""
        self._labels = list(labels)

    def add_label(self, label):
        """Add label to list of labels on the message."""
        if not isinstance(label, str):
            raise TypeError('label must be a string: %s' % type(label))
        if label not in self._labels:
            self._labels.append(label)

    def remove_label(self, label):
        """Remove label from the list of labels on the message."""
        try:
            self._labels.remove(label)
        except ValueError:
            # Not present: nothing to remove.
            pass

    def get_visible(self):
        """Return a Message representation of visible headers."""
        return Message(self._visible)

    def set_visible(self, visible):
        """Set the Message representation of visible headers."""
        self._visible = Message(visible)

    def update_visible(self):
        """Update and/or sensibly generate a set of visible headers."""
        visible = self._visible
        # Refresh visible headers the message still has; drop the others.
        for name in visible.keys():
            if name in self:
                visible.replace_header(name, self[name])
            else:
                del visible[name]
        # Add these headers when the message has them and they are missing.
        for name in ('Date', 'From', 'Reply-To', 'To', 'CC', 'Subject'):
            if name in self and name not in visible:
                visible[name] = self[name]

    def _explain_to(self, message):
        """Copy Babyl-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            own = set(self.get_labels())
            # The subdir is 'cur' either way; only the 'S' flag depends on
            # whether the message is labelled 'unseen'.
            message.set_subdir('cur')
            if 'unseen' not in own:
                message.add_flag('S')
            if 'forwarded' in own or 'resent' in own:
                message.add_flag('P')
            if 'answered' in own:
                message.add_flag('R')
            if 'deleted' in own:
                message.add_flag('T')
            return

        if isinstance(message, _mboxMMDFMessage):
            own = set(self.get_labels())
            message.add_flag('O' if 'unseen' in own else 'RO')
            if 'deleted' in own:
                message.add_flag('D')
            if 'answered' in own:
                message.add_flag('A')
            return

        if isinstance(message, MHMessage):
            own = set(self.get_labels())
            for label, sequence in (('unseen', 'unseen'),
                                    ('answered', 'replied')):
                if label in own:
                    message.add_sequence(sequence)
            return

        if isinstance(message, BabylMessage):
            message.set_visible(self.get_visible())
            for label in self.get_labels():
                message.add_label(label)
            return

        # A plain Message has no format-specific state to receive.
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
class MMDFMessage(_mboxMMDFMessage):
    """An MMDF message; defines nothing beyond what _mboxMMDFMessage has."""
- class _ProxyFile:
- """A read-only wrapper of a file."""
- def __init__(self, f, pos=None):
- """Initialize a _ProxyFile."""
- self._file = f
- if pos is None:
- self._pos = f.tell()
- else:
- self._pos = pos
- def read(self, size=None):
- """Read bytes."""
- return self._read(size, self._file.read)
- def read1(self, size=None):
- """Read bytes."""
- return self._read(size, self._file.read1)
- def readline(self, size=None):
- """Read a line."""
- return self._read(size, self._file.readline)
- def readlines(self, sizehint=None):
- """Read multiple lines."""
- result = []
- for line in self:
- result.append(line)
- if sizehint is not None:
- sizehint -= len(line)
- if sizehint <= 0:
- break
- return result
- def __iter__(self):
- """Iterate over lines."""
- while True:
- line = self.readline()
- if not line:
- return
- yield line
- def tell(self):
- """Return the position."""
- return self._pos
- def seek(self, offset, whence=0):
- """Change position."""
- if whence == 1:
- self._file.seek(self._pos)
- self._file.seek(offset, whence)
- self._pos = self._file.tell()
- def close(self):
- """Close the file."""
- if hasattr(self, '_file'):
- try:
- if hasattr(self._file, 'close'):
- self._file.close()
- finally:
- del self._file
- def _read(self, size, read_method):
- """Read size bytes using read_method."""
- if size is None:
- size = -1
- self._file.seek(self._pos)
- result = read_method(size)
- self._pos = self._file.tell()
- return result
- def __enter__(self):
- """Context management protocol support."""
- return self
- def __exit__(self, *exc):
- self.close()
- def readable(self):
- return self._file.readable()
- def writable(self):
- return self._file.writable()
- def seekable(self):
- return self._file.seekable()
- def flush(self):
- return self._file.flush()
- @property
- def closed(self):
- if not hasattr(self, '_file'):
- return True
- if not hasattr(self._file, 'closed'):
- return False
- return self._file.closed
- __class_getitem__ = classmethod(GenericAlias)
class _PartialFile(_ProxyFile):
    """A read-only wrapper of part of a file.

    Positions reported by tell() and accepted by seek() are relative to
    start, and reads never go past stop.
    """

    def __init__(self, f, start=None, stop=None):
        """Initialize a _PartialFile.

        f is the file object to wrap.  start is the absolute offset where
        the slice begins; None means f's current position.  stop is the
        absolute offset where the slice ends; None means no upper bound.
        """
        _ProxyFile.__init__(self, f, start)
        # _ProxyFile.__init__ has already resolved start=None to f.tell();
        # reuse that so _start is always a number tell() can subtract.
        self._start = self._pos
        self._stop = stop

    def tell(self):
        """Return the position with respect to start."""
        return _ProxyFile.tell(self) - self._start

    def seek(self, offset, whence=0):
        """Change position, possibly with respect to start or stop.

        Seeks from the beginning (whence == 0) or the end (whence == 2) are
        turned into relative seeks from start or stop respectively.
        """
        if whence == 0:
            self._pos = self._start
            whence = 1
        elif whence == 2:
            if self._stop is None:
                # No explicit upper bound: use the wrapped file's own end.
                self._file.seek(0, 2)
                self._pos = self._file.tell()
            else:
                self._pos = self._stop
            whence = 1
        _ProxyFile.seek(self, offset, whence)

    def _read(self, size, read_method):
        """Read size bytes using read_method, honoring start and stop."""
        if self._stop is not None:
            remaining = self._stop - self._pos
            if remaining <= 0:
                return b''
            # Clamp "read everything" and oversized requests to the slice.
            if size is None or size < 0 or size > remaining:
                size = remaining
        return _ProxyFile._read(self, size, read_method)

    def close(self):
        """Detach from the wrapped file without closing it."""
        # do *not* close the underlying file object for partial files,
        # since it's global to the mailbox object
        if hasattr(self, '_file'):
            del self._file
def _lock_file(f, dotlock=True):
    """Acquire an exclusive lock on f with lockf and, optionally, a dot lock.

    The lockf lock is only attempted when the fcntl module is available.
    When dotlock is true, a f.name + '.lock' file is created as well.
    Raises ExternalClashError when either lock is unavailable.  On any
    failure the locks taken so far are released before re-raising.
    """
    holding_dotlock = False
    try:
        if fcntl:
            try:
                fcntl.lockf(f, fcntl.LOCK_EX | fcntl.LOCK_NB)
            except OSError as err:
                if err.errno not in (errno.EAGAIN, errno.EACCES,
                                     errno.EROFS):
                    raise
                raise ExternalClashError('lockf: lock unavailable: %s' %
                                         f.name)
        if dotlock:
            try:
                lock_path = f.name + '.lock'
                staging = _create_temporary(lock_path)
                staging.close()
            except OSError as err:
                if err.errno not in (errno.EACCES, errno.EROFS):
                    raise
                return  # Without write access, just skip dotlocking.
            try:
                try:
                    os.link(staging.name, lock_path)
                    holding_dotlock = True
                except (AttributeError, PermissionError):
                    # Linking was not possible (presumably os.link is
                    # missing or not permitted here); move the temporary
                    # file into place instead.
                    os.rename(staging.name, lock_path)
                    holding_dotlock = True
                else:
                    os.unlink(staging.name)
            except FileExistsError:
                os.remove(staging.name)
                raise ExternalClashError('dot lock unavailable: %s' %
                                         f.name)
    except:
        # Roll back whatever was acquired, then let the error propagate.
        if fcntl:
            fcntl.lockf(f, fcntl.LOCK_UN)
        if holding_dotlock:
            os.remove(lock_path)
        raise
- def _unlock_file(f):
- """Unlock file f using lockf and dot locking."""
- if fcntl:
- fcntl.lockf(f, fcntl.LOCK_UN)
- if os.path.exists(f.name + '.lock'):
- os.remove(f.name + '.lock')
- def _create_carefully(path):
- """Create a file if it doesn't exist and open for reading and writing."""
- fd = os.open(path, os.O_CREAT | os.O_EXCL | os.O_RDWR, 0o666)
- try:
- return open(path, 'rb+')
- finally:
- os.close(fd)
def _create_temporary(path):
    """Create and open a new file whose name is derived from path.

    The name is path followed by the current time in whole seconds, the
    host name and the process id, separated by dots.
    """
    timestamp = int(time.time())
    hostname = socket.gethostname()
    pid = os.getpid()
    return _create_carefully(f'{path}.{timestamp}.{hostname}.{pid}')
- def _sync_flush(f):
- """Ensure changes to file f are physically on disk."""
- f.flush()
- if hasattr(os, 'fsync'):
- os.fsync(f.fileno())
def _sync_close(f):
    """Close file f, ensuring all changes are physically on disk.

    f.close() is called even when flushing or syncing fails, so a failed
    sync no longer leaves the file open; the failure is still raised to
    the caller.
    """
    try:
        _sync_flush(f)
    finally:
        f.close()
class Error(Exception):
    """Base class for the errors specific to this module."""
class NoSuchMailboxError(Error):
    """Raised when the requested mailbox is missing and is not created."""
class NotEmptyError(Error):
    """Raised when deletion is requested for a mailbox that is not empty."""
class ExternalClashError(Error):
    """Raised when an action fails because of another process."""
class FormatError(Error):
    """Raised when a file does not appear to have a valid format."""
|