cpython/Lib/mimetools.py

"""Various tools used by MIME-reading or MIME-writing programs."""


import os
import rfc822
import tempfile

# Names exported by "from <this module> import *".  The pipeto() and
# pipethrough() helpers defined further down are not listed here.
__all__ = ["Message","choose_boundary","encode","decode","copyliteral",
           "copybinary"]

class Message(rfc822.Message):
    """An rfc822.Message subclass that understands MIME headers.

    On construction the Content-Transfer-Encoding and Content-Type
    headers are read.  The content type is split into a main type, a
    subtype and a list of parameters, all available through the
    accessor methods below.
    """

    def __init__(self, fp, seekable = 1):
        """Read the headers from fp and parse the MIME-specific ones.

        fp and seekable are handed unchanged to rfc822.Message.__init__.
        """
        rfc822.Message.__init__(self, fp, seekable)
        self.encodingheader = \
                self.getheader('content-transfer-encoding')
        self.typeheader = \
                self.getheader('content-type')
        self.parsetype()
        self.parseplist()

    def parsetype(self):
        """Split the Content-Type header into type and parameter text.

        Sets self.type ('main/sub', stripped and lowercased),
        self.maintype, self.subtype and self.plisttext (everything from
        the first ';' onwards, or '' when there is none).  A missing
        header is treated as 'text/plain'.
        """
        ctype = self.typeheader
        if ctype is None:
            ctype = 'text/plain'
        sep = ctype.find(';')
        if sep >= 0:
            self.plisttext = ctype[sep:]
            ctype = ctype[:sep]
        else:
            self.plisttext = ''
        fields = [field.strip().lower() for field in ctype.split('/')]
        self.type = '/'.join(fields)
        self.maintype = fields[0]
        self.subtype = '/'.join(fields[1:])

    def parseplist(self):
        """Split self.plisttext into the parameter list self.plist.

        Each entry is one ';'-separated parameter with surrounding
        whitespace removed.  For 'name=value' entries the name is
        lowercased and whitespace around the '=' is dropped; the value
        keeps its case and any quotes.  A ';' inside a double-quoted
        value does not end the parameter.
        """
        text = self.plisttext
        self.plist = []
        while text[:1] == ';':
            text = text[1:]
            end = text.find(';')
            # An odd number of unescaped double quotes before this ';'
            # means it sits inside a quoted string, so it is not a
            # separator: keep looking for the next one.
            while end > 0 and \
                    (text.count('"', 0, end) -
                     text.count('\\"', 0, end)) % 2:
                end = text.find(';', end + 1)
            if end < 0:
                end = len(text)
            param = text[:end]
            if '=' in param:
                eq = param.index('=')
                param = param[:eq].strip().lower() + \
                        '=' + param[eq+1:].strip()
            self.plist.append(param.strip())
            text = text[end:]

    def getplist(self):
        """Return the list of parameters built by parseplist()."""
        return self.plist

    def getparam(self, name):
        """Return the value of the first parameter called name, or None.

        The lookup is case-insensitive on the name.  The value is passed
        through rfc822.unquote before being returned.
        """
        prefix = name.lower() + '='
        n = len(prefix)
        for param in self.plist:
            if param[:n] == prefix:
                return rfc822.unquote(param[n:])
        return None

    def getparamnames(self):
        """Return the lowercased names of all 'name=value' parameters."""
        names = []
        for param in self.plist:
            eq = param.find('=')
            if eq >= 0:
                names.append(param[:eq].lower())
        return names

    def getencoding(self):
        """Return the lowercased Content-Transfer-Encoding.

        Returns '7bit' when the header is absent.
        """
        if self.encodingheader is None:
            return '7bit'
        return self.encodingheader.lower()

    def gettype(self):
        """Return the content type as 'maintype/subtype'."""
        return self.type

    def getmaintype(self):
        """Return the part of the content type before the first '/'."""
        return self.maintype

    def getsubtype(self):
        """Return the part of the content type after the first '/'."""
        return self.subtype


# Utility functions
# -----------------


# Cached "hostid.uid.pid" part of the boundary; computed on first use.
_prefix = None

def choose_boundary():
    """Return a random string usable as a multipart boundary.

    The method used is so that it is *very* unlikely that the same
    string of characters will ever occur again in the Universe,
    so the caller needn't check the data it is packing for the
    occurrence of the boundary.

    The result has the form 'hostid.uid.pid.timestamp.seed'.  The
    first three fields are computed once and cached in the module
    global _prefix; the timestamp and random seed are fresh per call.

    The boundary contains dots so you have to quote it in the header."""

    global _prefix
    import time
    import random
    if _prefix is None:
        import socket
        try:
            hostid = socket.gethostbyname(socket.gethostname())
        except socket.gaierror:
            # The local host name does not resolve; any address will do
            # since it only serves to make the boundary more unique.
            hostid = '127.0.0.1'
        try:
            uid = repr(os.getuid())
        except AttributeError:
            # Platform without os.getuid
            uid = '1'
        try:
            pid = repr(os.getpid())
        except AttributeError:
            # Platform without os.getpid
            pid = '1'
        _prefix = hostid + '.' + uid + '.' + pid
    timestamp = '%.3f' % time.time()
    seed = repr(random.randint(0, 32767))
    return _prefix + '.' + timestamp + '.' + seed


# Subroutines for decoding and encoding some common content-transfer-encodings

def decode(input, output, encoding):
    """Decode common content-transfer-encodings (base64, quopri, uuencode).

    input and output are file objects; encoding is the transfer
    encoding name.  base64, quoted-printable and the uuencode variants
    are handled by the base64, quopri and uu modules; '7bit' and '8bit'
    copy the data through unchanged.  Any other name is looked up in
    decodetab and, if present, run as an external command through
    pipethrough().

    Raises ValueError for an encoding that is not recognized.
    """
    if encoding == 'base64':
        import base64
        return base64.decode(input, output)
    if encoding == 'quoted-printable':
        import quopri
        return quopri.decode(input, output)
    if encoding in ('uuencode', 'x-uuencode', 'uue', 'x-uue'):
        import uu
        return uu.decode(input, output)
    if encoding in ('7bit', '8bit'):
        return output.write(input.read())
    if encoding in decodetab:
        pipethrough(input, decodetab[encoding], output)
    else:
        raise ValueError(
              'unknown Content-Transfer-Encoding: %s' % encoding)

def encode(input, output, encoding):
    """Encode common content-transfer-encodings (base64, quopri, uuencode).

    input and output are file objects; encoding is the transfer
    encoding name.  base64, quoted-printable and the uuencode variants
    are handled by the base64, quopri and uu modules; '7bit' and '8bit'
    copy the data through unchanged.  Any other name is looked up in
    encodetab and, if present, run as an external command through
    pipethrough().

    Raises ValueError for an encoding that is not recognized.
    """
    if encoding == 'base64':
        import base64
        return base64.encode(input, output)
    if encoding == 'quoted-printable':
        import quopri
        return quopri.encode(input, output, 0)
    if encoding in ('uuencode', 'x-uuencode', 'uue', 'x-uue'):
        import uu
        return uu.encode(input, output)
    if encoding in ('7bit', '8bit'):
        return output.write(input.read())
    if encoding in encodetab:
        pipethrough(input, encodetab[encoding], output)
    else:
        raise ValueError(
              'unknown Content-Transfer-Encoding: %s' % encoding)

# The following is no longer used for standard encodings: decode() and
# encode() handle base64, quoted-printable and the uuencode names with
# the base64, quopri and uu modules, and consult these tables only for
# names they did not already handle.

# XXX This requires that uudecode and mmencode are in $PATH

# Shell fragment reading uuencoded data on stdin: sed rewrites the
# "begin" line so the output goes to $TEMP with mode 600, the result is
# piped to uudecode, then $TEMP is copied to stdout and removed.
# NOTE(review): $TEMP is a fixed /tmp/@uu.<pid> name, i.e. predictable;
# confirm this is acceptable wherever the fragment is still used.
uudecode_pipe = '''(
TEMP=/tmp/@uu.$$
sed "s%^begin [0-7][0-7]* .*%begin 600 $TEMP%" | uudecode
cat $TEMP
rm $TEMP
)'''

# Encoding name -> shell command that decode() passes to pipethrough().
decodetab = {
        'uuencode':             uudecode_pipe,
        'x-uuencode':           uudecode_pipe,
        'uue':                  uudecode_pipe,
        'x-uue':                uudecode_pipe,
        'quoted-printable':     'mmencode -u -q',
        'base64':               'mmencode -u -b',
}

# Encoding name -> shell command that encode() passes to pipethrough().
# Presumably 'tempfile' is the file name uuencode records in its output
# header rather than a real path -- TODO confirm.
encodetab = {
        'x-uuencode':           'uuencode tempfile',
        'uuencode':             'uuencode tempfile',
        'x-uue':                'uuencode tempfile',
        'uue':                  'uuencode tempfile',
        'quoted-printable':     'mmencode -q',
        'base64':               'mmencode -b',
}

def pipeto(input, command):
    """Feed the lines of the file object input to a shell command.

    command is started with os.popen and receives the data on its
    standard input.  The pipe is closed even if copying fails.
    """
    pipe = os.popen(command, 'w')
    try:
        copyliteral(input, pipe)
    finally:
        pipe.close()

def pipethrough(input, command, output):
    """Filter input through a shell command and write the result to output.

    The contents of input are first saved to a temporary file, which is
    then redirected to the standard input of command; whatever command
    prints is copied to output.  The temporary file is removed and the
    pipe closed even if one of the steps fails.
    """
    (fd, tempname) = tempfile.mkstemp()
    try:
        temp = os.fdopen(fd, 'w')
        try:
            copyliteral(input, temp)
        finally:
            temp.close()
        pipe = os.popen(command + ' <' + tempname, 'r')
        try:
            copybinary(pipe, output)
        finally:
            pipe.close()
    finally:
        os.unlink(tempname)

def copyliteral(input, output):
    """Copy input to output one line at a time until input is exhausted."""
    line = input.readline()
    while line:
        output.write(line)
        line = input.readline()

def copybinary(input, output):
    """Copy input to output in blocks of 8192 until input is exhausted."""
    blocksize = 8192
    chunk = input.read(blocksize)
    while chunk:
        output.write(chunk)
        chunk = input.read(blocksize)
More trivial comment -> docstring transformations by Ka-Ping Yee, who writes: Here is batch 2, as a big collection of CVS context diffs. Along with moving comments into docstrings, i've added a couple of missing docstrings and attempted to make sure more module docstrings begin with a one-line summary. I did not add docstrings to the methods in profile.py for fear of upsetting any careful optimizations there, though i did move class documentation into class docstrings. The convention i'm using is to leave credits/version/copyright type of stuff in # comments, and move the rest of the descriptive stuff about module usage into module docstrings. Hope this is okay. 2000-02-04 23:10:34 +08:00			`"""Various tools used by MIME-reading or MIME-writing programs."""`
New modules mimetools and rfc822. Minor, minor changes to commands.py and sndhdr.py. 1992-07-13 22:28:59 +08:00

Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00			`import os`
New modules mimetools and rfc822. Minor, minor changes to commands.py and sndhdr.py. 1992-07-13 22:28:59 +08:00			`import rfc822`
Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00			`import tempfile`
New modules mimetools and rfc822. Minor, minor changes to commands.py and sndhdr.py. 1992-07-13 22:28:59 +08:00
added a few more __all__ lists test___all__.py: fail silently in check_all if the module can't be imported 2001-01-25 23:29:22 +08:00			`__all__ = ["Message","choose_boundary","encode","decode","copyliteral",`
			`"copybinary"]`
New modules mimetools and rfc822. Minor, minor changes to commands.py and sndhdr.py. 1992-07-13 22:28:59 +08:00
			`class Message(rfc822.Message):`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`"""A derived class of rfc822.Message that knows about MIME headers and`
			`contains some hooks for decoding encoded and multipart messages."""`

			`def __init__(self, fp, seekable = 1):`
			`rfc822.Message.__init__(self, fp, seekable)`
			`self.encodingheader = \`
			`self.getheader('content-transfer-encoding')`
			`self.typeheader = \`
			`self.getheader('content-type')`
			`self.parsetype()`
			`self.parseplist()`

			`def parsetype(self):`
			`str = self.typeheader`
			`if str is None:`
			`str = 'text/plain'`
			`if ';' in str:`
			`i = str.index(';')`
			`self.plisttext = str[i:]`
			`str = str[:i]`
			`else:`
			`self.plisttext = ''`
			`fields = str.split('/')`
			`for i in range(len(fields)):`
			`fields[i] = fields[i].strip().lower()`
			`self.type = '/'.join(fields)`
			`self.maintype = fields[0]`
			`self.subtype = '/'.join(fields[1:])`

			`def parseplist(self):`
			`str = self.plisttext`
			`self.plist = []`
			`while str[:1] == ';':`
			`str = str[1:]`
			`if ';' in str:`
			`# XXX Should parse quotes!`
			`end = str.index(';')`
			`else:`
			`end = len(str)`
			`f = str[:end]`
			`if '=' in f:`
			`i = f.index('=')`
			`f = f[:i].strip().lower() + \`
			`'=' + f[i+1:].strip()`
			`self.plist.append(f.strip())`
			`str = str[end:]`

			`def getplist(self):`
			`return self.plist`

			`def getparam(self, name):`
			`name = name.lower() + '='`
			`n = len(name)`
			`for p in self.plist:`
			`if p[:n] == name:`
			`return rfc822.unquote(p[n:])`
			`return None`

			`def getparamnames(self):`
			`result = []`
			`for p in self.plist:`
			`i = p.find('=')`
			`if i >= 0:`
			`result.append(p[:i].lower())`
			`return result`

			`def getencoding(self):`
			`if self.encodingheader is None:`
			`return '7bit'`
			`return self.encodingheader.lower()`

			`def gettype(self):`
			`return self.type`

			`def getmaintype(self):`
			`return self.maintype`

			`def getsubtype(self):`
			`return self.subtype`
New modules mimetools and rfc822. Minor, minor changes to commands.py and sndhdr.py. 1992-07-13 22:28:59 +08:00



			`# Utility functions`
			`# -----------------`


			`_prefix = None`

			`def choose_boundary():`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`"""Return a random string usable as a multipart boundary.`
			`The method used is so that it is very unlikely that the same`
			`string of characters will every occur again in the Universe,`
			`so the caller needn't check the data it is packing for the`
			`occurrence of the boundary.`

			`The boundary contains dots so you have to quote it in the header."""`

			`global _prefix`
			`import time`
			`import random`
			`if _prefix is None:`
			`import socket`
			`hostid = socket.gethostbyname(socket.gethostname())`
			`try:`
			uid = `os.getuid()`
Only AttributeError can be raised in this situation - on systems without getuid or getpid. posix_getuid & posix_getpid never raise exceptions when called with no args. 2002-03-23 13:58:52 +08:00			`except AttributeError:`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`uid = '1'`
			`try:`
			pid = `os.getpid()`
Only AttributeError can be raised in this situation - on systems without getuid or getpid. posix_getuid & posix_getpid never raise exceptions when called with no args. 2002-03-23 13:58:52 +08:00			`except AttributeError:`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`pid = '1'`
			`_prefix = hostid + '.' + uid + '.' + pid`
			`timestamp = '%.3f' % time.time()`
			seed = `random.randint(0, 32767)`
			`return _prefix + '.' + timestamp + '.' + seed`
Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00

			`# Subroutines for decoding some common content-transfer-types`

			`def decode(input, output, encoding):`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`"""Decode common content-transfer-encodings (base64, quopri, uuencode)."""`
			`if encoding == 'base64':`
			`import base64`
			`return base64.decode(input, output)`
			`if encoding == 'quoted-printable':`
			`import quopri`
			`return quopri.decode(input, output)`
			`if encoding in ('uuencode', 'x-uuencode', 'uue', 'x-uue'):`
			`import uu`
			`return uu.decode(input, output)`
			`if encoding in ('7bit', '8bit'):`
			`return output.write(input.read())`
SF 563203. Replaced 'has_key()' with 'in'. 2002-06-01 22:18:47 +08:00			`if encoding in decodetab:`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`pipethrough(input, decodetab[encoding], output)`
			`else:`
			`raise ValueError, \`
			`'unknown Content-Transfer-Encoding: %s' % encoding`
Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00
			`def encode(input, output, encoding):`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`"""Encode common content-transfer-encodings (base64, quopri, uuencode)."""`
			`if encoding == 'base64':`
			`import base64`
			`return base64.encode(input, output)`
			`if encoding == 'quoted-printable':`
			`import quopri`
			`return quopri.encode(input, output, 0)`
			`if encoding in ('uuencode', 'x-uuencode', 'uue', 'x-uue'):`
			`import uu`
			`return uu.encode(input, output)`
			`if encoding in ('7bit', '8bit'):`
			`return output.write(input.read())`
SF 563203. Replaced 'has_key()' with 'in'. 2002-06-01 22:18:47 +08:00			`if encoding in encodetab:`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`pipethrough(input, encodetab[encoding], output)`
			`else:`
			`raise ValueError, \`
			`'unknown Content-Transfer-Encoding: %s' % encoding`
Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00
Use the modules base64, quopri, and uu, instead of external programs to decode/encode the standard transfer encodings. 1997-07-12 00:33:26 +08:00			`# The following is no longer used for standard encodings`

			`# XXX This requires that uudecode and mmencode are in $PATH`

Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00			`uudecode_pipe = '''(`
			`TEMP=/tmp/@uu.$$`
			`sed "s%^begin [0-7][0-7]* .*%begin 600 $TEMP%" \| uudecode`
			`cat $TEMP`
			`rm $TEMP`
			`)'''`

			`decodetab = {`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`'uuencode': uudecode_pipe,`
			`'x-uuencode': uudecode_pipe,`
			`'uue': uudecode_pipe,`
			`'x-uue': uudecode_pipe,`
			`'quoted-printable': 'mmencode -u -q',`
			`'base64': 'mmencode -u -b',`
Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00			`}`

			`encodetab = {`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`'x-uuencode': 'uuencode tempfile',`
			`'uuencode': 'uuencode tempfile',`
			`'x-uue': 'uuencode tempfile',`
			`'uue': 'uuencode tempfile',`
			`'quoted-printable': 'mmencode -q',`
			`'base64': 'mmencode -b',`
Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00			`}`

			`def pipeto(input, command):`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`pipe = os.popen(command, 'w')`
			`copyliteral(input, pipe)`
			`pipe.close()`
Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00
			`def pipethrough(input, command, output):`
Massive changes from SF 589982 (tempfile.py rewrite, by Zack Weinberg). This changes all uses of deprecated tempfile functions to the recommended ones. 2002-08-10 00:38:32 +08:00			`(fd, tempname) = tempfile.mkstemp()`
			`temp = os.fdopen(fd, 'w')`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`copyliteral(input, temp)`
			`temp.close()`
			`pipe = os.popen(command + ' <' + tempname, 'r')`
			`copybinary(pipe, output)`
			`pipe.close()`
			`os.unlink(tempname)`
Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00
			`def copyliteral(input, output):`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`while 1:`
			`line = input.readline()`
			`if not line: break`
			`output.write(line)`
Merge alpha100 branch back to main trunk 1994-08-01 19:34:53 +08:00
			`def copybinary(input, output):`
Whitespace normalization. 2001-01-15 07:47:14 +08:00			`BUFSIZE = 8192`
			`while 1:`
			`line = input.read(BUFSIZE)`
			`if not line: break`
			`output.write(line)`