2003-12-15 18:16:09 +08:00
|
|
|
r"""File-like objects that read from or write to a string buffer.
|
2000-02-02 23:10:15 +08:00
|
|
|
|
|
|
|
This implements (nearly) all stdio methods.
|
|
|
|
|
|
|
|
f = StringIO() # ready for writing
|
|
|
|
f = StringIO(buf) # ready for reading
|
|
|
|
f.close() # explicitly release resources held
|
|
|
|
flag = f.isatty() # always false
|
|
|
|
pos = f.tell() # get current position
|
|
|
|
f.seek(pos) # set current position
|
|
|
|
f.seek(pos, mode) # mode 0: absolute; 1: relative; 2: relative to EOF
|
|
|
|
buf = f.read() # read until EOF
|
|
|
|
buf = f.read(n) # read up to n bytes
|
|
|
|
buf = f.readline() # read until end of line ('\n') or EOF
|
|
|
|
list = f.readlines()# list of f.readline() results until EOF
|
2000-09-28 12:21:06 +08:00
|
|
|
f.truncate([size]) # truncate file to at most size (default: current pos)
|
2000-02-02 23:10:15 +08:00
|
|
|
f.write(buf) # write at current position
|
|
|
|
f.writelines(list) # for line in list: f.write(line)
|
|
|
|
f.getvalue() # return whole file's contents as a string
|
|
|
|
|
|
|
|
Notes:
|
|
|
|
- Using a real file is often faster (but less convenient).
|
2000-02-28 23:12:25 +08:00
|
|
|
- There's also a much faster implementation in C, called cStringIO, but
|
|
|
|
it's not subclassable.
|
2000-02-02 23:10:15 +08:00
|
|
|
- fileno() is left unimplemented so that code which uses it triggers
|
|
|
|
an exception early.
|
|
|
|
- Seeking far beyond EOF and then writing will insert real null
|
|
|
|
bytes that occupy space in the buffer.
|
|
|
|
- There's a simple test set (see end of this file).
|
|
|
|
"""
|
2000-12-13 07:12:23 +08:00
|
|
|
try:
|
2000-12-13 07:16:51 +08:00
|
|
|
from errno import EINVAL
|
2000-12-13 07:12:23 +08:00
|
|
|
except ImportError:
|
2000-12-13 07:16:51 +08:00
|
|
|
EINVAL = 22
|
2000-12-13 07:12:23 +08:00
|
|
|
|
2001-01-21 03:54:20 +08:00
|
|
|
__all__ = ["StringIO"]
|
|
|
|
|
2003-10-18 18:20:42 +08:00
|
|
|
def _complain_ifclosed(closed):
    """Raise ValueError if *closed* is true; otherwise do nothing.

    Shared guard called by the StringIO methods that must not operate on
    a closed object.
    """
    if closed:
        # Call form of raise: unlike ``raise Class, "message"`` it is
        # accepted by both Python 2 and Python 3.
        raise ValueError("I/O operation on closed file")


class StringIO:
    """class StringIO([buffer])

    When a StringIO object is created, it can be initialized to an existing
    string by passing the string to the constructor.  If no string is given,
    the StringIO will start empty.

    The StringIO object can accept either Unicode or 8-bit strings, but
    mixing the two may take some care.  If both are used, 8-bit strings that
    cannot be interpreted as 7-bit ASCII (that use the 8th bit) will cause
    a UnicodeError to be raised when getvalue() is called.
    """

    def __init__(self, buf=''):
        """Create the object, optionally pre-loaded with *buf*.

        A *buf* that is not a string is converted with str().
        """
        # Force self.buf to be a string or unicode
        if not isinstance(buf, basestring):
            buf = str(buf)
        self.buf = buf        # consolidated contents
        self.len = len(buf)   # logical length: len(buf) plus pending chunks
        self.buflist = []     # written chunks not yet joined onto self.buf
        self.pos = 0          # current read/write position
        self.closed = False
        self.softspace = 0    # only initialised here; unused by this class

    def _flush_buflist(self):
        """Join any pending chunks in self.buflist onto self.buf."""
        if self.buflist:
            self.buf += ''.join(self.buflist)
            self.buflist = []

    def __iter__(self):
        """Return self; the object is its own line iterator."""
        return self

    def next(self):
        """Return the next line.

        Raises StopIteration at end of data or when the object is closed.
        """
        if self.closed:
            raise StopIteration
        r = self.readline()
        if not r:
            raise StopIteration
        return r

    def close(self):
        """Free the memory buffer.

        Closing an already closed object is a no-op.
        """
        if not self.closed:
            self.closed = True
            del self.buf, self.pos
            # Pending chunks hold memory too; drop them as well.
            self.buflist = []

    def isatty(self):
        """Return False.  Raises ValueError if the object is closed."""
        _complain_ifclosed(self.closed)
        return False

    def seek(self, pos, mode=0):
        """Set the current position.

        mode 0: *pos* is absolute; 1: relative to the current position;
        2: relative to the end.  A resulting negative position is clamped
        to 0.  Raises ValueError if the object is closed.
        """
        _complain_ifclosed(self.closed)
        self._flush_buflist()
        if mode == 1:
            pos += self.pos
        elif mode == 2:
            pos += self.len
        self.pos = max(0, pos)

    def tell(self):
        """Return the current position.  Raises ValueError if closed."""
        _complain_ifclosed(self.closed)
        return self.pos

    def read(self, n=-1):
        """Read at most *n* characters and return them.

        A negative *n* or None reads everything up to the end of the
        data.  Raises ValueError if the object is closed.
        """
        _complain_ifclosed(self.closed)
        self._flush_buflist()
        if n is None or n < 0:
            newpos = self.len
        else:
            newpos = min(self.pos+n, self.len)
        r = self.buf[self.pos:newpos]
        self.pos = newpos
        return r

    def readline(self, length=None):
        """Read one line, including its trailing '\\n' if present.

        If *length* is given and non-negative, at most that many
        characters are returned (possibly an incomplete line).  None or a
        negative *length* means no limit.  Returns '' at end of data.
        Raises ValueError if the object is closed.
        """
        _complain_ifclosed(self.closed)
        self._flush_buflist()
        i = self.buf.find('\n', self.pos)
        if i < 0:
            newpos = self.len
        else:
            newpos = i+1
        # A negative length used to be applied as a limit, which moved the
        # position backwards and returned ''; treat it as "no limit".
        if length is not None and length >= 0:
            if self.pos + length < newpos:
                newpos = self.pos + length
        r = self.buf[self.pos:newpos]
        self.pos = newpos
        return r

    def readlines(self, sizehint=0):
        """Return a list of the remaining lines.

        If *sizehint* is positive, reading stops once the total length of
        the collected lines reaches it (whole lines are always returned).
        """
        total = 0
        lines = []
        line = self.readline()
        while line:
            lines.append(line)
            total += len(line)
            if 0 < sizehint <= total:
                break
            line = self.readline()
        return lines

    def truncate(self, size=None):
        """Cut the contents down to at most *size* characters.

        *size* defaults to the current position.  If the current position
        lies beyond *size* it is moved back to *size*.  Raises IOError
        (EINVAL) for a negative *size* and ValueError if closed.
        """
        _complain_ifclosed(self.closed)
        if size is None:
            size = self.pos
        elif size < 0:
            raise IOError(EINVAL, "Negative size not allowed")
        elif size < self.pos:
            self.pos = size
        self.buf = self.getvalue()[:size]
        # Keep the logical length in step with the buffer; otherwise
        # seek(0, 2), read() and write() keep using the old length.
        self.len = len(self.buf)

    def write(self, s):
        """Write *s* at the current position, overwriting or extending.

        A false *s* (e.g. '') is ignored; a non-string *s* is converted
        with str().  Writing past the end first pads the gap with null
        characters.  Raises ValueError if the object is closed.
        """
        _complain_ifclosed(self.closed)
        if not s: return
        # Force s to be a string or unicode
        if not isinstance(s, basestring):
            s = str(s)
        if self.pos == self.len:
            # Common case: append at the end and defer the join.
            self.buflist.append(s)
            self.len = self.pos = self.pos + len(s)
            return
        if self.pos > self.len:
            # Position was moved past the end: fill the gap with nulls.
            self.buflist.append('\0'*(self.pos - self.len))
            self.len = self.pos
        newpos = self.pos + len(s)
        if self.pos < self.len:
            # Overwrite in the middle: splice s between the text before
            # the position and whatever remains after the written span.
            self._flush_buflist()
            self.buflist = [self.buf[:self.pos], s, self.buf[newpos:]]
            self.buf = ''
            if newpos > self.len:
                self.len = newpos
        else:
            self.buflist.append(s)
            self.len = newpos
        self.pos = newpos

    def writelines(self, list):
        """Write every item of *list* in order, as write() would.

        Items go through write() one by one, so non-string items are
        converted the same way write() converts them.
        """
        for line in list:
            self.write(line)

    def flush(self):
        """Do nothing except raise ValueError if the object is closed."""
        _complain_ifclosed(self.closed)

    def getvalue(self):
        """
        Retrieve the entire contents of the "file" at any time before
        the StringIO object's close() method is called.

        The StringIO object can accept either Unicode or 8-bit strings,
        but mixing the two may take some care.  If both are used, 8-bit
        strings that cannot be interpreted as 7-bit ASCII (that use the
        8th bit) will cause a UnicodeError to be raised when getvalue()
        is called.

        Raises ValueError if the object is closed.
        """
        # close() deletes self.buf; report that the same way every other
        # method does instead of failing with AttributeError.
        _complain_ifclosed(self.closed)
        self._flush_buflist()
        return self.buf
|
1994-06-23 19:53:27 +08:00
|
|
|
|
|
|
|
|
|
|
|
# A little test suite
|
|
|
|
|
|
|
|
def test():
    """Exercise StringIO against the contents of a real text file.

    The file is taken from the first command-line argument, defaulting to
    '/etc/passwd'.  Its contents are written into a StringIO, then read
    back through seek/tell/read/readline/readlines.  Progress is printed
    and RuntimeError is raised on the first mismatch.
    """
    import sys
    if sys.argv[1:]:
        path = sys.argv[1]
    else:
        path = '/etc/passwd'
    # Read the file both as a list of lines and as one string, closing
    # the handle explicitly rather than leaving it to the garbage
    # collector.
    fp = open(path, 'r')
    try:
        lines = fp.readlines()
        fp.seek(0)
        text = fp.read()
    finally:
        fp.close()
    f = StringIO()
    for line in lines[:-2]:
        f.write(line)
    f.writelines(lines[-2:])
    if f.getvalue() != text:
        raise RuntimeError('write failed')
    length = f.tell()
    # Single-argument print(...) produces the same output whether print
    # is a statement or a function.
    print('File length = %s' % length)
    # Overwrite the second line with itself; the contents must not change.
    f.seek(len(lines[0]))
    f.write(lines[1])
    f.seek(0)
    print('First line = %s' % repr(f.readline()))
    print('Position = %s' % f.tell())
    line = f.readline()
    print('Second line = %s' % repr(line))
    f.seek(-len(line), 1)
    line2 = f.read(len(line))
    if line != line2:
        raise RuntimeError('bad result after seek back')
    f.seek(len(line2), 1)
    rest = f.readlines()
    line = rest[-1]
    f.seek(f.tell() - len(line))
    line2 = f.read()
    if line != line2:
        raise RuntimeError('bad result after seek back from EOF')
    print('Read %s more lines' % len(rest))
    print('File length = %s' % f.tell())
    if f.tell() != length:
        raise RuntimeError('bad length')
    f.close()


if __name__ == '__main__':
    test()
|