2000-02-02 23:10:15 +08:00
|
|
|
"""File-like objects that read from or write to a string buffer.
|
|
|
|
|
|
|
|
This implements (nearly) all stdio methods.
|
|
|
|
|
|
|
|
f = StringIO() # ready for writing
|
|
|
|
f = StringIO(buf) # ready for reading
|
|
|
|
f.close() # explicitly release resources held
|
|
|
|
flag = f.isatty() # always false
|
|
|
|
pos = f.tell() # get current position
|
|
|
|
f.seek(pos) # set current position
|
|
|
|
f.seek(pos, mode) # mode 0: absolute; 1: relative; 2: relative to EOF
|
|
|
|
buf = f.read() # read until EOF
|
|
|
|
buf = f.read(n) # read up to n bytes
|
|
|
|
buf = f.readline() # read until end of line ('\n') or EOF
|
|
|
|
list = f.readlines()# list of f.readline() results until EOF
|
2000-09-28 12:21:06 +08:00
|
|
|
f.truncate([size]) # truncate file to at most size (default: current pos)
|
2000-02-02 23:10:15 +08:00
|
|
|
f.write(buf) # write at current position
|
|
|
|
f.writelines(list) # for line in list: f.write(line)
|
|
|
|
f.getvalue() # return whole file's contents as a string
|
|
|
|
|
|
|
|
Notes:
|
|
|
|
- Using a real file is often faster (but less convenient).
|
2000-02-28 23:12:25 +08:00
|
|
|
- There's also a much faster implementation in C, called cStringIO, but
|
|
|
|
it's not subclassable.
|
2000-02-02 23:10:15 +08:00
|
|
|
- fileno() is left unimplemented so that code which uses it triggers
|
|
|
|
an exception early.
|
|
|
|
- Seeking far beyond EOF and then writing will insert real null
|
|
|
|
bytes that occupy space in the buffer.
|
|
|
|
- There's a simple test set (see end of this file).
|
|
|
|
"""
|
2002-01-07 01:15:05 +08:00
|
|
|
import types
|
2000-12-13 07:12:23 +08:00
|
|
|
try:
|
2000-12-13 07:16:51 +08:00
|
|
|
from errno import EINVAL
|
2000-12-13 07:12:23 +08:00
|
|
|
except ImportError:
|
2000-12-13 07:16:51 +08:00
|
|
|
EINVAL = 22
|
2000-12-13 07:12:23 +08:00
|
|
|
|
2001-01-21 03:54:20 +08:00
|
|
|
__all__ = ["StringIO"]
|
|
|
|
|
1994-06-23 19:53:27 +08:00
|
|
|
class StringIO:
    """File-like object that reads from and writes to an in-memory string.

    Instance attributes:
      buf      -- the consolidated contents (a string or unicode object)
      buflist  -- chunks written since the last consolidation; they are
                  joined onto buf lazily, the next time the contents are
                  needed as one string
      len      -- logical length of the file (buf plus pending chunks)
      pos      -- current read/write position
      closed   -- 0 while open, 1 after close()
      softspace -- initialised to 0 (presumably for the print statement's
                  soft-space protocol; not used inside this class)
    """

    # Types accepted as-is for buffer contents; anything else goes through
    # str().  Falls back to plain str when the types module does not define
    # UnicodeType, so that construction does not fail with AttributeError.
    _string_types = (str, getattr(types, 'UnicodeType', str))

    def __init__(self, buf = ''):
        """Create the object, optionally preloaded with buf for reading.

        A buf that is not a string or unicode object is converted with
        str().  The position starts at 0.
        """
        # Force self.buf to be a string or unicode
        if not isinstance(buf, self._string_types):
            buf = str(buf)
        self.buf = buf
        self.len = len(buf)
        self.buflist = []
        self.pos = 0
        self.closed = 0
        self.softspace = 0

    def _complain_ifclosed(self):
        """Raise ValueError if this object has already been closed."""
        if self.closed:
            raise ValueError("I/O operation on closed file")

    def _consolidate(self):
        """Join any pending chunks in self.buflist onto self.buf."""
        if self.buflist:
            self.buf += ''.join(self.buflist)
            self.buflist = []

    def __iter__(self):
        """Return an iterator that yields lines until readline() gives ''."""
        return iter(self.readline, '')

    def close(self):
        """Mark the object closed and drop the buffer; safe to call twice."""
        if not self.closed:
            self.closed = 1
            del self.buf, self.pos

    def isatty(self):
        """Return 0 (never a tty); raise ValueError if closed."""
        self._complain_ifclosed()
        return 0

    def seek(self, pos, mode = 0):
        """Set the current position.

        mode 1 makes pos relative to the current position, mode 2 relative
        to the end of the file; any other mode treats pos as absolute.
        The resulting position is clamped so it is never negative.
        Raises ValueError if closed.
        """
        self._complain_ifclosed()
        self._consolidate()
        if mode == 1:
            pos += self.pos
        elif mode == 2:
            pos += self.len
        self.pos = max(0, pos)

    def tell(self):
        """Return the current position; raise ValueError if closed."""
        self._complain_ifclosed()
        return self.pos

    def read(self, n = -1):
        """Read up to n characters from the current position.

        A negative n (the default) or None reads up to the end of the
        file.  Returns '' at or beyond EOF; in that case the position is
        left at EOF.  Raises ValueError if closed.
        """
        self._complain_ifclosed()
        self._consolidate()
        if n is None or n < 0:
            newpos = self.len
        else:
            newpos = min(self.pos+n, self.len)
        r = self.buf[self.pos:newpos]
        self.pos = newpos
        return r

    def readline(self, length=None):
        """Read up to and including the next '\\n', or up to EOF.

        If length is given and non-negative, at most length characters
        are returned.  A negative length is treated like None (no limit)
        so that it can never move the position backwards.
        Raises ValueError if closed.
        """
        self._complain_ifclosed()
        self._consolidate()
        i = self.buf.find('\n', self.pos)
        if i < 0:
            newpos = self.len
        else:
            newpos = i+1
        if length is not None and length >= 0:
            if self.pos + length < newpos:
                newpos = self.pos + length
        r = self.buf[self.pos:newpos]
        self.pos = newpos
        return r

    def readlines(self, sizehint = 0):
        """Return a list of the remaining lines.

        When sizehint is positive, reading stops after the first line
        that brings the total number of characters read to at least
        sizehint.  The closed check is done by readline().
        """
        total = 0
        lines = []
        line = self.readline()
        while line:
            lines.append(line)
            total += len(line)
            if 0 < sizehint <= total:
                break
            line = self.readline()
        return lines

    def truncate(self, size=None):
        """Cut the file down to at most size characters.

        size defaults to the current position.  If the position lies
        beyond the new size it is moved back to size.  Raises
        IOError(EINVAL) for a negative size and ValueError if closed.
        """
        self._complain_ifclosed()
        if size is None:
            size = self.pos
        elif size < 0:
            raise IOError(EINVAL, "Negative size not allowed")
        elif size < self.pos:
            self.pos = size
        self._consolidate()
        self.buf = self.buf[:size]
        # Keep the logical length in step with the buffer; otherwise
        # seek(pos, 2) and read() would still use the pre-truncate length.
        self.len = len(self.buf)

    def write(self, s):
        """Write s at the current position and advance past it.

        An empty (false) s is ignored.  A value that is not a string or
        unicode object is converted with str().  Writing after seeking
        beyond EOF first pads the gap with null characters.  Writing
        inside existing data overwrites it.  Raises ValueError if closed.
        """
        self._complain_ifclosed()
        if not s: return
        # Force s to be a string or unicode
        if not isinstance(s, self._string_types):
            s = str(s)
        if self.pos > self.len:
            # Position is past EOF: fill the hole with real null bytes.
            self.buflist.append('\0'*(self.pos - self.len))
            self.len = self.pos
        newpos = self.pos + len(s)
        if self.pos < self.len:
            # Overwrite in the middle: splice s between the untouched
            # head and whatever tail survives beyond the written span.
            self._consolidate()
            self.buflist = [self.buf[:self.pos], s, self.buf[newpos:]]
            self.buf = ''
            if newpos > self.len:
                self.len = newpos
        else:
            # Plain append at EOF: just queue the chunk.
            self.buflist.append(s)
            self.len = newpos
        self.pos = newpos

    def writelines(self, list):
        """Write the concatenation of the strings in list."""
        self.write(''.join(list))

    def flush(self):
        """Do nothing except raise ValueError if closed."""
        self._complain_ifclosed()

    def getvalue(self):
        """Return the whole contents as one string.

        Raises ValueError if closed, consistent with the other methods
        (the buffer no longer exists after close()).
        """
        self._complain_ifclosed()
        self._consolidate()
        return self.buf
|
1994-06-23 19:53:27 +08:00
|
|
|
|
|
|
|
|
|
|
|
# A little test suite
|
|
|
|
|
|
|
|
def test():
    """Exercise StringIO against the contents of a text file.

    The file is taken from the first command-line argument, defaulting
    to '/etc/passwd'.  It must contain at least two lines, because the
    first two lines are indexed directly.  Progress is printed to
    standard output and RuntimeError is raised on the first mismatch.
    """
    import sys
    if sys.argv[1:]:
        path = sys.argv[1]
    else:
        path = '/etc/passwd'
    # Read the file both as a list of lines and as one string through a
    # single handle, and close that handle even if reading fails.
    fp = open(path, 'r')
    try:
        lines = fp.readlines()
        fp.seek(0)
        text = fp.read()
    finally:
        fp.close()
    f = StringIO()
    # Feed all but the last two lines through write(), the rest through
    # writelines(), so both entry points are covered.
    for line in lines[:-2]:
        f.write(line)
    f.writelines(lines[-2:])
    if f.getvalue() != text:
        raise RuntimeError('write failed')
    length = f.tell()
    print('File length = %s' % (length,))
    # Overwrite the second line with itself; contents must not change.
    f.seek(len(lines[0]))
    f.write(lines[1])
    f.seek(0)
    print('First line = %r' % (f.readline(),))
    print('Position = %s' % (f.tell(),))
    line = f.readline()
    print('Second line = %r' % (line,))
    # Step back over the line just read and re-read it with read().
    f.seek(-len(line), 1)
    line2 = f.read(len(line))
    if line != line2:
        raise RuntimeError('bad result after seek back')
    f.seek(len(line2), 1)
    rest = f.readlines()
    line = rest[-1]
    # Re-read the final line via an absolute seek computed from tell().
    f.seek(f.tell() - len(line))
    line2 = f.read()
    if line != line2:
        raise RuntimeError('bad result after seek back from EOF')
    print('Read %s more lines' % (len(rest),))
    print('File length = %s' % (f.tell(),))
    if f.tell() != length:
        raise RuntimeError('bad length')
    f.close()
|
1994-06-23 19:53:27 +08:00
|
|
|
|
|
|
|
# Script entry point: run the self-test when this file is executed directly.
if __name__ == "__main__":
    test()
|