Blame - Lib/_pyio.py - platform/external/python/cpython2

blob: f022a4e88b8ed7ff197b7ae82f0f8b61c20e3fc0 [file] [log] [blame]

Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	1	"""
				2	Python implementation of the io module.
				3	"""
				4
Benjamin Peterson	fed4abc	2010-04-27 21:17:22 +0000	[diff] [blame]	5	from __future__ import (print_function, unicode_literals)
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	6
				7	import os
				8	import abc
				9	import codecs
Serhiy Storchaka	c7797dc	2015-05-31 20:21:00 +0300	[diff] [blame]	10	import sys
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	11	import warnings
Antoine Pitrou	5aa7df3	2011-11-21 20:16:44 +0100	[diff] [blame]	12	import errno
Benjamin Peterson	5e9cc5e	2010-04-27 21:15:28 +0000	[diff] [blame]	13	# Import thread instead of threading to reduce startup cost
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	14	try:
				15	from thread import allocate_lock as Lock
				16	except ImportError:
				17	from dummy_thread import allocate_lock as Lock
				18
				19	import io
Benjamin Peterson	2773725	2010-04-27 21:18:30 +0000	[diff] [blame]	20	from io import (__all__, SEEK_SET, SEEK_CUR, SEEK_END)
Antoine Pitrou	6439c00	2011-02-25 21:35:47 +0000	[diff] [blame]	21	from errno import EINTR
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	22
				23	__metaclass__ = type
				24
				25	# open() uses st_blksize whenever we can
				26	DEFAULT_BUFFER_SIZE = 8 * 1024 # bytes
				27
				28	# NOTE: Base classes defined here are registered with the "official" ABCs
Benjamin Peterson	6a74a51	2015-03-18 21:35:38 -0500	[diff] [blame]	29	# defined in io.py. We don't use real inheritance though, because we don't want
				30	# to inherit the C implementations.
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	31
				32
				33	class BlockingIOError(IOError):
				34
				35	"""Exception raised when I/O would block on a non-blocking I/O stream."""
				36
				37	def __init__(self, errno, strerror, characters_written=0):
				38	super(IOError, self).__init__(errno, strerror)
				39	if not isinstance(characters_written, (int, long)):
				40	raise TypeError("characters_written must be a integer")
				41	self.characters_written = characters_written
				42
				43
def open(file, mode="r", buffering=-1,
         encoding=None, errors=None,
         newline=None, closefd=True):

    r"""Open file and return a stream. Raise IOError upon failure.

    file is either a text or byte string giving the name (and the path
    if the file isn't in the current working directory) of the file to
    be opened or an integer file descriptor of the file to be
    wrapped. (If a file descriptor is given, it is closed when the
    returned I/O object is closed, unless closefd is set to False.)

    mode is an optional string that specifies the mode in which the file
    is opened. It defaults to 'r' which means open for reading in text
    mode. Other common values are 'w' for writing (truncating the file if
    it already exists), and 'a' for appending (which on some Unix systems,
    means that all writes append to the end of the file regardless of the
    current seek position). In text mode, if encoding is not specified the
    encoding used is platform dependent. (For reading and writing raw
    bytes use binary mode and leave encoding unspecified.) The available
    modes are:

    ========= ===============================================================
    Character Meaning
    --------- ---------------------------------------------------------------
    'r'       open for reading (default)
    'w'       open for writing, truncating the file first
    'a'       open for writing, appending to the end of the file if it exists
    'b'       binary mode
    't'       text mode (default)
    '+'       open a disk file for updating (reading and writing)
    'U'       universal newline mode (for backwards compatibility; unneeded
              for new code)
    ========= ===============================================================

    The default mode is 'rt' (open for reading text). For binary random
    access, the mode 'w+b' opens and truncates the file to 0 bytes, while
    'r+b' opens the file without truncation.

    Python distinguishes between files opened in binary and text modes,
    even when the underlying operating system doesn't. Files opened in
    binary mode (appending 'b' to the mode argument) return contents as
    bytes objects without any decoding. In text mode (the default, or when
    't' is appended to the mode argument), the contents of the file are
    returned as strings, the bytes having been first decoded using a
    platform-dependent encoding or using the specified encoding if given.

    buffering is an optional integer used to set the buffering policy.
    Pass 0 to switch buffering off (only allowed in binary mode), 1 to select
    line buffering (only usable in text mode), and an integer > 1 to indicate
    the size of a fixed-size chunk buffer. When no buffering argument is
    given, the default buffering policy works as follows:

    * Binary files are buffered in fixed-size chunks; the size of the buffer
      is chosen using a heuristic trying to determine the underlying device's
      "block size" and falling back on `io.DEFAULT_BUFFER_SIZE`.
      On many systems, the buffer will typically be 4096 or 8192 bytes long.

    * "Interactive" text files (files for which isatty() returns True)
      use line buffering. Other text files use the policy described above
      for binary files.

    encoding is the name of the encoding used to decode or encode the
    file. This should only be used in text mode. The default encoding is
    platform dependent, but any encoding supported by Python can be
    passed. See the codecs module for the list of supported encodings.

    errors is an optional string that specifies how encoding errors are to
    be handled---this argument should not be used in binary mode. Pass
    'strict' to raise a ValueError exception if there is an encoding error
    (the default of None has the same effect), or pass 'ignore' to ignore
    errors. (Note that ignoring encoding errors can lead to data loss.)
    See the documentation for codecs.register for a list of the permitted
    encoding error strings.

    newline controls how universal newlines works (it only applies to text
    mode). It can be None, '', '\n', '\r', and '\r\n'. It works as
    follows:

    * On input, if newline is None, universal newlines mode is
      enabled. Lines in the input can end in '\n', '\r', or '\r\n', and
      these are translated into '\n' before being returned to the
      caller. If it is '', universal newline mode is enabled, but line
      endings are returned to the caller untranslated. If it has any of
      the other legal values, input lines are only terminated by the given
      string, and the line ending is returned to the caller untranslated.

    * On output, if newline is None, any '\n' characters written are
      translated to the system default line separator, os.linesep. If
      newline is '', no translation takes place. If newline is any of the
      other legal values, any '\n' characters written are translated to
      the given string.

    If closefd is False, the underlying file descriptor will be kept open
    when the file is closed. This does not work when a file name is given
    and must be True in that case.

    open() returns a file object whose type depends on the mode, and
    through which the standard file operations such as reading and writing
    are performed. When open() is used to open a file in a text mode ('w',
    'r', 'wt', 'rt', etc.), it returns a TextIOWrapper. When used to open
    a file in a binary mode, the returned class varies: in read binary
    mode, it returns a BufferedReader; in write binary and append binary
    modes, it returns a BufferedWriter, and in read/write mode, it returns
    a BufferedRandom.

    It is also possible to use a string or bytearray as a file for both
    reading and writing. For strings StringIO can be used like a file
    opened in a text mode, and for bytes a BytesIO can be used like a file
    opened in a binary mode.
    """
    # --- Argument type validation (order matters: first failure wins) ---
    if not isinstance(file, (basestring, int, long)):
        raise TypeError("invalid file: %r" % file)
    if not isinstance(mode, basestring):
        raise TypeError("invalid mode: %r" % mode)
    if not isinstance(buffering, (int, long)):
        raise TypeError("invalid buffering: %r" % buffering)
    if not (encoding is None or isinstance(encoding, basestring)):
        raise TypeError("invalid encoding: %r" % encoding)
    if not (errors is None or isinstance(errors, basestring)):
        raise TypeError("invalid errors: %r" % errors)

    # --- Mode string parsing ---
    flags = set(mode)
    # Reject unknown letters and repeated letters alike.
    if flags - set("arwb+tU") or len(mode) > len(flags):
        raise ValueError("invalid mode: %r" % mode)
    reading = "r" in flags
    writing = "w" in flags
    appending = "a" in flags
    updating = "+" in flags
    text_mode = "t" in flags
    binary = "b" in flags
    if "U" in flags:
        if writing or appending:
            raise ValueError("can't use U and writing mode at once")
        # 'U' on its own implies reading.
        reading = True
    if text_mode and binary:
        raise ValueError("can't have text and binary mode at once")
    if sum((reading, writing, appending)) > 1:
        raise ValueError("can't have read/write/append mode at once")
    if not any((reading, writing, appending)):
        raise ValueError("must have exactly one of read/write/append mode")
    if binary:
        if encoding is not None:
            raise ValueError("binary mode doesn't take an encoding argument")
        if errors is not None:
            raise ValueError("binary mode doesn't take an errors argument")
        if newline is not None:
            raise ValueError("binary mode doesn't take a newline argument")

    # --- Raw layer: hand FileIO only the letters it understands ---
    raw_mode = ""
    for enabled, letter in ((reading, "r"), (writing, "w"),
                            (appending, "a"), (updating, "+")):
        if enabled:
            raw_mode += letter
    raw = FileIO(file, raw_mode, closefd)

    # 'result' always names the outermost layer built so far, so that the
    # handler at the bottom closes the whole stack if anything goes wrong.
    result = raw
    try:
        line_buffering = bool(buffering == 1 or
                              (buffering < 0 and raw.isatty()))
        if line_buffering:
            buffering = -1
        if buffering < 0:
            buffering = DEFAULT_BUFFER_SIZE
            # Prefer the block size reported by fstat() when it is usable.
            try:
                block_size = os.fstat(raw.fileno()).st_blksize
            except (os.error, AttributeError):
                block_size = 0
            if block_size > 1:
                buffering = block_size
        if buffering < 0:
            raise ValueError("invalid buffering size")
        if buffering == 0:
            if not binary:
                raise ValueError("can't have unbuffered text I/O")
            return result

        # --- Buffered layer ---
        if updating:
            buffered = BufferedRandom(raw, buffering)
        elif writing or appending:
            buffered = BufferedWriter(raw, buffering)
        elif reading:
            buffered = BufferedReader(raw, buffering)
        else:
            raise ValueError("unknown mode: %r" % mode)
        result = buffered
        if binary:
            return result

        # --- Text layer ---
        wrapper = TextIOWrapper(buffered, encoding, errors, newline,
                                line_buffering)
        result = wrapper
        wrapper.mode = mode
        return result
    except:
        # Deliberately bare: close whatever was opened, then re-raise.
        result.close()
        raise
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	235
				236
				237	class DocDescriptor:
				238	"""Helper for builtins.open.__doc__
				239	"""
				240	def __get__(self, obj, typ):
				241	return (
Benjamin Peterson	ae9f8bd	2010-04-27 21:19:06 +0000	[diff] [blame]	242	"open(file, mode='r', buffering=-1, encoding=None, "
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	243	"errors=None, newline=None, closefd=True)\n\n" +
				244	open.__doc__)
				245
				246	class OpenWrapper:
				247	"""Wrapper for builtins.open
				248
				249	Trick so that open won't become a bound method when stored
				250	as a class variable (as dbm.dumb does).
				251
				252	See initstdio() in Python/pythonrun.c.
				253	"""
				254	__doc__ = DocDescriptor()
				255
				256	def __new__(cls, args, *kwargs):
				257	return open(args, *kwargs)
				258
				259
				260	class UnsupportedOperation(ValueError, IOError):
				261	pass
				262
				263
				264	class IOBase:
				265	__metaclass__ = abc.ABCMeta
				266
				267	"""The abstract base class for all I/O classes, acting on streams of
				268	bytes. There is no public constructor.
				269
				270	This class provides dummy implementations for many methods that
				271	derived classes can override selectively; the default implementations
				272	represent a file that cannot be read, written or seeked.
				273
				274	Even though IOBase does not declare read, readinto, or write because
				275	their signatures will vary, implementations and clients should
				276	consider those methods part of the interface. Also, implementations
Martin Panter	b362f75	2015-11-02 03:37:02 +0000	[diff] [blame]	277	may raise an IOError when operations they do not support are called.
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	278
				279	The basic type used for binary data read from or written to a file is
Martin Panter	c9813d8	2016-06-03 05:59:20 +0000	[diff] [blame]	280	the bytes type. Method arguments may also be bytearray or memoryview of
				281	arrays of bytes. In some cases, such as readinto, a writable object such
				282	as bytearray is required. Text I/O classes work with unicode data.
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	283
				284	Note that calling any method (even inquiries) on a closed stream is
				285	undefined. Implementations may raise IOError in this case.
				286
				287	IOBase (and its subclasses) support the iterator protocol, meaning
				288	that an IOBase object can be iterated over yielding the lines in a
				289	stream.
				290
				291	IOBase also supports the :keyword:`with` statement. In this example,
				292	fp is closed after the suite of the with statement is complete:
				293
				294	with open('spam.txt', 'r') as fp:
				295	fp.write('Spam and eggs!')
				296	"""
				297
				298	### Internal ###
				299
				300	def _unsupported(self, name):
				301	"""Internal: raise an exception for unsupported operations."""
				302	raise UnsupportedOperation("%s.%s() not supported" %
				303	(self.__class__.__name__, name))
				304
				305	### Positioning ###
				306
				307	def seek(self, pos, whence=0):
				308	"""Change stream position.
				309
Terry Jan Reedy	a70f60a	2013-03-11 17:56:17 -0400	[diff] [blame]	310	Change the stream position to byte offset pos. Argument pos is
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	311	interpreted relative to the position indicated by whence. Values
				312	for whence are:
				313
				314	* 0 -- start of stream (the default); offset should be zero or positive
				315	* 1 -- current stream position; offset may be negative
				316	* 2 -- end of stream; offset is usually negative
				317
				318	Return the new absolute position.
				319	"""
				320	self._unsupported("seek")
				321
				322	def tell(self):
				323	"""Return current stream position."""
				324	return self.seek(0, 1)
				325
				326	def truncate(self, pos=None):
				327	"""Truncate file to size bytes.
				328
				329	Size defaults to the current IO position as reported by tell(). Return
				330	the new size.
				331	"""
				332	self._unsupported("truncate")
				333
				334	### Flush and close ###
				335
				336	def flush(self):
				337	"""Flush write buffers, if applicable.
				338
				339	This is not implemented for read-only and non-blocking streams.
				340	"""
Antoine Pitrou	f7fd8e4	2010-05-03 16:25:33 +0000	[diff] [blame]	341	self._checkClosed()
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	342	# XXX Should this return the number of bytes written???
				343
				344	__closed = False
				345
				346	def close(self):
				347	"""Flush and close the IO object.
				348
				349	This method has no effect if the file is already closed.
				350	"""
				351	if not self.__closed:
Benjamin Peterson	a2d6d71	2012-12-20 12:24:10 -0600	[diff] [blame]	352	try:
				353	self.flush()
				354	finally:
				355	self.__closed = True
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	356
				357	def __del__(self):
				358	"""Destructor. Calls close()."""
				359	# The try/except block is in case this is called at program
				360	# exit time, when it's possible that globals have already been
				361	# deleted, and then the close() call might fail. Since
				362	# there's nothing we can do about such failures and they annoy
				363	# the end users, we suppress the traceback.
				364	try:
				365	self.close()
				366	except:
				367	pass
				368
				369	### Inquiries ###
				370
				371	def seekable(self):
				372	"""Return whether object supports random access.
				373
				374	If False, seek(), tell() and truncate() will raise IOError.
				375	This method may need to do a test seek().
				376	"""
				377	return False
				378
				379	def _checkSeekable(self, msg=None):
				380	"""Internal: raise an IOError if file is not seekable
				381	"""
				382	if not self.seekable():
				383	raise IOError("File or stream is not seekable."
				384	if msg is None else msg)
				385
				386
				387	def readable(self):
				388	"""Return whether object was opened for reading.
				389
				390	If False, read() will raise IOError.
				391	"""
				392	return False
				393
				394	def _checkReadable(self, msg=None):
				395	"""Internal: raise an IOError if file is not readable
				396	"""
				397	if not self.readable():
				398	raise IOError("File or stream is not readable."
				399	if msg is None else msg)
				400
				401	def writable(self):
				402	"""Return whether object was opened for writing.
				403
				404	If False, write() and truncate() will raise IOError.
				405	"""
				406	return False
				407
				408	def _checkWritable(self, msg=None):
				409	"""Internal: raise an IOError if file is not writable
				410	"""
				411	if not self.writable():
				412	raise IOError("File or stream is not writable."
				413	if msg is None else msg)
				414
				415	@property
				416	def closed(self):
				417	"""closed: bool. True iff the file has been closed.
				418
				419	For backwards compatibility, this is a property, not a predicate.
				420	"""
				421	return self.__closed
				422
				423	def _checkClosed(self, msg=None):
Serhiy Storchaka	9a118f1	2016-04-17 09:37:36 +0300	[diff] [blame]	424	"""Internal: raise a ValueError if file is closed
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	425	"""
				426	if self.closed:
				427	raise ValueError("I/O operation on closed file."
				428	if msg is None else msg)
				429
				430	### Context manager ###
				431
				432	def __enter__(self):
				433	"""Context management protocol. Returns self."""
				434	self._checkClosed()
				435	return self
				436
				437	def __exit__(self, *args):
				438	"""Context management protocol. Calls close()"""
				439	self.close()
				440
				441	### Lower-level APIs ###
				442
				443	# XXX Should these be present even if unimplemented?
				444
				445	def fileno(self):
				446	"""Returns underlying file descriptor if one exists.
				447
				448	An IOError is raised if the IO object does not use a file descriptor.
				449	"""
				450	self._unsupported("fileno")
				451
				452	def isatty(self):
				453	"""Return whether this is an 'interactive' stream.
				454
				455	Return False if it can't be determined.
				456	"""
				457	self._checkClosed()
				458	return False
				459
				460	### Readline[s] and writelines ###
				461
				462	def readline(self, limit=-1):
				463	r"""Read and return a line from the stream.
				464
				465	If limit is specified, at most limit bytes will be read.
				466
				467	The line terminator is always b'\n' for binary files; for text
				468	files, the newlines argument to open can be used to select the line
				469	terminator(s) recognized.
				470	"""
				471	# For backwards compatibility, a (slowish) readline().
				472	if hasattr(self, "peek"):
				473	def nreadahead():
				474	readahead = self.peek(1)
				475	if not readahead:
				476	return 1
				477	n = (readahead.find(b"\n") + 1) or len(readahead)
				478	if limit >= 0:
				479	n = min(n, limit)
				480	return n
				481	else:
				482	def nreadahead():
				483	return 1
				484	if limit is None:
				485	limit = -1
				486	elif not isinstance(limit, (int, long)):
				487	raise TypeError("limit must be an integer")
				488	res = bytearray()
				489	while limit < 0 or len(res) < limit:
				490	b = self.read(nreadahead())
				491	if not b:
				492	break
				493	res += b
				494	if res.endswith(b"\n"):
				495	break
				496	return bytes(res)
				497
				498	def __iter__(self):
				499	self._checkClosed()
				500	return self
				501
				502	def next(self):
				503	line = self.readline()
				504	if not line:
				505	raise StopIteration
				506	return line
				507
				508	def readlines(self, hint=None):
				509	"""Return a list of lines from the stream.
				510
				511	hint can be specified to control the number of lines read: no more
				512	lines will be read if the total size (in bytes/characters) of all
				513	lines so far exceeds hint.
				514	"""
				515	if hint is not None and not isinstance(hint, (int, long)):
				516	raise TypeError("integer or None expected")
				517	if hint is None or hint <= 0:
				518	return list(self)
				519	n = 0
				520	lines = []
				521	for line in self:
				522	lines.append(line)
				523	n += len(line)
				524	if n >= hint:
				525	break
				526	return lines
				527
				528	def writelines(self, lines):
				529	self._checkClosed()
				530	for line in lines:
				531	self.write(line)
				532
				533	io.IOBase.register(IOBase)
				534
				535
				536	class RawIOBase(IOBase):
				537
				538	"""Base class for raw binary I/O."""
				539
				540	# The read() method is implemented by calling readinto(); derived
				541	# classes that want to support read() only need to implement
				542	# readinto() as a primitive operation. In general, readinto() can be
				543	# more efficient than read().
				544
				545	# (It would be tempting to also provide an implementation of
				546	# readinto() in terms of read(), in case the latter is a more suitable
				547	# primitive operation, but that would lead to nasty recursion in case
				548	# a subclass doesn't implement either.)
				549
				550	def read(self, n=-1):
				551	"""Read and return up to n bytes.
				552
				553	Returns an empty bytes object on EOF, or None if the object is
				554	set not to block and has no data to read.
				555	"""
				556	if n is None:
				557	n = -1
				558	if n < 0:
				559	return self.readall()
				560	b = bytearray(n.__index__())
				561	n = self.readinto(b)
Antoine Pitrou	6391b34	2010-09-14 18:48:19 +0000	[diff] [blame]	562	if n is None:
				563	return None
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	564	del b[n:]
				565	return bytes(b)
				566
				567	def readall(self):
				568	"""Read until EOF, using multiple read() call."""
				569	res = bytearray()
				570	while True:
				571	data = self.read(DEFAULT_BUFFER_SIZE)
				572	if not data:
				573	break
				574	res += data
Victor Stinner	daf17e9	2011-05-25 22:52:37 +0200	[diff] [blame]	575	if res:
				576	return bytes(res)
				577	else:
				578	# b'' or None
				579	return data
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	580
				581	def readinto(self, b):
				582	"""Read up to len(b) bytes into b.
				583
				584	Returns number of bytes read (0 for EOF), or None if the object
Antoine Pitrou	6391b34	2010-09-14 18:48:19 +0000	[diff] [blame]	585	is set not to block and has no data to read.
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	586	"""
				587	self._unsupported("readinto")
				588
				589	def write(self, b):
				590	"""Write the given buffer to the IO stream.
				591
				592	Returns the number of bytes written, which may be less than len(b).
				593	"""
				594	self._unsupported("write")
				595
				596	io.RawIOBase.register(RawIOBase)
				597	from _io import FileIO
				598	RawIOBase.register(FileIO)
				599
				600
				601	class BufferedIOBase(IOBase):
				602
				603	"""Base class for buffered IO objects.
				604
				605	The main difference with RawIOBase is that the read() method
				606	supports omitting the size argument, and does not have a default
				607	implementation that defers to readinto().
				608
				609	In addition, read(), readinto() and write() may raise
				610	BlockingIOError if the underlying raw stream is in non-blocking
				611	mode and not ready; unlike their raw counterparts, they will never
				612	return None.
				613
				614	A typical implementation should not inherit from a RawIOBase
				615	implementation, but wrap one.
				616	"""
				617
				618	def read(self, n=None):
				619	"""Read and return up to n bytes.
				620
				621	If the argument is omitted, None, or negative, reads and
				622	returns all data until EOF.
				623
				624	If the argument is positive, and the underlying raw stream is
				625	not 'interactive', multiple raw reads may be issued to satisfy
				626	the byte count (unless EOF is reached first). But for
				627	interactive raw streams (XXX and for pipes?), at most one raw
				628	read will be issued, and a short result does not imply that
				629	EOF is imminent.
				630
				631	Returns an empty bytes array on EOF.
				632
				633	Raises BlockingIOError if the underlying raw stream has no
				634	data at the moment.
				635	"""
				636	self._unsupported("read")
				637
				638	def read1(self, n=None):
				639	"""Read up to n bytes with at most one read() system call."""
				640	self._unsupported("read1")
				641
				642	def readinto(self, b):
				643	"""Read up to len(b) bytes into b.
				644
				645	Like read(), this may issue multiple reads to the underlying raw
				646	stream, unless the latter is 'interactive'.
				647
				648	Returns the number of bytes read (0 for EOF).
				649
				650	Raises BlockingIOError if the underlying raw stream has no
				651	data at the moment.
				652	"""
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	653	data = self.read(len(b))
				654	n = len(data)
				655	try:
				656	b[:n] = data
				657	except TypeError as err:
				658	import array
				659	if not isinstance(b, array.array):
				660	raise err
				661	b[:n] = array.array(b'b', data)
				662	return n
				663
				664	def write(self, b):
				665	"""Write the given buffer to the IO stream.
				666
Martin Panter	c9813d8	2016-06-03 05:59:20 +0000	[diff] [blame]	667	Return the number of bytes written, which is always len(b).
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	668
				669	Raises BlockingIOError if the buffer is full and the
				670	underlying raw stream cannot accept more data at the moment.
				671	"""
				672	self._unsupported("write")
				673
				674	def detach(self):
				675	"""
				676	Separate the underlying raw stream from the buffer and return it.
				677
				678	After the raw stream has been detached, the buffer is in an unusable
				679	state.
				680	"""
				681	self._unsupported("detach")
				682
				683	io.BufferedIOBase.register(BufferedIOBase)
				684
				685
				686	class _BufferedIOMixin(BufferedIOBase):
				687
				688	"""A mixin implementation of BufferedIOBase with an underlying raw stream.
				689
				690	This passes most requests on to the underlying raw stream. It
				691	does not provide implementations of read(), readinto() or
				692	write().
				693	"""
				694
				695	def __init__(self, raw):
Antoine Pitrou	fc9ead6	2010-12-21 21:26:55 +0000	[diff] [blame]	696	self._raw = raw
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	697
				698	### Positioning ###
				699
				700	def seek(self, pos, whence=0):
				701	new_position = self.raw.seek(pos, whence)
				702	if new_position < 0:
				703	raise IOError("seek() returned an invalid position")
				704	return new_position
				705
				706	def tell(self):
				707	pos = self.raw.tell()
				708	if pos < 0:
				709	raise IOError("tell() returned an invalid position")
				710	return pos
				711
				712	def truncate(self, pos=None):
				713	# Flush the stream. We're mixing buffered I/O with lower-level I/O,
				714	# and a flush may be necessary to synch both views of the current
				715	# file state.
				716	self.flush()
				717
				718	if pos is None:
				719	pos = self.tell()
				720	# XXX: Should seek() be used, instead of passing the position
				721	# XXX directly to truncate?
				722	return self.raw.truncate(pos)
				723
				724	### Flush and close ###
				725
				726	def flush(self):
Antoine Pitrou	f7fd8e4	2010-05-03 16:25:33 +0000	[diff] [blame]	727	if self.closed:
				728	raise ValueError("flush of closed file")
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	729	self.raw.flush()
				730
				731	def close(self):
Antoine Pitrou	f7fd8e4	2010-05-03 16:25:33 +0000	[diff] [blame]	732	if self.raw is not None and not self.closed:
Antoine Pitrou	5aa7df3	2011-11-21 20:16:44 +0100	[diff] [blame]	733	try:
				734	# may raise BlockingIOError or BrokenPipeError etc
				735	self.flush()
				736	finally:
				737	self.raw.close()
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	738
				739	def detach(self):
				740	if self.raw is None:
				741	raise ValueError("raw stream already detached")
				742	self.flush()
Antoine Pitrou	fc9ead6	2010-12-21 21:26:55 +0000	[diff] [blame]	743	raw = self._raw
				744	self._raw = None
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	745	return raw
				746
				747	### Inquiries ###
				748
				749	def seekable(self):
				750	return self.raw.seekable()
				751
				752	def readable(self):
				753	return self.raw.readable()
				754
				755	def writable(self):
				756	return self.raw.writable()
				757
				758	@property
Antoine Pitrou	fc9ead6	2010-12-21 21:26:55 +0000	[diff] [blame]	759	def raw(self):
				760	return self._raw
				761
				762	@property
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	763	def closed(self):
				764	return self.raw.closed
				765
				766	@property
				767	def name(self):
				768	return self.raw.name
				769
				770	@property
				771	def mode(self):
				772	return self.raw.mode
				773
				774	def __repr__(self):
				775	clsname = self.__class__.__name__
				776	try:
				777	name = self.name
Benjamin Peterson	53ae614	2014-12-21 20:51:50 -0600	[diff] [blame]	778	except Exception:
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	779	return "<_pyio.{0}>".format(clsname)
				780	else:
				781	return "<_pyio.{0} name={1!r}>".format(clsname, name)
				782
				783	### Lower-level APIs ###
				784
				785	def fileno(self):
				786	return self.raw.fileno()
				787
    def isatty(self):
        """Return the result of isatty() on the underlying raw stream."""
        return self.raw.isatty()
				790
				791
				792	class BytesIO(BufferedIOBase):
				793
				794	"""Buffered I/O implementation using an in-memory bytes buffer."""
				795
				796	def __init__(self, initial_bytes=None):
				797	buf = bytearray()
				798	if initial_bytes is not None:
				799	buf.extend(initial_bytes)
				800	self._buffer = buf
				801	self._pos = 0
				802
Antoine Pitrou	fa94e80	2009-10-24 12:23:18 +0000	[diff] [blame]	803	def __getstate__(self):
				804	if self.closed:
				805	raise ValueError("__getstate__ on closed file")
				806	return self.__dict__.copy()
				807
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	808	def getvalue(self):
				809	"""Return the bytes value (contents) of the buffer
				810	"""
				811	if self.closed:
				812	raise ValueError("getvalue on closed file")
				813	return bytes(self._buffer)
				814
				815	def read(self, n=None):
				816	if self.closed:
				817	raise ValueError("read from closed file")
				818	if n is None:
				819	n = -1
				820	if not isinstance(n, (int, long)):
				821	raise TypeError("integer argument expected, got {0!r}".format(
				822	type(n)))
				823	if n < 0:
				824	n = len(self._buffer)
				825	if len(self._buffer) <= self._pos:
				826	return b""
				827	newpos = min(len(self._buffer), self._pos + n)
				828	b = self._buffer[self._pos : newpos]
				829	self._pos = newpos
				830	return bytes(b)
				831
				832	def read1(self, n):
				833	"""This is the same as read.
				834	"""
				835	return self.read(n)
				836
				837	def write(self, b):
				838	if self.closed:
				839	raise ValueError("write to closed file")
				840	if isinstance(b, unicode):
				841	raise TypeError("can't write unicode to binary stream")
				842	n = len(b)
				843	if n == 0:
				844	return 0
				845	pos = self._pos
				846	if pos > len(self._buffer):
				847	# Inserts null bytes between the current end of the file
				848	# and the new write position.
				849	padding = b'\x00' * (pos - len(self._buffer))
				850	self._buffer += padding
				851	self._buffer[pos:pos + n] = b
				852	self._pos += n
				853	return n
				854
				855	def seek(self, pos, whence=0):
				856	if self.closed:
				857	raise ValueError("seek on closed file")
				858	try:
Florent Xicluna	1f3b4e1	2010-03-07 12:14:25 +0000	[diff] [blame]	859	pos.__index__
				860	except AttributeError:
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	861	raise TypeError("an integer is required")
				862	if whence == 0:
				863	if pos < 0:
				864	raise ValueError("negative seek position %r" % (pos,))
				865	self._pos = pos
				866	elif whence == 1:
				867	self._pos = max(0, self._pos + pos)
				868	elif whence == 2:
				869	self._pos = max(0, len(self._buffer) + pos)
				870	else:
				871	raise ValueError("invalid whence value")
				872	return self._pos
				873
				874	def tell(self):
				875	if self.closed:
				876	raise ValueError("tell on closed file")
				877	return self._pos
				878
				879	def truncate(self, pos=None):
				880	if self.closed:
				881	raise ValueError("truncate on closed file")
				882	if pos is None:
				883	pos = self._pos
Florent Xicluna	1f3b4e1	2010-03-07 12:14:25 +0000	[diff] [blame]	884	else:
				885	try:
				886	pos.__index__
				887	except AttributeError:
				888	raise TypeError("an integer is required")
				889	if pos < 0:
				890	raise ValueError("negative truncate position %r" % (pos,))
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	891	del self._buffer[pos:]
Antoine Pitrou	f3fa074	2010-01-31 22:26:04 +0000	[diff] [blame]	892	return pos
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	893
				894	def readable(self):
Antoine Pitrou	c5eec0e	2012-09-05 20:11:49 +0200	[diff] [blame]	895	if self.closed:
				896	raise ValueError("I/O operation on closed file.")
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	897	return True
				898
				899	def writable(self):
Antoine Pitrou	c5eec0e	2012-09-05 20:11:49 +0200	[diff] [blame]	900	if self.closed:
				901	raise ValueError("I/O operation on closed file.")
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	902	return True
				903
				904	def seekable(self):
Antoine Pitrou	c5eec0e	2012-09-05 20:11:49 +0200	[diff] [blame]	905	if self.closed:
				906	raise ValueError("I/O operation on closed file.")
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	907	return True
				908
				909
class BufferedReader(_BufferedIOMixin):

    """BufferedReader(raw[, buffer_size])

    A buffer for a readable, sequential BaseRawIO object.

    The constructor creates a BufferedReader for the given readable raw
    stream and buffer_size. If buffer_size is omitted, DEFAULT_BUFFER_SIZE
    is used.
    """

    def __init__(self, raw, buffer_size=DEFAULT_BUFFER_SIZE):
        """Create a new buffered reader using the given readable raw IO object.

        Raises IOError if raw.readable() is false and ValueError if
        buffer_size is not positive.
        """
        if not raw.readable():
            raise IOError('"raw" argument must be readable.')

        _BufferedIOMixin.__init__(self, raw)
        if buffer_size <= 0:
            raise ValueError("invalid buffer size")
        self.buffer_size = buffer_size
        self._reset_read_buf()
        # Guards _read_buf/_read_pos; the *_unlocked helpers expect the
        # caller to hold it.
        self._read_lock = Lock()

    def _reset_read_buf(self):
        """Discard all buffered read data."""
        self._read_buf = b""
        self._read_pos = 0

    def read(self, n=None):
        """Read n bytes.

        Returns exactly n bytes of data unless the underlying raw IO
        stream reaches EOF or if the call would block in non-blocking
        mode. If n is negative, read until EOF or until read() would
        block.

        Raises ValueError if n is less than -1.
        """
        if n is not None and n < -1:
            raise ValueError("invalid number of bytes to read")
        with self._read_lock:
            return self._read_unlocked(n)

    def _read_unlocked(self, n=None):
        """Implementation of read(); callers in this class hold _read_lock.

        When no data at all can be returned, the result is whatever empty
        value the raw stream produced last (b"" or None), or b"" if the
        raw stream was never consulted.
        """
        nodata_val = b""
        empty_values = (b"", None)
        buf = self._read_buf
        pos = self._read_pos

        # Special case for when the number of bytes to read is unspecified.
        if n is None or n == -1:
            self._reset_read_buf()
            chunks = [buf[pos:]]  # Strip the consumed bytes.
            current_size = 0
            while True:
                # Read until EOF or until read() would block.
                try:
                    chunk = self.raw.read()
                except IOError as e:
                    # Retry the raw read when it was interrupted (EINTR).
                    if e.errno != EINTR:
                        raise
                    continue
                if chunk in empty_values:
                    nodata_val = chunk
                    break
                current_size += len(chunk)
                chunks.append(chunk)
            return b"".join(chunks) or nodata_val

        # The number of bytes to read is specified, return at most n bytes.
        avail = len(buf) - pos  # Length of the available buffered data.
        if n <= avail:
            # Fast path: the data to read is fully buffered.
            self._read_pos += n
            return buf[pos:pos+n]
        # Slow path: read from the stream until enough bytes are read,
        # or until an EOF occurs or until read() would block.
        chunks = [buf[pos:]]
        wanted = max(self.buffer_size, n)
        while avail < n:
            try:
                chunk = self.raw.read(wanted)
            except IOError as e:
                # Retry the raw read when it was interrupted (EINTR).
                if e.errno != EINTR:
                    raise
                continue
            if chunk in empty_values:
                nodata_val = chunk
                break
            avail += len(chunk)
            chunks.append(chunk)
        # n is more than avail only when an EOF occurred or when
        # read() would have blocked.
        n = min(n, avail)
        out = b"".join(chunks)
        self._read_buf = out[n:]  # Save the extra data in the buffer.
        self._read_pos = 0
        return out[:n] if out else nodata_val

    def peek(self, n=0):
        """Returns buffered bytes without advancing the position.

        The argument indicates a desired minimal number of bytes; we
        do at most one raw read to satisfy it.  We never return more
        than self.buffer_size.
        """
        with self._read_lock:
            return self._peek_unlocked(n)

    def _peek_unlocked(self, n=0):
        """Implementation of peek(); callers in this class hold _read_lock.

        Refills the buffer with one successful raw read (retried on EINTR)
        when fewer than min(n, buffer_size) bytes are buffered or the
        buffer is empty, then returns the unread part of the buffer.
        """
        want = min(n, self.buffer_size)
        have = len(self._read_buf) - self._read_pos
        if have < want or have <= 0:
            to_read = self.buffer_size - have
            while True:
                try:
                    current = self.raw.read(to_read)
                except IOError as e:
                    if e.errno != EINTR:
                        raise
                    continue
                break
            if current:
                # Drop the consumed prefix and append the new data.
                self._read_buf = self._read_buf[self._read_pos:] + current
                self._read_pos = 0
        return self._read_buf[self._read_pos:]

    def read1(self, n):
        """Reads up to n bytes, with at most one read() system call."""
        # Returns up to n bytes.  If at least one byte is buffered, we
        # only return buffered bytes.  Otherwise, we do one raw read.
        if n < 0:
            raise ValueError("number of bytes to read must be positive")
        if n == 0:
            return b""
        with self._read_lock:
            # Make sure the buffer holds something (one raw read at most),
            # then serve the request purely from the buffer.
            self._peek_unlocked(1)
            return self._read_unlocked(
                min(n, len(self._read_buf) - self._read_pos))

    def tell(self):
        """Return the mixin's tell() minus the number of buffered bytes
        that have not been consumed yet.
        """
        return _BufferedIOMixin.tell(self) - len(self._read_buf) + self._read_pos

    def seek(self, pos, whence=0):
        """Seek via the mixin and discard the read buffer.

        Raises ValueError if whence is not 0, 1 or 2.
        """
        if not (0 <= whence <= 2):
            raise ValueError("invalid whence value")
        with self._read_lock:
            if whence == 1:
                # Compensate for the unread bytes still sitting in the
                # buffer before doing a relative seek.
                pos -= len(self._read_buf) - self._read_pos
            pos = _BufferedIOMixin.seek(self, pos, whence)
            self._reset_read_buf()
            return pos
				1060
class BufferedWriter(_BufferedIOMixin):

    """A buffer for a writeable sequential RawIO object.

    The constructor creates a BufferedWriter for the given writeable raw
    stream. If the buffer_size is not given, it defaults to
    DEFAULT_BUFFER_SIZE.
    """

    # stacklevel passed to warnings.warn() for the max_buffer_size
    # deprecation warning issued in __init__.
    _warning_stack_offset = 2

    def __init__(self, raw,
                 buffer_size=DEFAULT_BUFFER_SIZE, max_buffer_size=None):
        """Create a buffered writer on top of a writable raw stream.

        Raises IOError if raw.writable() is false and ValueError if
        buffer_size is not positive.  max_buffer_size is unused apart
        from triggering a DeprecationWarning when it is not None.
        """
        if not raw.writable():
            raise IOError('"raw" argument must be writable.')

        _BufferedIOMixin.__init__(self, raw)
        if buffer_size <= 0:
            raise ValueError("invalid buffer size")
        if max_buffer_size is not None:
            warnings.warn("max_buffer_size is deprecated", DeprecationWarning,
                          self._warning_stack_offset)
        self.buffer_size = buffer_size
        self._write_buf = bytearray()
        # Guards _write_buf; _flush_unlocked is called with it held.
        self._write_lock = Lock()

    def write(self, b):
        """Append b to the write buffer and return the bytes accepted.

        The buffer is flushed to the raw stream once it grows beyond
        buffer_size.  Raises ValueError on a closed stream, TypeError for
        unicode input, and BlockingIOError (carrying the number of bytes
        accepted) when the flush cannot complete and the buffer had to be
        cut back to buffer_size.
        """
        if self.closed:
            raise ValueError("write to closed file")
        if isinstance(b, unicode):
            raise TypeError("can't write unicode to binary stream")
        with self._write_lock:
            # XXX we can implement some more tricks to try and avoid
            # partial writes
            if len(self._write_buf) > self.buffer_size:
                # We're full, so let's pre-flush the buffer.  (This may
                # raise BlockingIOError with characters_written == 0.)
                self._flush_unlocked()
            before = len(self._write_buf)
            self._write_buf.extend(b)
            written = len(self._write_buf) - before
            if len(self._write_buf) > self.buffer_size:
                try:
                    self._flush_unlocked()
                except BlockingIOError as e:
                    if len(self._write_buf) > self.buffer_size:
                        # We've hit the buffer_size. We have to accept a partial
                        # write and cut back our buffer.
                        overage = len(self._write_buf) - self.buffer_size
                        written -= overage
                        self._write_buf = self._write_buf[:self.buffer_size]
                        raise BlockingIOError(e.errno, e.strerror, written)
            return written

    def truncate(self, pos=None):
        """Flush, then truncate the raw stream at pos.

        pos defaults to the raw stream's position after the flush.
        Returns whatever raw.truncate() returns.
        """
        with self._write_lock:
            self._flush_unlocked()
            if pos is None:
                pos = self.raw.tell()
            return self.raw.truncate(pos)

    def flush(self):
        """Write the buffered data to the raw stream."""
        with self._write_lock:
            self._flush_unlocked()

    def _flush_unlocked(self):
        """Implementation of flush(); callers in this class hold _write_lock.

        Keeps calling raw.write() until the buffer is empty.  Raises
        ValueError on a closed stream, BlockingIOError when the raw
        stream returns None, IOError when it reports an impossible byte
        count, and RuntimeError when it raises BlockingIOError itself.
        """
        if self.closed:
            raise ValueError("flush of closed file")
        while self._write_buf:
            try:
                n = self.raw.write(self._write_buf)
            except BlockingIOError:
                raise RuntimeError("self.raw should implement RawIOBase: it "
                                   "should not raise BlockingIOError")
            except IOError as e:
                # Retry the raw write when it was interrupted (EINTR).
                if e.errno != EINTR:
                    raise
                continue
            if n is None:
                raise BlockingIOError(
                    errno.EAGAIN,
                    "write could not complete without blocking", 0)
            if n > len(self._write_buf) or n < 0:
                raise IOError("write() returned incorrect number of bytes")
            # Drop the bytes the raw stream accepted.
            del self._write_buf[:n]

    def tell(self):
        """Return the mixin's tell() plus the number of bytes still
        waiting in the write buffer.
        """
        return _BufferedIOMixin.tell(self) + len(self._write_buf)

    def seek(self, pos, whence=0):
        """Flush the write buffer, then seek via the mixin.

        Raises ValueError if whence is not 0, 1 or 2.
        """
        if not (0 <= whence <= 2):
            raise ValueError("invalid whence")
        with self._write_lock:
            self._flush_unlocked()
            return _BufferedIOMixin.seek(self, pos, whence)
				1156
				1157
				1158	class BufferedRWPair(BufferedIOBase):
				1159
				1160	"""A buffered reader and writer object together.
				1161
				1162	A buffered reader object and buffered writer object put together to
				1163	form a sequential IO object that can read and write. This is typically
				1164	used with a socket or two-way pipe.
				1165
				1166	reader and writer are RawIOBase objects that are readable and
				1167	writeable respectively. If the buffer_size is omitted it defaults to
				1168	DEFAULT_BUFFER_SIZE.
				1169	"""
				1170
				1171	# XXX The usefulness of this (compared to having two separate IO
				1172	# objects) is questionable.
				1173
				1174	def __init__(self, reader, writer,
				1175	buffer_size=DEFAULT_BUFFER_SIZE, max_buffer_size=None):
				1176	"""Constructor.
				1177
				1178	The arguments are two RawIO instances.
				1179	"""
				1180	if max_buffer_size is not None:
				1181	warnings.warn("max_buffer_size is deprecated", DeprecationWarning, 2)
				1182
				1183	if not reader.readable():
				1184	raise IOError('"reader" argument must be readable.')
				1185
				1186	if not writer.writable():
				1187	raise IOError('"writer" argument must be writable.')
				1188
				1189	self.reader = BufferedReader(reader, buffer_size)
				1190	self.writer = BufferedWriter(writer, buffer_size)
				1191
				1192	def read(self, n=None):
				1193	if n is None:
				1194	n = -1
				1195	return self.reader.read(n)
				1196
				1197	def readinto(self, b):
				1198	return self.reader.readinto(b)
				1199
				1200	def write(self, b):
				1201	return self.writer.write(b)
				1202
				1203	def peek(self, n=0):
				1204	return self.reader.peek(n)
				1205
				1206	def read1(self, n):
				1207	return self.reader.read1(n)
				1208
				1209	def readable(self):
				1210	return self.reader.readable()
				1211
				1212	def writable(self):
				1213	return self.writer.writable()
				1214
				1215	def flush(self):
				1216	return self.writer.flush()
				1217
				1218	def close(self):
Serhiy Storchaka	f95a57f	2015-03-24 23:23:42 +0200	[diff] [blame]	1219	try:
				1220	self.writer.close()
				1221	finally:
				1222	self.reader.close()
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	1223
				1224	def isatty(self):
				1225	return self.reader.isatty() or self.writer.isatty()
				1226
				1227	@property
				1228	def closed(self):
				1229	return self.writer.closed
				1230
				1231
class BufferedRandom(BufferedWriter, BufferedReader):

    """A buffered interface to random access streams.

    The constructor creates a reader and writer for a seekable stream,
    raw, given in the first argument. If the buffer_size is omitted it
    defaults to DEFAULT_BUFFER_SIZE.
    """

    # Overrides BufferedWriter's value; this class's __init__ adds one
    # more call frame before BufferedWriter.__init__ issues the warning.
    _warning_stack_offset = 3

    def __init__(self, raw,
                 buffer_size=DEFAULT_BUFFER_SIZE, max_buffer_size=None):
        """Initialise both the reader and the writer halves on raw.

        raw._checkSeekable() is called first.
        NOTE(review): that helper is defined outside this section and
        presumably raises when raw is not seekable - confirm.
        """
        raw._checkSeekable()
        BufferedReader.__init__(self, raw, buffer_size)
        BufferedWriter.__init__(self, raw, buffer_size, max_buffer_size)

    def seek(self, pos, whence=0):
        """Flush pending writes, undo read-ahead, and seek the raw stream.

        Raises ValueError if whence is not 0, 1 or 2 and IOError if the
        raw stream reports a negative position.
        """
        if not (0 <= whence <= 2):
            raise ValueError("invalid whence")
        self.flush()
        if self._read_buf:
            # Undo read ahead.
            with self._read_lock:
                self.raw.seek(self._read_pos - len(self._read_buf), 1)
        # First do the raw seek, then empty the read buffer, so that
        # if the raw seek fails, we don't lose buffered data forever.
        pos = self.raw.seek(pos, whence)
        with self._read_lock:
            self._reset_read_buf()
        if pos < 0:
            raise IOError("seek() returned invalid position")
        return pos

    def tell(self):
        """Return the logical position.

        Uses the writer's computation while unwritten data is buffered
        and the reader's otherwise.
        """
        if self._write_buf:
            return BufferedWriter.tell(self)
        else:
            return BufferedReader.tell(self)

    def truncate(self, pos=None):
        """Truncate at pos (default: the current logical position)."""
        if pos is None:
            pos = self.tell()
        # BufferedWriter.truncate flushes the write buffer before
        # truncating the raw stream.  No seek is performed here, so the
        # read buffer is left as it is.
        return BufferedWriter.truncate(self, pos)

    def read(self, n=None):
        """Flush pending writes, then read like BufferedReader.read()."""
        if n is None:
            n = -1
        self.flush()
        return BufferedReader.read(self, n)

    def readinto(self, b):
        """Flush pending writes, then delegate to BufferedReader.readinto()."""
        self.flush()
        return BufferedReader.readinto(self, b)

    def peek(self, n=0):
        """Flush pending writes, then delegate to BufferedReader.peek()."""
        self.flush()
        return BufferedReader.peek(self, n)

    def read1(self, n):
        """Flush pending writes, then delegate to BufferedReader.read1()."""
        self.flush()
        return BufferedReader.read1(self, n)

    def write(self, b):
        """Undo any read-ahead, then delegate to BufferedWriter.write()."""
        if self._read_buf:
            # Undo readahead
            with self._read_lock:
                # Move the raw stream back over the buffered-but-unread
                # bytes and drop them, so the write lands at the logical
                # position.
                self.raw.seek(self._read_pos - len(self._read_buf), 1)
                self._reset_read_buf()
        return BufferedWriter.write(self, b)
				1303
				1304
class TextIOBase(IOBase):

    """Base class for text I/O.

    This class provides a character and line based interface to stream
    I/O. There is no readinto method because Python's character strings
    are immutable. There is no public constructor.

    Every method below simply calls self._unsupported() with its own name.
    NOTE(review): _unsupported is defined outside this section; it
    presumably raises an "unsupported operation" error - confirm.
    """

    def read(self, n=-1):
        """Read at most n characters from stream.

        Read from underlying buffer until we have n characters or we hit EOF.
        If n is negative or omitted, read until EOF.
        """
        self._unsupported("read")

    def write(self, s):
        """Write string s to stream."""
        self._unsupported("write")

    def truncate(self, pos=None):
        """Truncate size to pos."""
        self._unsupported("truncate")

    def readline(self):
        """Read until newline or EOF.

        Returns an empty string if EOF is hit immediately.
        """
        self._unsupported("readline")

    def detach(self):
        """
        Separate the underlying buffer from the TextIOBase and return it.

        After the underlying buffer has been detached, the TextIO is in an
        unusable state.
        """
        self._unsupported("detach")

    @property
    def encoding(self):
        """Subclasses should override.  This base implementation returns None."""
        return None

    @property
    def newlines(self):
        """Line endings translated so far.

        Only line endings translated during reading are considered.

        Subclasses should override.  This base implementation returns None.
        """
        return None

    @property
    def errors(self):
        """Error setting of the decoder or encoder.

        Subclasses should override.  This base implementation returns None."""
        return None

# Register this pure-Python class as a virtual subclass of io.TextIOBase.
io.TextIOBase.register(TextIOBase)
				1369
				1370
				1371	class IncrementalNewlineDecoder(codecs.IncrementalDecoder):
				1372	r"""Codec used when reading a file in universal newlines mode. It wraps
				1373	another incremental decoder, translating \r\n and \r into \n. It also
				1374	records the types of newlines encountered. When used with
				1375	translate=False, it ensures that the newline sequence is returned in
				1376	one piece.
				1377	"""
				1378	def __init__(self, decoder, translate, errors='strict'):
				1379	codecs.IncrementalDecoder.__init__(self, errors=errors)
				1380	self.translate = translate
				1381	self.decoder = decoder
				1382	self.seennl = 0
				1383	self.pendingcr = False
				1384
				1385	def decode(self, input, final=False):
				1386	# decode input (with the eventual \r from a previous pass)
				1387	if self.decoder is None:
				1388	output = input
				1389	else:
				1390	output = self.decoder.decode(input, final=final)
				1391	if self.pendingcr and (output or final):
				1392	output = "\r" + output
				1393	self.pendingcr = False
				1394
				1395	# retain last \r even when not translating data:
				1396	# then readline() is sure to get \r\n in one pass
				1397	if output.endswith("\r") and not final:
				1398	output = output[:-1]
				1399	self.pendingcr = True
				1400
				1401	# Record which newlines are read
				1402	crlf = output.count('\r\n')
				1403	cr = output.count('\r') - crlf
				1404	lf = output.count('\n') - crlf
				1405	self.seennl \|= (lf and self._LF) \| (cr and self._CR) \
				1406	\| (crlf and self._CRLF)
				1407
				1408	if self.translate:
				1409	if crlf:
				1410	output = output.replace("\r\n", "\n")
				1411	if cr:
				1412	output = output.replace("\r", "\n")
				1413
				1414	return output
				1415
				1416	def getstate(self):
				1417	if self.decoder is None:
				1418	buf = b""
				1419	flag = 0
				1420	else:
				1421	buf, flag = self.decoder.getstate()
				1422	flag <<= 1
				1423	if self.pendingcr:
				1424	flag \|= 1
				1425	return buf, flag
				1426
				1427	def setstate(self, state):
				1428	buf, flag = state
				1429	self.pendingcr = bool(flag & 1)
				1430	if self.decoder is not None:
				1431	self.decoder.setstate((buf, flag >> 1))
				1432
				1433	def reset(self):
				1434	self.seennl = 0
				1435	self.pendingcr = False
				1436	if self.decoder is not None:
				1437	self.decoder.reset()
				1438
				1439	_LF = 1
				1440	_CR = 2
				1441	_CRLF = 4
				1442
				1443	@property
				1444	def newlines(self):
				1445	return (None,
				1446	"\n",
				1447	"\r",
				1448	("\r", "\n"),
				1449	"\r\n",
				1450	("\n", "\r\n"),
				1451	("\r", "\r\n"),
				1452	("\r", "\n", "\r\n")
				1453	)[self.seennl]
				1454
				1455
				1456	class TextIOWrapper(TextIOBase):
				1457
				1458	r"""Character and line based layer over a BufferedIOBase object, buffer.
				1459
				1460	encoding gives the name of the encoding that the stream will be
				1461	decoded or encoded with. It defaults to locale.getpreferredencoding.
				1462
				1463	errors determines the strictness of encoding and decoding (see the
				1464	codecs.register) and defaults to "strict".
				1465
				1466	newline can be None, '', '\n', '\r', or '\r\n'. It controls the
				1467	handling of line endings. If it is None, universal newlines is
				1468	enabled. With this enabled, on input, the lines endings '\n', '\r',
				1469	or '\r\n' are translated to '\n' before being returned to the
				1470	caller. Conversely, on output, '\n' is translated to the system
Éric Araujo	7f4b3be	2012-02-26 01:41:39 +0100	[diff] [blame]	1471	default line separator, os.linesep. If newline is any other of its
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	1472	legal values, that newline becomes the newline when the file is read
				1473	and it is returned untranslated. On output, '\n' is converted to the
				1474	newline.
				1475
				1476	If line_buffering is True, a call to flush is implied when a call to
				1477	write contains a newline character.
				1478	"""
				1479
				1480	_CHUNK_SIZE = 2048
				1481
    def __init__(self, buffer, encoding=None, errors=None, newline=None,
                 line_buffering=False):
        """Wrap the binary stream *buffer* in a text layer.

        encoding defaults to locale.getpreferredencoding() (or "ascii"
        when the locale module cannot be imported); errors defaults to
        "strict".  newline must be None, '', '\\n', '\\r' or '\\r\\n'.

        Raises TypeError for a non-string newline, and ValueError for an
        illegal newline value or a non-string encoding or errors.
        """
        if newline is not None and not isinstance(newline, basestring):
            raise TypeError("illegal newline type: %r" % (type(newline),))
        if newline not in (None, "", "\n", "\r", "\r\n"):
            raise ValueError("illegal newline value: %r" % (newline,))
        if encoding is None:
            try:
                import locale
            except ImportError:
                # Importing locale may fail if Python is being built
                encoding = "ascii"
            else:
                encoding = locale.getpreferredencoding()

        if not isinstance(encoding, basestring):
            # Wrap in a 1-tuple so that a tuple value is formatted as a
            # whole instead of being unpacked as the % arguments.
            raise ValueError("invalid encoding: %r" % (encoding,))

        if sys.py3kwarning and not codecs.lookup(encoding)._is_text_encoding:
            msg = ("%r is not a text encoding; "
                   "use codecs.open() to handle arbitrary codecs")
            warnings.warnpy3k(msg % encoding, stacklevel=2)

        if errors is None:
            errors = "strict"
        else:
            if not isinstance(errors, basestring):
                # Same 1-tuple wrapping as for encoding above.
                raise ValueError("invalid errors: %r" % (errors,))

        self._buffer = buffer
        self._line_buffering = line_buffering
        self._encoding = encoding
        self._errors = errors
        self._readuniversal = not newline
        self._readtranslate = newline is None
        self._readnl = newline
        self._writetranslate = newline != ''
        self._writenl = newline or os.linesep
        self._encoder = None
        self._decoder = None
        self._decoded_chars = ''  # buffer for text returned from decoder
        self._decoded_chars_used = 0  # offset into _decoded_chars for read()
        self._snapshot = None  # info for reconstructing decoder state
        self._seekable = self._telling = self.buffer.seekable()

        if self._seekable and self.writable():
            position = self.buffer.tell()
            if position != 0:
                # The stream is not at its start: create the encoder now
                # and put it into state 0.
                try:
                    self._get_encoder().setstate(0)
                except LookupError:
                    # Sometimes the encoder doesn't exist
                    pass
				1535
				1536	# self._snapshot is either None, or a tuple (dec_flags, next_input)
				1537	# where dec_flags is the second (integer) item of the decoder state
				1538	# and next_input is the chunk of input bytes that comes next after the
				1539	# snapshot point. We use this to reconstruct decoder states in tell().
				1540
				1541	# Naming convention:
				1542	# - "bytes_..." for integer variables that count input bytes
				1543	# - "chars_..." for integer variables that count decoded characters
				1544
    def __repr__(self):
        """Return a description with the encoding and, when ``self.name``
        can be read without raising, the name.
        """
        try:
            stream_name = self.name
        except Exception:
            return "<_pyio.TextIOWrapper encoding='{0}'>".format(self.encoding)
        return "<_pyio.TextIOWrapper name={0!r} encoding='{1}'>".format(
            stream_name, self.encoding)
				1553
    @property
    def encoding(self):
        """The encoding name stored by the constructor."""
        return self._encoding
				1557
    @property
    def errors(self):
        """The error-handling setting stored by the constructor."""
        return self._errors
				1561
    @property
    def line_buffering(self):
        """The line_buffering flag stored by the constructor."""
        return self._line_buffering
				1565
    @property
    def buffer(self):
        """The underlying binary stream passed to the constructor."""
        return self._buffer
				1569
    def seekable(self):
        """Return the seekability recorded at construction time.

        Raises ValueError on a closed stream.
        """
        if self.closed:
            raise ValueError("I/O operation on closed file.")
        return self._seekable
				1574
    def readable(self):
        """Return the result of readable() on the underlying buffer."""
        return self.buffer.readable()
				1577
    def writable(self):
        """Return the result of writable() on the underlying buffer."""
        return self.buffer.writable()
				1580
    def flush(self):
        """Flush the underlying buffer and reset the tell() tracking flag."""
        self.buffer.flush()
        # _telling is set back to the seekability recorded in __init__.
        # NOTE(review): presumably re-enables tell() after code elsewhere
        # switched it off - confirm against the rest of the class.
        self._telling = self._seekable
				1584
    def close(self):
        """Flush, then close the underlying buffer.

        Does nothing when the buffer is None or the stream is already
        closed.  The buffer is closed even when flush() raises.
        """
        if self.buffer is None or self.closed:
            return
        try:
            self.flush()
        finally:
            self.buffer.close()
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	1591
    @property
    def closed(self):
        """The ``closed`` attribute of the underlying buffer."""
        return self.buffer.closed
				1595
    @property
    def name(self):
        """The ``name`` attribute of the underlying buffer."""
        return self.buffer.name
				1599
    def fileno(self):
        """Return the result of fileno() on the underlying buffer."""
        return self.buffer.fileno()
				1602
    def isatty(self):
        """Return the result of isatty() on the underlying buffer."""
        return self.buffer.isatty()
				1605
    def write(self, s):
        """Encode the unicode string s, write it to the buffer, and return
        the number of characters in s as passed in.

        "\n" is replaced by the configured output newline when write
        translation is on.  With line buffering, the stream is flushed
        when the written text contains a newline or "\r".  Raises
        ValueError on a closed stream and TypeError for non-unicode input.
        """
        if self.closed:
            raise ValueError("write to closed file")
        if not isinstance(s, unicode):
            raise TypeError("can't write %s to text stream" %
                            s.__class__.__name__)
        char_count = len(s)
        # Only scan for "\n" when the answer is going to be used.
        wants_scan = self._writetranslate or self._line_buffering
        has_newline = wants_scan and "\n" in s
        if has_newline and self._writetranslate and self._writenl != "\n":
            s = s.replace("\n", self._writenl)
        encoder = self._encoder
        if not encoder:
            encoder = self._get_encoder()
        # XXX What if we were just reading?
        self.buffer.write(encoder.encode(s))
        if self._line_buffering and (has_newline or "\r" in s):
            self.flush()
        # Writing invalidates the read-side snapshot and decoder state.
        self._snapshot = None
        if self._decoder:
            self._decoder.reset()
        return char_count
				1626
    def _get_encoder(self):
        """Create, store and return an incremental encoder for this
        stream's encoding and error setting.
        """
        encoder_factory = codecs.getincrementalencoder(self._encoding)
        self._encoder = encoder_factory(self._errors)
        return self._encoder
				1631
    def _get_decoder(self):
        """Create, store and return an incremental decoder for this
        stream's encoding, wrapped in an IncrementalNewlineDecoder when
        universal-newline reading is enabled.
        """
        decoder_factory = codecs.getincrementaldecoder(self._encoding)
        new_decoder = decoder_factory(self._errors)
        if self._readuniversal:
            new_decoder = IncrementalNewlineDecoder(new_decoder,
                                                    self._readtranslate)
        self._decoder = new_decoder
        return new_decoder
				1639
				1640	# The following three methods implement an ADT for _decoded_chars.
				1641	# Text returned from the decoder is buffered here until the client
				1642	# requests it by calling our read() or readline() method.
    def _set_decoded_chars(self, chars):
        """Replace the decoded-text buffer and rewind its read offset to 0."""
        self._decoded_chars, self._decoded_chars_used = chars, 0
				1647
    def _get_decoded_chars(self, n=None):
        """Consume and return up to n characters of decoded text.

        With n=None everything that is left in the buffer is returned.
        """
        start = self._decoded_chars_used
        stop = None if n is None else start + n
        taken = self._decoded_chars[start:stop]
        self._decoded_chars_used += len(taken)
        return taken
				1657
				1658	def _rewind_decoded_chars(self, n):
				1659	"""Rewind the _decoded_chars buffer."""
				1660	if self._decoded_chars_used < n:
				1661	raise AssertionError("rewind decoded_chars out of bounds")
				1662	self._decoded_chars_used -= n
				1663
				1664	def _read_chunk(self):
				1665	"""
				1666	Read and decode the next chunk of data from the BufferedReader.
				1667	"""
				1668
				1669	# The return value is True unless EOF was reached. The decoded
				1670	# string is placed in self._decoded_chars (replacing its previous
				1671	# value). The entire input chunk is sent to the decoder, though
				1672	# some of it may remain buffered in the decoder, yet to be
				1673	# converted.
				1674
				1675	if self._decoder is None:
				1676	raise ValueError("no decoder")
				1677
				1678	if self._telling:
				1679	# To prepare for tell(), we need to snapshot a point in the
				1680	# file where the decoder's input buffer is empty.
				1681
				1682	dec_buffer, dec_flags = self._decoder.getstate()
				1683	# Given this, we know there was a valid snapshot point
				1684	# len(dec_buffer) bytes ago with decoder state (b'', dec_flags).
				1685
				1686	# Read a chunk, decode it, and put the result in self._decoded_chars.
				1687	input_chunk = self.buffer.read1(self._CHUNK_SIZE)
				1688	eof = not input_chunk
				1689	self._set_decoded_chars(self._decoder.decode(input_chunk, eof))
				1690
				1691	if self._telling:
				1692	# At the snapshot point, len(dec_buffer) bytes before the read,
				1693	# the next input to be decoded is dec_buffer + input_chunk.
				1694	self._snapshot = (dec_flags, dec_buffer + input_chunk)
				1695
				1696	return not eof
				1697
				1698	def _pack_cookie(self, position, dec_flags=0,
				1699	bytes_to_feed=0, need_eof=0, chars_to_skip=0):
				1700	# The meaning of a tell() cookie is: seek to position, set the
				1701	# decoder flags to dec_flags, read bytes_to_feed bytes, feed them
				1702	# into the decoder with need_eof as the EOF flag, then skip
				1703	# chars_to_skip characters of the decoded result. For most simple
				1704	# decoders, tell() will often just give a byte offset in the file.
				1705	return (position \| (dec_flags<<64) \| (bytes_to_feed<<128) \|
				1706	(chars_to_skip<<192) \| bool(need_eof)<<256)
				1707
				1708	def _unpack_cookie(self, bigint):
				1709	rest, position = divmod(bigint, 1<<64)
				1710	rest, dec_flags = divmod(rest, 1<<64)
				1711	rest, bytes_to_feed = divmod(rest, 1<<64)
				1712	need_eof, chars_to_skip = divmod(rest, 1<<64)
				1713	return position, dec_flags, bytes_to_feed, need_eof, chars_to_skip
				1714
    def tell(self):
        """Return a cookie describing the current logical stream position.

        When there is no decoder or no snapshot, the underlying buffer's
        byte position is returned as is.  Otherwise the result is built by
        _pack_cookie() from a "safe start point" (a byte position where the
        decoder has nothing buffered) plus the number of bytes to feed and
        characters to skip from there.

        Raises IOError if the stream is not seekable, if telling is
        currently disabled, or if the position cannot be reconstructed.
        Raises AssertionError if decoded text is pending without a snapshot.
        """
        if not self._seekable:
            raise IOError("underlying stream is not seekable")
        if not self._telling:
            raise IOError("telling position disabled by next() call")
        self.flush()
        position = self.buffer.tell()
        decoder = self._decoder
        if decoder is None or self._snapshot is None:
            if self._decoded_chars:
                # This should never happen.
                raise AssertionError("pending decoded text")
            return position

        # Skip backward to the snapshot point (see _read_chunk).
        dec_flags, next_input = self._snapshot
        position -= len(next_input)

        # How many decoded characters have been used up since the snapshot?
        chars_to_skip = self._decoded_chars_used
        if chars_to_skip == 0:
            # We haven't moved from the snapshot point.
            return self._pack_cookie(position, dec_flags)

        # Starting from the snapshot position, we will walk the decoder
        # forward until it gives us enough decoded characters.
        # The decoder's real state is saved here and restored in the
        # finally clause, so the replay below does not disturb reading.
        saved_state = decoder.getstate()
        try:
            # Note our initial start point.
            decoder.setstate((b'', dec_flags))
            start_pos = position
            start_flags, bytes_fed, chars_decoded = dec_flags, 0, 0
            need_eof = 0

            # Feed the decoder one byte at a time.  As we go, note the
            # nearest "safe start point" before the current location
            # (a point where the decoder has nothing buffered, so seek()
            # can safely start from there and advance to this location).
            for next_byte in next_input:
                bytes_fed += 1
                chars_decoded += len(decoder.decode(next_byte))
                dec_buffer, dec_flags = decoder.getstate()
                if not dec_buffer and chars_decoded <= chars_to_skip:
                    # Decoder buffer is empty, so this is a safe start point.
                    # Counters become relative to this new start point.
                    start_pos += bytes_fed
                    chars_to_skip -= chars_decoded
                    start_flags, bytes_fed, chars_decoded = dec_flags, 0, 0
                if chars_decoded >= chars_to_skip:
                    break
            else:
                # Reached only when the loop ran out of input without break.
                # We didn't get enough decoded data; signal EOF to get more.
                chars_decoded += len(decoder.decode(b'', final=True))
                need_eof = 1
                if chars_decoded < chars_to_skip:
                    raise IOError("can't reconstruct logical file position")

            # The returned cookie corresponds to the last safe start point.
            return self._pack_cookie(
                start_pos, start_flags, bytes_fed, need_eof, chars_to_skip)
        finally:
            decoder.setstate(saved_state)
				1776
    def truncate(self, pos=None):
        """Flush, then truncate the underlying buffer at *pos*.

        When *pos* is None the value of self.tell() is used.  Returns
        whatever the buffer's truncate() returns.
        """
        self.flush()
        size = self.tell() if pos is None else pos
        return self.buffer.truncate(size)
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	1782
    def detach(self):
        """Flush, disconnect the underlying buffer, and return it.

        Afterwards self._buffer is None.  Raises ValueError if the buffer
        has already been detached.
        """
        if self.buffer is None:
            raise ValueError("buffer is already detached")
        self.flush()
        detached, self._buffer = self._buffer, None
        return detached
				1790
    def seek(self, cookie, whence=0):
        """Reposition the stream.

        whence=0: *cookie* is 0 or a value previously returned by tell();
        the stream is restored to that logical position and *cookie* is
        returned.
        whence=1: only cookie == 0 is accepted; it is treated as a seek to
        self.tell().
        whence=2: only cookie == 0 is accepted; the buffer is moved to its
        end and the position reported by the buffer is returned.

        Raises ValueError if the stream is closed, *whence* is invalid or
        *cookie* is negative.  Raises IOError if the stream is not
        seekable, for nonzero relative seeks, or if the logical position
        cannot be restored.
        """
        if self.closed:
            raise ValueError("seek on closed file")
        if not self._seekable:
            raise IOError("underlying stream is not seekable")
        if whence == 1: # seek relative to current position
            if cookie != 0:
                raise IOError("can't do nonzero cur-relative seeks")
            # Seeking to the current position should attempt to
            # sync the underlying buffer with the current position.
            whence = 0
            cookie = self.tell()
        if whence == 2: # seek relative to end of file
            if cookie != 0:
                raise IOError("can't do nonzero end-relative seeks")
            self.flush()
            position = self.buffer.seek(0, 2)
            self._set_decoded_chars('')
            self._snapshot = None
            if self._decoder:
                self._decoder.reset()
            return position
        if whence != 0:
            raise ValueError("invalid whence (%r, should be 0, 1 or 2)" %
                             (whence,))
        if cookie < 0:
            raise ValueError("negative seek position %r" % (cookie,))
        self.flush()

        # The strategy of seek() is to go back to the safe start point
        # and replay the effect of read(chars_to_skip) from there.
        start_pos, dec_flags, bytes_to_feed, need_eof, chars_to_skip = \
            self._unpack_cookie(cookie)

        # Seek back to the safe start point.
        self.buffer.seek(start_pos)
        self._set_decoded_chars('')
        self._snapshot = None

        # Restore the decoder to its state from the safe start point.
        if cookie == 0 and self._decoder:
            self._decoder.reset()
        elif self._decoder or dec_flags or chars_to_skip:
            self._decoder = self._decoder or self._get_decoder()
            self._decoder.setstate((b'', dec_flags))
            self._snapshot = (dec_flags, b'')

        if chars_to_skip:
            # Just like _read_chunk, feed the decoder and save a snapshot.
            input_chunk = self.buffer.read(bytes_to_feed)
            self._set_decoded_chars(
                self._decoder.decode(input_chunk, need_eof))
            self._snapshot = (dec_flags, input_chunk)

            # Skip chars_to_skip of the decoded characters.
            if len(self._decoded_chars) < chars_to_skip:
                raise IOError("can't restore logical file position")
            self._decoded_chars_used = chars_to_skip

        # Finally, reset the encoder (merely useful for proper BOM handling)
        try:
            encoder = self._encoder or self._get_encoder()
        except LookupError:
            # Sometimes the encoder doesn't exist
            pass
        else:
            if cookie != 0:
                encoder.setstate(0)
            else:
                encoder.reset()
        return cookie
				1862
    def read(self, n=None):
        """Read and return decoded text.

        With n None or negative, everything up to EOF is returned and the
        decoded-chars buffer and snapshot are cleared.  Otherwise chunks
        are read until *n* characters are available or EOF is reached.
        Raises TypeError if *n* has no __index__ attribute.
        """
        self._checkReadable()
        if n is None:
            n = -1
        decoder = self._decoder or self._get_decoder()
        try:
            n.__index__
        except AttributeError:
            raise TypeError("an integer is required")

        if n < 0:
            # Read everything: pending text first, then the rest of the
            # buffer pushed through the decoder with final=True.
            pending = self._get_decoded_chars()
            remainder = decoder.decode(self.buffer.read(), final=True)
            self._set_decoded_chars('')
            self._snapshot = None
            return pending + remainder

        # Keep pulling chunks until n characters are collected or EOF.
        text = self._get_decoded_chars(n)
        while len(text) < n:
            at_eof = not self._read_chunk()
            text += self._get_decoded_chars(n - len(text))
            if at_eof:
                break
        return text
				1887
    def next(self):
        """Return the next line, raising StopIteration at end of input.

        Telling is switched off while iterating.  When readline() returns
        an empty result, the snapshot is dropped and _telling is set back
        to the value of _seekable before StopIteration is raised.
        """
        self._telling = False
        line = self.readline()
        if line:
            return line
        self._snapshot = None
        self._telling = self._seekable
        raise StopIteration
				1896
    def readline(self, limit=None):
        """Read and return one line of decoded text.

        The line ends after the first line terminator found, where the
        terminator searched for depends on _readtranslate, _readuniversal
        and _readnl.  A non-negative *limit* caps the number of characters
        returned.  At end of file the text collected so far is returned.

        Raises ValueError if the stream is closed and TypeError if *limit*
        is neither None nor an integer.
        """
        if self.closed:
            raise ValueError("read from closed file")
        if limit is None:
            limit = -1
        elif not isinstance(limit, (int, long)):
            raise TypeError("limit must be an integer")

        # Grab all the decoded text (we will rewind any extra bits later).
        line = self._get_decoded_chars()

        # Index in line from which the next terminator search begins, so
        # text that was already scanned is not searched again.
        start = 0
        # Make the decoder if it doesn't already exist.
        if not self._decoder:
            self._get_decoder()

        pos = endpos = None
        while True:
            if self._readtranslate:
                # Newlines are already translated, only search for \n
                pos = line.find('\n', start)
                if pos >= 0:
                    endpos = pos + 1
                    break
                else:
                    start = len(line)

            elif self._readuniversal:
                # Universal newline search. Find any of \r, \r\n, \n
                # The decoder ensures that \r\n are not split in two pieces

                # In C we'd look for these in parallel of course.
                nlpos = line.find("\n", start)
                crpos = line.find("\r", start)
                if crpos == -1:
                    if nlpos == -1:
                        # Nothing found
                        start = len(line)
                    else:
                        # Found \n
                        endpos = nlpos + 1
                        break
                elif nlpos == -1:
                    # Found lone \r
                    endpos = crpos + 1
                    break
                elif nlpos < crpos:
                    # Found \n
                    endpos = nlpos + 1
                    break
                elif nlpos == crpos + 1:
                    # Found \r\n
                    endpos = crpos + 2
                    break
                else:
                    # Found \r
                    endpos = crpos + 1
                    break
            else:
                # non-universal
                pos = line.find(self._readnl)
                if pos >= 0:
                    endpos = pos + len(self._readnl)
                    break

            if limit >= 0 and len(line) >= limit:
                endpos = limit # reached length limit
                break

            # No line ending seen yet - get more data.
            # Keep reading chunks until one yields decoded text or
            # _read_chunk() reports EOF.
            while self._read_chunk():
                if self._decoded_chars:
                    break
            if self._decoded_chars:
                line += self._get_decoded_chars()
            else:
                # end of file
                self._set_decoded_chars('')
                self._snapshot = None
                return line

        if limit >= 0 and endpos > limit:
            endpos = limit # don't exceed limit

        # Rewind _decoded_chars to just after the line ending we found.
        self._rewind_decoded_chars(len(line) - endpos)
        return line[:endpos]
				1984
    @property
    def newlines(self):
        """The decoder's `newlines` attribute, or None when no decoder is set."""
        if self._decoder:
            return self._decoder.newlines
        return None
				1988
				1989
				1990	class StringIO(TextIOWrapper):
				1991	"""Text I/O implementation using an in-memory buffer.
				1992
				1993	The initial_value argument sets the value of object. The newline
				1994	argument is like the one of TextIOWrapper's constructor.
				1995	"""
				1996
				1997	def __init__(self, initial_value="", newline="\n"):
				1998	super(StringIO, self).__init__(BytesIO(),
				1999	encoding="utf-8",
				2000	errors="strict",
				2001	newline=newline)
				2002	# Issue #5645: make universal newlines semantics the same as in the
				2003	# C version, even under Windows.
				2004	if newline is None:
				2005	self._writetranslate = False
				2006	if initial_value:
				2007	if not isinstance(initial_value, unicode):
				2008	initial_value = unicode(initial_value)
				2009	self.write(initial_value)
				2010	self.seek(0)
				2011
				2012	def getvalue(self):
				2013	self.flush()
Antoine Pitrou	c06634a	2014-02-02 23:37:29 +0100	[diff] [blame]	2014	decoder = self._decoder or self._get_decoder()
				2015	old_state = decoder.getstate()
				2016	decoder.reset()
				2017	try:
				2018	return decoder.decode(self.buffer.getvalue(), final=True)
				2019	finally:
				2020	decoder.setstate(old_state)
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	2021
				2022	def __repr__(self):
				2023	# TextIOWrapper tells the encoding in its repr. In StringIO,
Serhiy Storchaka	9a118f1	2016-04-17 09:37:36 +0300	[diff] [blame]	2024	# that's an implementation detail.
Antoine Pitrou	1969059	2009-06-12 20:14:08 +0000	[diff] [blame]	2025	return object.__repr__(self)
				2026
				2027	@property
				2028	def errors(self):
				2029	return None
				2030
				2031	@property
				2032	def encoding(self):
				2033	return None
				2034
				2035	def detach(self):
				2036	# This doesn't make sense on StringIO.
				2037	self._unsupported("detach")