blob: b4abac582ac8bbf2e5e0ad99055c16b0a1e1984e [file] [log] [blame]
/* File object implementation (what's left of it -- see io.py) */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002
Martin v. Löwis18e16552006-02-15 17:27:45 +00003#define PY_SSIZE_T_CLEAN
Guido van Rossumc0b618a1997-05-02 03:12:38 +00004#include "Python.h"
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00005
/* Character-input and stream-locking primitives.
   GETC(f) reads one character from f; FLOCKFILE(f)/FUNLOCKFILE(f) are
   meant to bracket a run of GETC() calls.  Without getc_unlocked() the
   plain getc() is used and the lock macros expand to nothing. */
#ifndef HAVE_GETC_UNLOCKED
#  define GETC(f)        getc(f)
#  define FLOCKFILE(f)
#  define FUNLOCKFILE(f)
#else
#  define GETC(f)        getc_unlocked(f)
#  define FLOCKFILE(f)   flockfile(f)
#  define FUNLOCKFILE(f) funlockfile(f)
#endif
15
/* Newline flags: one distinct bit per newline convention seen */
#define NEWLINE_UNKNOWN 0x0     /* No newline seen, yet */
#define NEWLINE_CR      0x1     /* \r newline seen */
#define NEWLINE_LF      0x2     /* \n newline seen */
#define NEWLINE_CRLF    0x4     /* \r\n newline seen */
Trent Mickf29f47b2000-08-11 19:02:59 +000021
Thomas Wouters49fd7fa2006-04-21 10:40:58 +000022#ifdef __cplusplus
23extern "C" {
24#endif
25
/* External C interface */
Tim Peters59c9a642001-09-13 05:38:56 +000027
28PyObject *
Guido van Rossum40d20bc2007-10-22 00:09:51 +000029PyFile_FromFd(int fd, char *name, char *mode, int buffering, char *encoding,
30 char *newline)
Tim Peters59c9a642001-09-13 05:38:56 +000031{
Guido van Rossum40d20bc2007-10-22 00:09:51 +000032 PyObject *io, *stream, *nameobj = NULL;
Guido van Rossum53970392007-06-12 00:28:30 +000033
34 io = PyImport_ImportModule("io");
35 if (io == NULL)
36 return NULL;
Guido van Rossum40d20bc2007-10-22 00:09:51 +000037 stream = PyObject_CallMethod(io, "open", "isiss", fd, mode,
38 buffering, encoding, newline);
Guido van Rossumce3a72a2007-10-19 23:16:50 +000039 Py_DECREF(io);
Guido van Rossumda5b8f22007-06-12 23:30:11 +000040 if (stream == NULL)
Guido van Rossum53970392007-06-12 00:28:30 +000041 return NULL;
Guido van Rossumce3a72a2007-10-19 23:16:50 +000042 if (name != NULL) {
43 nameobj = PyUnicode_FromString(name);
44 if (nameobj == NULL)
Guido van Rossumda5b8f22007-06-12 23:30:11 +000045 PyErr_Clear();
Guido van Rossumce3a72a2007-10-19 23:16:50 +000046 else {
47 if (PyObject_SetAttrString(stream, "name", nameobj) < 0)
48 PyErr_Clear();
49 Py_DECREF(nameobj);
50 }
Tim Peters59c9a642001-09-13 05:38:56 +000051 }
Guido van Rossum53970392007-06-12 00:28:30 +000052 return stream;
Tim Peters59c9a642001-09-13 05:38:56 +000053}
54
55PyObject *
Fred Drakefd99de62000-07-09 05:02:18 +000056PyFile_GetLine(PyObject *f, int n)
Guido van Rossum0bd24411991-04-04 15:21:57 +000057{
Guido van Rossum4ddf0a02001-01-07 20:51:39 +000058 PyObject *result;
59
Guido van Rossum3165fe61992-09-25 21:59:05 +000060 if (f == NULL) {
Guido van Rossumc0b618a1997-05-02 03:12:38 +000061 PyErr_BadInternalCall();
Guido van Rossum0bd24411991-04-04 15:21:57 +000062 return NULL;
63 }
Guido van Rossum4ddf0a02001-01-07 20:51:39 +000064
Guido van Rossumda5b8f22007-06-12 23:30:11 +000065 {
Guido van Rossumc0b618a1997-05-02 03:12:38 +000066 PyObject *reader;
67 PyObject *args;
Guido van Rossum4ddf0a02001-01-07 20:51:39 +000068
Guido van Rossumc0b618a1997-05-02 03:12:38 +000069 reader = PyObject_GetAttrString(f, "readline");
Guido van Rossum3165fe61992-09-25 21:59:05 +000070 if (reader == NULL)
71 return NULL;
72 if (n <= 0)
Raymond Hettinger8ae46892003-10-12 19:09:37 +000073 args = PyTuple_New(0);
Guido van Rossum3165fe61992-09-25 21:59:05 +000074 else
Guido van Rossumc0b618a1997-05-02 03:12:38 +000075 args = Py_BuildValue("(i)", n);
Guido van Rossum3165fe61992-09-25 21:59:05 +000076 if (args == NULL) {
Guido van Rossumc0b618a1997-05-02 03:12:38 +000077 Py_DECREF(reader);
Guido van Rossum3165fe61992-09-25 21:59:05 +000078 return NULL;
79 }
Guido van Rossumc0b618a1997-05-02 03:12:38 +000080 result = PyEval_CallObject(reader, args);
81 Py_DECREF(reader);
82 Py_DECREF(args);
Martin v. Löwisaf6a27a2003-01-03 19:16:14 +000083 if (result != NULL && !PyString_Check(result) &&
84 !PyUnicode_Check(result)) {
Guido van Rossumc0b618a1997-05-02 03:12:38 +000085 Py_DECREF(result);
Guido van Rossum3165fe61992-09-25 21:59:05 +000086 result = NULL;
Guido van Rossumc0b618a1997-05-02 03:12:38 +000087 PyErr_SetString(PyExc_TypeError,
Guido van Rossum3165fe61992-09-25 21:59:05 +000088 "object.readline() returned non-string");
89 }
Guido van Rossum4ddf0a02001-01-07 20:51:39 +000090 }
91
92 if (n < 0 && result != NULL && PyString_Check(result)) {
93 char *s = PyString_AS_STRING(result);
Martin v. Löwis18e16552006-02-15 17:27:45 +000094 Py_ssize_t len = PyString_GET_SIZE(result);
Guido van Rossum4ddf0a02001-01-07 20:51:39 +000095 if (len == 0) {
96 Py_DECREF(result);
97 result = NULL;
98 PyErr_SetString(PyExc_EOFError,
99 "EOF when reading a line");
100 }
101 else if (s[len-1] == '\n') {
102 if (result->ob_refcnt == 1)
103 _PyString_Resize(&result, len-1);
104 else {
105 PyObject *v;
106 v = PyString_FromStringAndSize(s, len-1);
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000107 Py_DECREF(result);
Guido van Rossum4ddf0a02001-01-07 20:51:39 +0000108 result = v;
Guido van Rossum3165fe61992-09-25 21:59:05 +0000109 }
110 }
Guido van Rossum3165fe61992-09-25 21:59:05 +0000111 }
Martin v. Löwisaf6a27a2003-01-03 19:16:14 +0000112 if (n < 0 && result != NULL && PyUnicode_Check(result)) {
113 Py_UNICODE *s = PyUnicode_AS_UNICODE(result);
Martin v. Löwis18e16552006-02-15 17:27:45 +0000114 Py_ssize_t len = PyUnicode_GET_SIZE(result);
Martin v. Löwisaf6a27a2003-01-03 19:16:14 +0000115 if (len == 0) {
116 Py_DECREF(result);
117 result = NULL;
118 PyErr_SetString(PyExc_EOFError,
119 "EOF when reading a line");
120 }
121 else if (s[len-1] == '\n') {
122 if (result->ob_refcnt == 1)
123 PyUnicode_Resize(&result, len-1);
124 else {
125 PyObject *v;
126 v = PyUnicode_FromUnicode(s, len-1);
127 Py_DECREF(result);
128 result = v;
129 }
130 }
131 }
Guido van Rossum4ddf0a02001-01-07 20:51:39 +0000132 return result;
Guido van Rossum0bd24411991-04-04 15:21:57 +0000133}
134
/* Interfaces to write objects/strings to file-like objects */
136
137int
Fred Drakefd99de62000-07-09 05:02:18 +0000138PyFile_WriteObject(PyObject *v, PyObject *f, int flags)
Guido van Rossum3165fe61992-09-25 21:59:05 +0000139{
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000140 PyObject *writer, *value, *args, *result;
Guido van Rossum3165fe61992-09-25 21:59:05 +0000141 if (f == NULL) {
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000142 PyErr_SetString(PyExc_TypeError, "writeobject with NULL file");
Guido van Rossum3165fe61992-09-25 21:59:05 +0000143 return -1;
144 }
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000145 writer = PyObject_GetAttrString(f, "write");
Guido van Rossum3165fe61992-09-25 21:59:05 +0000146 if (writer == NULL)
147 return -1;
Martin v. Löwis2777c022001-09-19 13:47:32 +0000148 if (flags & Py_PRINT_RAW) {
Guido van Rossum55b4a7b2007-07-11 09:28:11 +0000149 value = _PyObject_Str(v);
Martin v. Löwis2777c022001-09-19 13:47:32 +0000150 }
Guido van Rossum55b4a7b2007-07-11 09:28:11 +0000151 else
Guido van Rossume518bf32007-10-09 21:55:58 +0000152 value = PyObject_Repr(v);
Guido van Rossumc6004111993-11-05 10:22:19 +0000153 if (value == NULL) {
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000154 Py_DECREF(writer);
Guido van Rossumc6004111993-11-05 10:22:19 +0000155 return -1;
Guido van Rossum3165fe61992-09-25 21:59:05 +0000156 }
Raymond Hettinger8ae46892003-10-12 19:09:37 +0000157 args = PyTuple_Pack(1, value);
Guido van Rossume9eec541997-05-22 14:02:25 +0000158 if (args == NULL) {
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000159 Py_DECREF(value);
160 Py_DECREF(writer);
Guido van Rossumd3f9a1a1995-07-10 23:32:26 +0000161 return -1;
162 }
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000163 result = PyEval_CallObject(writer, args);
164 Py_DECREF(args);
165 Py_DECREF(value);
166 Py_DECREF(writer);
Guido van Rossum3165fe61992-09-25 21:59:05 +0000167 if (result == NULL)
168 return -1;
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000169 Py_DECREF(result);
Guido van Rossum3165fe61992-09-25 21:59:05 +0000170 return 0;
171}
172
Guido van Rossum27a60b11997-05-22 22:25:11 +0000173int
Tim Petersc1bbcb82001-11-28 22:13:25 +0000174PyFile_WriteString(const char *s, PyObject *f)
Guido van Rossum3165fe61992-09-25 21:59:05 +0000175{
176 if (f == NULL) {
Guido van Rossum27a60b11997-05-22 22:25:11 +0000177 /* Should be caused by a pre-existing error */
Fred Drakefd99de62000-07-09 05:02:18 +0000178 if (!PyErr_Occurred())
Guido van Rossum27a60b11997-05-22 22:25:11 +0000179 PyErr_SetString(PyExc_SystemError,
180 "null file for PyFile_WriteString");
181 return -1;
Guido van Rossum3165fe61992-09-25 21:59:05 +0000182 }
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000183 else if (!PyErr_Occurred()) {
Guido van Rossum11019802007-08-09 22:58:05 +0000184 PyObject *v = PyUnicode_FromString(s);
Guido van Rossum27a60b11997-05-22 22:25:11 +0000185 int err;
186 if (v == NULL)
187 return -1;
188 err = PyFile_WriteObject(v, f, Py_PRINT_RAW);
189 Py_DECREF(v);
190 return err;
Guido van Rossum3165fe61992-09-25 21:59:05 +0000191 }
Guido van Rossum74ba2471997-07-13 03:56:50 +0000192 else
193 return -1;
Guido van Rossum3165fe61992-09-25 21:59:05 +0000194}
Andrew M. Kuchling06051ed2000-07-13 23:56:54 +0000195
196/* Try to get a file-descriptor from a Python object. If the object
197 is an integer or long integer, its value is returned. If not, the
198 object's fileno() method is called if it exists; the method must return
199 an integer or long integer, which is returned as the file descriptor value.
200 -1 is returned on failure.
201*/
202
Guido van Rossumda5b8f22007-06-12 23:30:11 +0000203int
204PyObject_AsFileDescriptor(PyObject *o)
Andrew M. Kuchling06051ed2000-07-13 23:56:54 +0000205{
206 int fd;
207 PyObject *meth;
208
209 if (PyInt_Check(o)) {
210 fd = PyInt_AsLong(o);
211 }
212 else if (PyLong_Check(o)) {
213 fd = PyLong_AsLong(o);
214 }
215 else if ((meth = PyObject_GetAttrString(o, "fileno")) != NULL)
216 {
217 PyObject *fno = PyEval_CallObject(meth, NULL);
218 Py_DECREF(meth);
219 if (fno == NULL)
220 return -1;
Tim Peters86821b22001-01-07 21:19:34 +0000221
Andrew M. Kuchling06051ed2000-07-13 23:56:54 +0000222 if (PyInt_Check(fno)) {
223 fd = PyInt_AsLong(fno);
224 Py_DECREF(fno);
225 }
226 else if (PyLong_Check(fno)) {
227 fd = PyLong_AsLong(fno);
228 Py_DECREF(fno);
229 }
230 else {
231 PyErr_SetString(PyExc_TypeError,
232 "fileno() returned a non-integer");
233 Py_DECREF(fno);
234 return -1;
235 }
236 }
237 else {
238 PyErr_SetString(PyExc_TypeError,
239 "argument must be an int, or have a fileno() method.");
240 return -1;
241 }
242
Guido van Rossumddefaf32007-01-14 03:31:43 +0000243 if (fd == -1 && PyErr_Occurred())
244 return -1;
Andrew M. Kuchling06051ed2000-07-13 23:56:54 +0000245 if (fd < 0) {
246 PyErr_Format(PyExc_ValueError,
247 "file descriptor cannot be a negative integer (%i)",
248 fd);
249 return -1;
250 }
251 return fd;
252}
Jack Jansen7b8c7542002-04-14 20:12:41 +0000253
Jack Jansen7b8c7542002-04-14 20:12:41 +0000254/*
255** Py_UniversalNewlineFgets is an fgets variation that understands
256** all of \r, \n and \r\n conventions.
257** The stream should be opened in binary mode.
258** If fobj is NULL the routine always does newline conversion, and
259** it may peek one char ahead to gobble the second char in \r\n.
260** If fobj is non-NULL it must be a PyFileObject. In this case there
261** is no readahead but in stead a flag is used to skip a following
262** \n on the next read. Also, if the file is open in binary mode
263** the whole conversion is skipped. Finally, the routine keeps track of
264** the different types of newlines seen.
265** Note that we need no error handling: fgets() treats error and eof
266** identically.
267*/
268char *
269Py_UniversalNewlineFgets(char *buf, int n, FILE *stream, PyObject *fobj)
270{
271 char *p = buf;
272 int c;
273 int newlinetypes = 0;
274 int skipnextlf = 0;
Tim Peters058b1412002-04-21 07:29:14 +0000275
Jack Jansen7b8c7542002-04-14 20:12:41 +0000276 if (fobj) {
Guido van Rossumda5b8f22007-06-12 23:30:11 +0000277 errno = ENXIO; /* What can you do... */
278 return NULL;
Jack Jansen7b8c7542002-04-14 20:12:41 +0000279 }
280 FLOCKFILE(stream);
281 c = 'x'; /* Shut up gcc warning */
282 while (--n > 0 && (c = GETC(stream)) != EOF ) {
283 if (skipnextlf ) {
284 skipnextlf = 0;
285 if (c == '\n') {
286 /* Seeing a \n here with skipnextlf true
287 ** means we saw a \r before.
288 */
289 newlinetypes |= NEWLINE_CRLF;
290 c = GETC(stream);
291 if (c == EOF) break;
292 } else {
293 /*
294 ** Note that c == EOF also brings us here,
295 ** so we're okay if the last char in the file
296 ** is a CR.
297 */
298 newlinetypes |= NEWLINE_CR;
299 }
300 }
301 if (c == '\r') {
302 /* A \r is translated into a \n, and we skip
303 ** an adjacent \n, if any. We don't set the
304 ** newlinetypes flag until we've seen the next char.
305 */
306 skipnextlf = 1;
307 c = '\n';
308 } else if ( c == '\n') {
309 newlinetypes |= NEWLINE_LF;
310 }
311 *p++ = c;
312 if (c == '\n') break;
313 }
314 if ( c == EOF && skipnextlf )
315 newlinetypes |= NEWLINE_CR;
316 FUNLOCKFILE(stream);
317 *p = '\0';
Guido van Rossumda5b8f22007-06-12 23:30:11 +0000318 if ( skipnextlf ) {
Jack Jansen7b8c7542002-04-14 20:12:41 +0000319 /* If we have no file object we cannot save the
320 ** skipnextlf flag. We have to readahead, which
321 ** will cause a pause if we're reading from an
322 ** interactive stream, but that is very unlikely
323 ** unless we're doing something silly like
Neal Norwitz01688022007-08-12 00:43:29 +0000324 ** exec(open("/dev/tty").read()).
Jack Jansen7b8c7542002-04-14 20:12:41 +0000325 */
326 c = GETC(stream);
327 if ( c != '\n' )
328 ungetc(c, stream);
329 }
330 if (p == buf)
331 return NULL;
332 return buf;
333}
334
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000335#ifdef __cplusplus
336}
337#endif