blob: 8c1fabe360cdcf7cf032a9bd88d538d21b411eef [file] [log] [blame]
Guido van Rossuma9e20242007-03-08 00:43:48 +00001/* Author: Daniel Stutzbach */
2
3#define PY_SSIZE_T_CLEAN
4#include "Python.h"
Antoine Pitroue033e062010-10-29 10:38:18 +00005#include "structmember.h"
Benjamin Peterson2614cda2010-03-21 22:36:19 +00006#ifdef HAVE_SYS_TYPES_H
Guido van Rossuma9e20242007-03-08 00:43:48 +00007#include <sys/types.h>
Benjamin Peterson2614cda2010-03-21 22:36:19 +00008#endif
9#ifdef HAVE_SYS_STAT_H
Guido van Rossuma9e20242007-03-08 00:43:48 +000010#include <sys/stat.h>
Benjamin Peterson2614cda2010-03-21 22:36:19 +000011#endif
12#ifdef HAVE_FCNTL_H
Guido van Rossuma9e20242007-03-08 00:43:48 +000013#include <fcntl.h>
Benjamin Peterson2614cda2010-03-21 22:36:19 +000014#endif
Guido van Rossuma9e20242007-03-08 00:43:48 +000015#include <stddef.h> /* For offsetof */
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +000016#include "_iomodule.h"
Guido van Rossuma9e20242007-03-08 00:43:48 +000017
/*
 * Known likely problems:
 *
 * - Files larger than 2**32-1
 * - Files with unicode filenames
 * - Passing numbers greater than 2**32-1 when an integer is expected
 * - Making it work on Windows and other oddball platforms
 *
 * To Do:
 *
 * - autoconfify header file inclusion
 */
30
31#ifdef MS_WINDOWS
32/* can simulate truncate with Win32 API functions; see file_truncate */
Thomas Hellerfdeee3a2007-07-12 11:21:36 +000033#define HAVE_FTRUNCATE
Guido van Rossuma9e20242007-03-08 00:43:48 +000034#define WIN32_LEAN_AND_MEAN
35#include <windows.h>
36#endif
37
/* SMALLCHUNK is the minimum read/allocation granularity used by the
   read-all path: BUFSIZ when that is at least 8 KiB, otherwise 8 KiB.
   A BUFSIZ of 64 MiB or more is rejected at compile time. */
#if (BUFSIZ >= (2 << 25))
#error "unreasonable BUFSIZ > 64MB defined"
#elif BUFSIZ < (8*1024)
#define SMALLCHUNK (8*1024)
#else
#define SMALLCHUNK BUFSIZ
#endif
45
/* Instance layout of the raw file object implemented in this file. */
typedef struct {
    PyObject_HEAD
    int fd;                       /* OS file descriptor; negative means closed */
    unsigned int created : 1;     /* set when opened with mode 'x' */
    unsigned int readable : 1;    /* set by mode 'r' or '+' */
    unsigned int writable : 1;    /* set by mode 'x', 'w', 'a' or '+' */
    signed int seekable : 2;      /* -1 means unknown */
    unsigned int closefd : 1;     /* close the descriptor when the object is closed */
    unsigned int deallocating: 1; /* set at the start of fileio_dealloc */
    PyObject *weakreflist;        /* weak references, cleared in fileio_dealloc */
    PyObject *dict;               /* visited/cleared by fileio_traverse/fileio_clear */
} fileio;
Guido van Rossuma9e20242007-03-08 00:43:48 +000058
/* Type object for fileio instances (tentative definition here). */
PyTypeObject PyFileIO_Type;

/* True when op is an instance of PyFileIO_Type or of a subtype. */
#define PyFileIO_Check(op) (PyObject_TypeCheck((op), &PyFileIO_Type))
62
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +000063int
64_PyFileIO_closed(PyObject *self)
65{
Antoine Pitrouae4b4722010-05-05 16:31:07 +000066 return ((fileio *)self)->fd < 0;
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +000067}
Antoine Pitrou08838b62009-01-21 00:55:13 +000068
Antoine Pitroue033e062010-10-29 10:38:18 +000069/* Because this can call arbitrary code, it shouldn't be called when
70 the refcount is 0 (that is, not directly from tp_dealloc unless
71 the refcount has been temporarily re-incremented). */
72static PyObject *
73fileio_dealloc_warn(fileio *self, PyObject *source)
74{
75 if (self->fd >= 0 && self->closefd) {
76 PyObject *exc, *val, *tb;
77 PyErr_Fetch(&exc, &val, &tb);
78 if (PyErr_WarnFormat(PyExc_ResourceWarning, 1,
79 "unclosed file %R", source)) {
80 /* Spurious errors can appear at shutdown */
81 if (PyErr_ExceptionMatches(PyExc_Warning))
82 PyErr_WriteUnraisable((PyObject *) self);
83 }
84 PyErr_Restore(exc, val, tb);
85 }
86 Py_RETURN_NONE;
87}
88
Antoine Pitrou7fb111b2009-03-04 11:14:01 +000089static PyObject *
90portable_lseek(int fd, PyObject *posobj, int whence);
91
Antoine Pitroua28fcfd2009-03-13 23:42:55 +000092static PyObject *portable_lseek(int fd, PyObject *posobj, int whence);
93
Kristján Valur Jónsson19288c22008-12-18 17:15:54 +000094/* Returns 0 on success, -1 with exception set on failure. */
Neal Norwitz88b44da2007-08-12 17:23:54 +000095static int
Benjamin Peterson680bf1a2009-06-12 02:07:12 +000096internal_close(fileio *self)
Guido van Rossuma9e20242007-03-08 00:43:48 +000097{
Antoine Pitrouae4b4722010-05-05 16:31:07 +000098 int err = 0;
99 int save_errno = 0;
100 if (self->fd >= 0) {
101 int fd = self->fd;
102 self->fd = -1;
103 /* fd is accessible and someone else may have closed it */
104 if (_PyVerify_fd(fd)) {
105 Py_BEGIN_ALLOW_THREADS
106 err = close(fd);
107 if (err < 0)
108 save_errno = errno;
109 Py_END_ALLOW_THREADS
110 } else {
111 save_errno = errno;
112 err = -1;
113 }
114 }
115 if (err < 0) {
116 errno = save_errno;
117 PyErr_SetFromErrno(PyExc_IOError);
118 return -1;
119 }
120 return 0;
Neal Norwitz88b44da2007-08-12 17:23:54 +0000121}
122
123static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000124fileio_close(fileio *self)
Neal Norwitz88b44da2007-08-12 17:23:54 +0000125{
Martin v. Löwisbd928fe2011-10-14 10:20:37 +0200126 _Py_IDENTIFIER(close);
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000127 if (!self->closefd) {
128 self->fd = -1;
129 Py_RETURN_NONE;
130 }
Antoine Pitroue033e062010-10-29 10:38:18 +0000131 if (self->deallocating) {
132 PyObject *r = fileio_dealloc_warn(self, (PyObject *) self);
133 if (r)
134 Py_DECREF(r);
135 else
136 PyErr_Clear();
137 }
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000138 errno = internal_close(self);
139 if (errno < 0)
140 return NULL;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000141
Martin v. Löwisafe55bb2011-10-09 10:38:36 +0200142 return _PyObject_CallMethodId((PyObject*)&PyRawIOBase_Type,
143 &PyId_close, "O", self);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000144}
145
146static PyObject *
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +0000147fileio_new(PyTypeObject *type, PyObject *args, PyObject *kwds)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000148{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000149 fileio *self;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000150
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000151 assert(type != NULL && type->tp_alloc != NULL);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000152
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000153 self = (fileio *) type->tp_alloc(type, 0);
154 if (self != NULL) {
155 self->fd = -1;
Charles-François Natalidc3044c2012-01-09 22:40:02 +0100156 self->created = 0;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000157 self->readable = 0;
158 self->writable = 0;
159 self->seekable = -1;
160 self->closefd = 1;
161 self->weakreflist = NULL;
162 }
Guido van Rossuma9e20242007-03-08 00:43:48 +0000163
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000164 return (PyObject *) self;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000165}
166
167/* On Unix, open will succeed for directories.
168 In Python, there should be no file objects referring to
169 directories, so we need a check. */
170
171static int
Antoine Pitrou9235b252012-07-06 18:48:24 +0200172dircheck(fileio* self, PyObject *nameobj)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000173{
174#if defined(HAVE_FSTAT) && defined(S_IFDIR) && defined(EISDIR)
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000175 struct stat buf;
176 if (self->fd < 0)
177 return 0;
178 if (fstat(self->fd, &buf) == 0 && S_ISDIR(buf.st_mode)) {
Antoine Pitrou9235b252012-07-06 18:48:24 +0200179 errno = EISDIR;
180 PyErr_SetFromErrnoWithFilenameObject(PyExc_IOError, nameobj);
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000181 return -1;
182 }
Guido van Rossuma9e20242007-03-08 00:43:48 +0000183#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000184 return 0;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000185}
186
/* Validate a caller-supplied file descriptor.
   Returns 0 when the descriptor looks usable (or when fstat is not
   available), -1 with OSError(EBADF, strerror(EBADF)) set when it is
   rejected by _PyVerify_fd or fstat reports EBADF. */
static int
check_fd(int fd)
{
#if defined(HAVE_FSTAT)
    struct stat buf;
    if (!_PyVerify_fd(fd) || (fstat(fd, &buf) < 0 && errno == EBADF)) {
        PyObject *exc;
        char *msg = strerror(EBADF);
        exc = PyObject_CallFunction(PyExc_OSError, "(is)",
                                    EBADF, msg);
        /* If building the exception instance failed, an error is already
           pending; do not overwrite it with a value-less OSError. */
        if (exc != NULL) {
            PyErr_SetObject(PyExc_OSError, exc);
            Py_DECREF(exc);
        }
        return -1;
    }
#endif
    return 0;
}
204
Guido van Rossuma9e20242007-03-08 00:43:48 +0000205
206static int
207fileio_init(PyObject *oself, PyObject *args, PyObject *kwds)
208{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000209 fileio *self = (fileio *) oself;
Ross Lagerwall59142db2011-10-31 20:34:46 +0200210 static char *kwlist[] = {"file", "mode", "closefd", "opener", NULL};
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000211 const char *name = NULL;
Ross Lagerwall59142db2011-10-31 20:34:46 +0200212 PyObject *nameobj, *stringobj = NULL, *opener = Py_None;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000213 char *mode = "r";
214 char *s;
Thomas Helleraf2be262007-07-12 11:03:13 +0000215#ifdef MS_WINDOWS
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000216 Py_UNICODE *widename = NULL;
Thomas Helleraf2be262007-07-12 11:03:13 +0000217#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000218 int ret = 0;
219 int rwa = 0, plus = 0, append = 0;
220 int flags = 0;
221 int fd = -1;
222 int closefd = 1;
Hynek Schlawack9ed8b4e2012-06-21 20:20:25 +0200223 int fd_is_own = 0;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000224
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000225 assert(PyFileIO_Check(oself));
226 if (self->fd >= 0) {
Hynek Schlawack2cc71562012-05-25 10:05:53 +0200227 if (self->closefd) {
228 /* Have to close the existing file first. */
229 if (internal_close(self) < 0)
230 return -1;
231 }
232 else
233 self->fd = -1;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000234 }
Guido van Rossuma9e20242007-03-08 00:43:48 +0000235
Ross Lagerwall59142db2011-10-31 20:34:46 +0200236 if (!PyArg_ParseTupleAndKeywords(args, kwds, "O|siO:fileio",
237 kwlist, &nameobj, &mode, &closefd,
238 &opener))
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000239 return -1;
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +0000240
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000241 if (PyFloat_Check(nameobj)) {
242 PyErr_SetString(PyExc_TypeError,
243 "integer argument expected, got float");
244 return -1;
245 }
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +0000246
Serhiy Storchaka441d30f2013-01-19 12:26:26 +0200247 fd = _PyLong_AsInt(nameobj);
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000248 if (fd < 0) {
249 if (!PyErr_Occurred()) {
250 PyErr_SetString(PyExc_ValueError,
251 "Negative filedescriptor");
252 return -1;
253 }
254 PyErr_Clear();
255 }
Guido van Rossumb0428152007-04-08 17:44:42 +0000256
Hirokazu Yamamoto8223c242009-05-17 04:21:53 +0000257#ifdef MS_WINDOWS
Victor Stinnerfe9a8612011-09-29 23:19:04 +0200258 if (PyUnicode_Check(nameobj)) {
Antoine Pitrou13348842012-01-29 18:36:34 +0100259 int rv = _PyUnicode_HasNULChars(nameobj);
260 if (rv) {
261 if (rv != -1)
262 PyErr_SetString(PyExc_TypeError, "embedded NUL character");
263 return -1;
264 }
Victor Stinnerfe9a8612011-09-29 23:19:04 +0200265 widename = PyUnicode_AsUnicode(nameobj);
266 if (widename == NULL)
267 return -1;
268 } else
Guido van Rossuma9e20242007-03-08 00:43:48 +0000269#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000270 if (fd < 0)
271 {
Antoine Pitrou13348842012-01-29 18:36:34 +0100272 if (!PyUnicode_FSConverter(nameobj, &stringobj)) {
273 return -1;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000274 }
Antoine Pitrou13348842012-01-29 18:36:34 +0100275 name = PyBytes_AS_STRING(stringobj);
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000276 }
Guido van Rossuma9e20242007-03-08 00:43:48 +0000277
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000278 s = mode;
279 while (*s) {
280 switch (*s++) {
Charles-François Natalidc3044c2012-01-09 22:40:02 +0100281 case 'x':
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000282 if (rwa) {
283 bad_mode:
284 PyErr_SetString(PyExc_ValueError,
Charles-François Natalidc3044c2012-01-09 22:40:02 +0100285 "Must have exactly one of create/read/write/append "
Georg Brandl28928ae2010-10-21 13:45:52 +0000286 "mode and at most one plus");
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000287 goto error;
288 }
289 rwa = 1;
Charles-François Natalidc3044c2012-01-09 22:40:02 +0100290 self->created = 1;
291 self->writable = 1;
292 flags |= O_EXCL | O_CREAT;
293 break;
294 case 'r':
295 if (rwa)
296 goto bad_mode;
297 rwa = 1;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000298 self->readable = 1;
299 break;
300 case 'w':
301 if (rwa)
302 goto bad_mode;
303 rwa = 1;
304 self->writable = 1;
305 flags |= O_CREAT | O_TRUNC;
306 break;
307 case 'a':
308 if (rwa)
309 goto bad_mode;
310 rwa = 1;
311 self->writable = 1;
312 flags |= O_CREAT;
313 append = 1;
314 break;
315 case 'b':
316 break;
317 case '+':
318 if (plus)
319 goto bad_mode;
320 self->readable = self->writable = 1;
321 plus = 1;
322 break;
323 default:
324 PyErr_Format(PyExc_ValueError,
325 "invalid mode: %.200s", mode);
326 goto error;
327 }
328 }
Guido van Rossuma9e20242007-03-08 00:43:48 +0000329
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000330 if (!rwa)
331 goto bad_mode;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000332
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000333 if (self->readable && self->writable)
334 flags |= O_RDWR;
335 else if (self->readable)
336 flags |= O_RDONLY;
337 else
338 flags |= O_WRONLY;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000339
340#ifdef O_BINARY
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000341 flags |= O_BINARY;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000342#endif
343
Walter Dörwald0e411482007-06-06 16:55:38 +0000344#ifdef O_APPEND
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000345 if (append)
346 flags |= O_APPEND;
Walter Dörwald0e411482007-06-06 16:55:38 +0000347#endif
348
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000349 if (fd >= 0) {
350 if (check_fd(fd))
351 goto error;
352 self->fd = fd;
353 self->closefd = closefd;
354 }
355 else {
356 self->closefd = 1;
357 if (!closefd) {
358 PyErr_SetString(PyExc_ValueError,
359 "Cannot use closefd=False with file name");
360 goto error;
361 }
Guido van Rossum2dced8b2007-10-30 17:27:30 +0000362
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000363 errno = 0;
Ross Lagerwall59142db2011-10-31 20:34:46 +0200364 if (opener == Py_None) {
365 Py_BEGIN_ALLOW_THREADS
Thomas Helleraf2be262007-07-12 11:03:13 +0000366#ifdef MS_WINDOWS
Ross Lagerwall59142db2011-10-31 20:34:46 +0200367 if (widename != NULL)
368 self->fd = _wopen(widename, flags, 0666);
369 else
Thomas Helleraf2be262007-07-12 11:03:13 +0000370#endif
Ross Lagerwall59142db2011-10-31 20:34:46 +0200371 self->fd = open(name, flags, 0666);
372 Py_END_ALLOW_THREADS
373 } else {
374 PyObject *fdobj = PyObject_CallFunction(
375 opener, "Oi", nameobj, flags);
376 if (fdobj == NULL)
377 goto error;
378 if (!PyLong_Check(fdobj)) {
379 Py_DECREF(fdobj);
380 PyErr_SetString(PyExc_TypeError,
381 "expected integer from opener");
382 goto error;
383 }
384
Serhiy Storchaka9101e232013-01-19 12:41:45 +0200385 self->fd = _PyLong_AsInt(fdobj);
Ross Lagerwall59142db2011-10-31 20:34:46 +0200386 Py_DECREF(fdobj);
387 if (self->fd == -1) {
388 goto error;
389 }
390 }
391
Hynek Schlawack7f59fd72012-06-22 09:32:22 +0200392 fd_is_own = 1;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000393 if (self->fd < 0) {
Christian Heimes0b489542007-10-31 19:20:48 +0000394#ifdef MS_WINDOWS
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000395 if (widename != NULL)
Victor Stinnerfe9a8612011-09-29 23:19:04 +0200396 PyErr_SetFromErrnoWithFilenameObject(PyExc_IOError, nameobj);
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000397 else
Christian Heimes0b489542007-10-31 19:20:48 +0000398#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000399 PyErr_SetFromErrnoWithFilename(PyExc_IOError, name);
400 goto error;
401 }
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000402 }
Antoine Pitrou9235b252012-07-06 18:48:24 +0200403 if (dircheck(self, nameobj) < 0)
404 goto error;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000405
Victor Stinner89e34362011-01-07 18:47:22 +0000406#if defined(MS_WINDOWS) || defined(__CYGWIN__)
407 /* don't translate newlines (\r\n <=> \n) */
408 _setmode(self->fd, O_BINARY);
409#endif
410
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000411 if (PyObject_SetAttrString((PyObject *)self, "name", nameobj) < 0)
412 goto error;
Antoine Pitrou08838b62009-01-21 00:55:13 +0000413
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000414 if (append) {
415 /* For consistent behaviour, we explicitly seek to the
416 end of file (otherwise, it might be done only on the
417 first write()). */
418 PyObject *pos = portable_lseek(self->fd, NULL, 2);
Hynek Schlawack9ed8b4e2012-06-21 20:20:25 +0200419 if (pos == NULL)
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000420 goto error;
421 Py_DECREF(pos);
422 }
Antoine Pitrou7fb111b2009-03-04 11:14:01 +0000423
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000424 goto done;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000425
426 error:
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000427 ret = -1;
Hynek Schlawack9ed8b4e2012-06-21 20:20:25 +0200428 if (!fd_is_own)
429 self->fd = -1;
Benjamin Petersonbbb04122010-10-30 23:16:28 +0000430 if (self->fd >= 0)
431 internal_close(self);
Guido van Rossum53807da2007-04-10 19:01:47 +0000432
Guido van Rossuma9e20242007-03-08 00:43:48 +0000433 done:
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000434 Py_CLEAR(stringobj);
435 return ret;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000436}
437
/* GC traversal hook: visit the instance dict, the only object reference
   visited here.  Returns 0 unless the visit callback reports otherwise
   through Py_VISIT. */
static int
fileio_traverse(fileio *self, visitproc visit, void *arg)
{
    Py_VISIT(self->dict);
    return 0;
}
444
/* GC clear hook: drop the reference to the instance dict.
   Always returns 0. */
static int
fileio_clear(fileio *self)
{
    Py_CLEAR(self->dict);
    return 0;
}
451
/* tp_dealloc: finalise the object, then release its memory. */
static void
fileio_dealloc(fileio *self)
{
    /* Lets fileio_close know it is running as part of deallocation, so
       that it emits the unclosed-file warning. */
    self->deallocating = 1;
    /* NOTE(review): a negative return presumably means the object must
       not be freed (e.g. it was resurrected) -- confirm against
       _PyIOBase_finalize. */
    if (_PyIOBase_finalize((PyObject *) self) < 0)
        return;
    _PyObject_GC_UNTRACK(self);
    if (self->weakreflist != NULL)
        PyObject_ClearWeakRefs((PyObject *) self);
    Py_CLEAR(self->dict);
    Py_TYPE(self)->tp_free((PyObject *)self);
}
464
/* Set ValueError("I/O operation on closed file") and return NULL, so
   callers can write `return err_closed();`. */
static PyObject *
err_closed(void)
{
    PyErr_SetString(PyExc_ValueError, "I/O operation on closed file");
    return NULL;
}
471
/* Set the io module's unsupported_operation exception with the message
   "File not open for <action>" and return NULL, so callers can write
   `return err_mode("reading");`. */
static PyObject *
err_mode(char *action)
{
    PyErr_Format(IO_STATE->unsupported_operation,
                 "File not open for %s", action);
    return NULL;
}
479
480static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000481fileio_fileno(fileio *self)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000482{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000483 if (self->fd < 0)
484 return err_closed();
485 return PyLong_FromLong((long) self->fd);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000486}
487
488static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000489fileio_readable(fileio *self)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000490{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000491 if (self->fd < 0)
492 return err_closed();
493 return PyBool_FromLong((long) self->readable);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000494}
495
496static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000497fileio_writable(fileio *self)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000498{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000499 if (self->fd < 0)
500 return err_closed();
501 return PyBool_FromLong((long) self->writable);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000502}
503
504static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000505fileio_seekable(fileio *self)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000506{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000507 if (self->fd < 0)
508 return err_closed();
509 if (self->seekable < 0) {
510 PyObject *pos = portable_lseek(self->fd, NULL, SEEK_CUR);
511 if (pos == NULL) {
512 PyErr_Clear();
513 self->seekable = 0;
514 } else {
515 Py_DECREF(pos);
516 self->seekable = 1;
517 }
518 }
519 return PyBool_FromLong((long) self->seekable);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000520}
521
522static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000523fileio_readinto(fileio *self, PyObject *args)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000524{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000525 Py_buffer pbuf;
Victor Stinnere6edec22011-01-04 00:29:35 +0000526 Py_ssize_t n, len;
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100527 int err;
Guido van Rossum53807da2007-04-10 19:01:47 +0000528
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000529 if (self->fd < 0)
530 return err_closed();
531 if (!self->readable)
532 return err_mode("reading");
Guido van Rossum53807da2007-04-10 19:01:47 +0000533
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000534 if (!PyArg_ParseTuple(args, "w*", &pbuf))
535 return NULL;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000536
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000537 if (_PyVerify_fd(self->fd)) {
Victor Stinnere6edec22011-01-04 00:29:35 +0000538 len = pbuf.len;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000539 Py_BEGIN_ALLOW_THREADS
540 errno = 0;
Victor Stinnere6edec22011-01-04 00:29:35 +0000541#if defined(MS_WIN64) || defined(MS_WINDOWS)
542 if (len > INT_MAX)
543 len = INT_MAX;
544 n = read(self->fd, pbuf.buf, (int)len);
545#else
Victor Stinner72344792011-01-11 00:04:12 +0000546 n = read(self->fd, pbuf.buf, len);
Victor Stinnere6edec22011-01-04 00:29:35 +0000547#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000548 Py_END_ALLOW_THREADS
549 } else
550 n = -1;
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100551 err = errno;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000552 PyBuffer_Release(&pbuf);
553 if (n < 0) {
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100554 if (err == EAGAIN)
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000555 Py_RETURN_NONE;
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100556 errno = err;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000557 PyErr_SetFromErrno(PyExc_IOError);
558 return NULL;
559 }
Guido van Rossuma9e20242007-03-08 00:43:48 +0000560
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000561 return PyLong_FromSsize_t(n);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000562}
563
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +0000564static size_t
Victor Stinnere9d44ccb2011-05-26 00:16:44 +0200565new_buffersize(fileio *self, size_t currentsize
566#ifdef HAVE_FSTAT
Victor Stinnera2a64772011-10-11 22:45:02 +0200567 , Py_off_t pos, Py_off_t end
Victor Stinnere9d44ccb2011-05-26 00:16:44 +0200568#endif
569 )
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +0000570{
Antoine Pitroua3f44572012-04-17 13:50:58 +0200571 size_t addend;
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +0000572#ifdef HAVE_FSTAT
Victor Stinnera2a64772011-10-11 22:45:02 +0200573 if (end != (Py_off_t)-1) {
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000574 /* Files claiming a size smaller than SMALLCHUNK may
575 actually be streaming pseudo-files. In this case, we
576 apply the more aggressive algorithm below.
577 */
578 if (end >= SMALLCHUNK && end >= pos && pos >= 0) {
579 /* Add 1 so if the file were to grow we'd notice. */
Victor Stinnerc5af7732011-10-11 23:00:31 +0200580 Py_off_t bufsize = currentsize + end - pos + 1;
581 if (bufsize < PY_SSIZE_T_MAX)
582 return (size_t)bufsize;
583 else
584 return PY_SSIZE_T_MAX;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000585 }
586 }
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +0000587#endif
Nadeem Vawdad41a98b2011-10-13 13:34:16 +0200588 /* Expand the buffer by an amount proportional to the current size,
Antoine Pitroua3f44572012-04-17 13:50:58 +0200589 giving us amortized linear-time behavior. For bigger sizes, use a
590 less-than-double growth factor to avoid excessive allocation. */
591 if (currentsize > 65536)
592 addend = currentsize >> 3;
593 else
594 addend = 256 + currentsize;
595 if (addend < SMALLCHUNK)
596 /* Avoid tiny read() calls. */
597 addend = SMALLCHUNK;
598 return addend + currentsize;
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +0000599}
600
Guido van Rossum7165cb12007-07-10 06:54:34 +0000601static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000602fileio_readall(fileio *self)
Guido van Rossum7165cb12007-07-10 06:54:34 +0000603{
Victor Stinnere9d44ccb2011-05-26 00:16:44 +0200604#ifdef HAVE_FSTAT
605 struct stat st;
Victor Stinnera2a64772011-10-11 22:45:02 +0200606 Py_off_t pos, end;
Victor Stinnere9d44ccb2011-05-26 00:16:44 +0200607#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000608 PyObject *result;
609 Py_ssize_t total = 0;
Victor Stinnerc44057d2013-01-03 03:33:21 +0100610 Py_ssize_t n;
Victor Stinnere9d44ccb2011-05-26 00:16:44 +0200611 size_t newsize;
Guido van Rossum7165cb12007-07-10 06:54:34 +0000612
Victor Stinnerb79f28c2011-05-25 22:09:03 +0200613 if (self->fd < 0)
614 return err_closed();
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000615 if (!_PyVerify_fd(self->fd))
616 return PyErr_SetFromErrno(PyExc_IOError);
Kristján Valur Jónssona8abe862009-03-24 15:27:42 +0000617
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000618 result = PyBytes_FromStringAndSize(NULL, SMALLCHUNK);
619 if (result == NULL)
620 return NULL;
Guido van Rossum7165cb12007-07-10 06:54:34 +0000621
Victor Stinnere9d44ccb2011-05-26 00:16:44 +0200622#ifdef HAVE_FSTAT
623#if defined(MS_WIN64) || defined(MS_WINDOWS)
624 pos = _lseeki64(self->fd, 0L, SEEK_CUR);
625#else
626 pos = lseek(self->fd, 0L, SEEK_CUR);
627#endif
628 if (fstat(self->fd, &st) == 0)
629 end = st.st_size;
630 else
Victor Stinnera2a64772011-10-11 22:45:02 +0200631 end = (Py_off_t)-1;
Victor Stinnere9d44ccb2011-05-26 00:16:44 +0200632#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000633 while (1) {
Victor Stinnere9d44ccb2011-05-26 00:16:44 +0200634#ifdef HAVE_FSTAT
635 newsize = new_buffersize(self, total, pos, end);
636#else
637 newsize = new_buffersize(self, total);
638#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000639 if (newsize > PY_SSIZE_T_MAX || newsize <= 0) {
640 PyErr_SetString(PyExc_OverflowError,
641 "unbounded read returned more bytes "
642 "than a Python string can hold ");
643 Py_DECREF(result);
644 return NULL;
645 }
Christian Heimesa872de52008-12-05 08:26:55 +0000646
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000647 if (PyBytes_GET_SIZE(result) < (Py_ssize_t)newsize) {
648 if (_PyBytes_Resize(&result, newsize) < 0) {
649 if (total == 0) {
650 Py_DECREF(result);
651 return NULL;
652 }
653 PyErr_Clear();
654 break;
655 }
656 }
657 Py_BEGIN_ALLOW_THREADS
658 errno = 0;
Victor Stinnerc44057d2013-01-03 03:33:21 +0100659 n = newsize - total;
660#if defined(MS_WIN64) || defined(MS_WINDOWS)
661 if (n > INT_MAX)
662 n = INT_MAX;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000663 n = read(self->fd,
664 PyBytes_AS_STRING(result) + total,
Victor Stinnerc44057d2013-01-03 03:33:21 +0100665 (int)n);
666#else
667 n = read(self->fd,
668 PyBytes_AS_STRING(result) + total,
669 n);
670#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000671 Py_END_ALLOW_THREADS
672 if (n == 0)
673 break;
674 if (n < 0) {
Gregory P. Smith51359922012-06-23 23:55:39 -0700675 if (errno == EINTR) {
676 if (PyErr_CheckSignals()) {
677 Py_DECREF(result);
678 return NULL;
679 }
680 continue;
681 }
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000682 if (total > 0)
683 break;
684 if (errno == EAGAIN) {
685 Py_DECREF(result);
686 Py_RETURN_NONE;
687 }
688 Py_DECREF(result);
689 PyErr_SetFromErrno(PyExc_IOError);
690 return NULL;
691 }
692 total += n;
Victor Stinnere9d44ccb2011-05-26 00:16:44 +0200693#ifdef HAVE_FSTAT
694 pos += n;
695#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000696 }
Guido van Rossum7165cb12007-07-10 06:54:34 +0000697
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000698 if (PyBytes_GET_SIZE(result) > total) {
699 if (_PyBytes_Resize(&result, total) < 0) {
700 /* This should never happen, but just in case */
701 Py_DECREF(result);
702 return NULL;
703 }
704 }
705 return result;
Guido van Rossum7165cb12007-07-10 06:54:34 +0000706}
707
Guido van Rossuma9e20242007-03-08 00:43:48 +0000708static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000709fileio_read(fileio *self, PyObject *args)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000710{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000711 char *ptr;
712 Py_ssize_t n;
713 Py_ssize_t size = -1;
714 PyObject *bytes;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000715
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000716 if (self->fd < 0)
717 return err_closed();
718 if (!self->readable)
719 return err_mode("reading");
Guido van Rossuma9e20242007-03-08 00:43:48 +0000720
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000721 if (!PyArg_ParseTuple(args, "|O&", &_PyIO_ConvertSsize_t, &size))
722 return NULL;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000723
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000724 if (size < 0) {
725 return fileio_readall(self);
726 }
Guido van Rossumc2f93dc2007-05-24 00:50:02 +0000727
Victor Stinnerc655a722011-07-05 11:31:49 +0200728#if defined(MS_WIN64) || defined(MS_WINDOWS)
729 if (size > INT_MAX)
730 size = INT_MAX;
731#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000732 bytes = PyBytes_FromStringAndSize(NULL, size);
733 if (bytes == NULL)
734 return NULL;
735 ptr = PyBytes_AS_STRING(bytes);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000736
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000737 if (_PyVerify_fd(self->fd)) {
738 Py_BEGIN_ALLOW_THREADS
739 errno = 0;
Victor Stinnerc655a722011-07-05 11:31:49 +0200740#if defined(MS_WIN64) || defined(MS_WINDOWS)
741 n = read(self->fd, ptr, (int)size);
742#else
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000743 n = read(self->fd, ptr, size);
Victor Stinnerc655a722011-07-05 11:31:49 +0200744#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000745 Py_END_ALLOW_THREADS
746 } else
747 n = -1;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000748
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000749 if (n < 0) {
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100750 int err = errno;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000751 Py_DECREF(bytes);
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100752 if (err == EAGAIN)
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000753 Py_RETURN_NONE;
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100754 errno = err;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000755 PyErr_SetFromErrno(PyExc_IOError);
756 return NULL;
757 }
Guido van Rossuma9e20242007-03-08 00:43:48 +0000758
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000759 if (n != size) {
760 if (_PyBytes_Resize(&bytes, n) < 0) {
761 Py_DECREF(bytes);
762 return NULL;
763 }
764 }
Guido van Rossuma9e20242007-03-08 00:43:48 +0000765
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000766 return (PyObject *) bytes;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000767}
768
769static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000770fileio_write(fileio *self, PyObject *args)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000771{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000772 Py_buffer pbuf;
Victor Stinnere6edec22011-01-04 00:29:35 +0000773 Py_ssize_t n, len;
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100774 int err;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000775
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000776 if (self->fd < 0)
777 return err_closed();
778 if (!self->writable)
779 return err_mode("writing");
Guido van Rossum53807da2007-04-10 19:01:47 +0000780
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000781 if (!PyArg_ParseTuple(args, "y*", &pbuf))
782 return NULL;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000783
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000784 if (_PyVerify_fd(self->fd)) {
785 Py_BEGIN_ALLOW_THREADS
786 errno = 0;
Victor Stinnere6edec22011-01-04 00:29:35 +0000787 len = pbuf.len;
788#if defined(MS_WIN64) || defined(MS_WINDOWS)
Victor Stinnere0daff12011-03-20 23:36:35 +0100789 if (len > 32767 && isatty(self->fd)) {
790 /* Issue #11395: the Windows console returns an error (12: not
791 enough space error) on writing into stdout if stdout mode is
792 binary and the length is greater than 66,000 bytes (or less,
793 depending on heap usage). */
794 len = 32767;
795 }
796 else if (len > INT_MAX)
Victor Stinnere6edec22011-01-04 00:29:35 +0000797 len = INT_MAX;
798 n = write(self->fd, pbuf.buf, (int)len);
799#else
Victor Stinner72344792011-01-11 00:04:12 +0000800 n = write(self->fd, pbuf.buf, len);
Victor Stinnere6edec22011-01-04 00:29:35 +0000801#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000802 Py_END_ALLOW_THREADS
803 } else
804 n = -1;
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100805 err = errno;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000806
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000807 PyBuffer_Release(&pbuf);
Martin v. Löwis423be952008-08-13 15:53:07 +0000808
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000809 if (n < 0) {
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100810 if (err == EAGAIN)
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000811 Py_RETURN_NONE;
Antoine Pitrouc345ce12011-12-16 12:28:32 +0100812 errno = err;
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000813 PyErr_SetFromErrno(PyExc_IOError);
814 return NULL;
815 }
Guido van Rossuma9e20242007-03-08 00:43:48 +0000816
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000817 return PyLong_FromSsize_t(n);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000818}
819
Guido van Rossum53807da2007-04-10 19:01:47 +0000820/* XXX Windows support below is likely incomplete */
821
Guido van Rossum53807da2007-04-10 19:01:47 +0000822/* Cribbed from posix_lseek() */
823static PyObject *
824portable_lseek(int fd, PyObject *posobj, int whence)
825{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000826 Py_off_t pos, res;
Guido van Rossum53807da2007-04-10 19:01:47 +0000827
828#ifdef SEEK_SET
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000829 /* Turn 0, 1, 2 into SEEK_{SET,CUR,END} */
830 switch (whence) {
Guido van Rossum53807da2007-04-10 19:01:47 +0000831#if SEEK_SET != 0
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000832 case 0: whence = SEEK_SET; break;
Guido van Rossum53807da2007-04-10 19:01:47 +0000833#endif
834#if SEEK_CUR != 1
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000835 case 1: whence = SEEK_CUR; break;
Guido van Rossum53807da2007-04-10 19:01:47 +0000836#endif
Antoine Pitrou4f7945f2009-01-20 11:42:11 +0000837#if SEEK_END != 2
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000838 case 2: whence = SEEK_END; break;
Guido van Rossum53807da2007-04-10 19:01:47 +0000839#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000840 }
Guido van Rossum53807da2007-04-10 19:01:47 +0000841#endif /* SEEK_SET */
842
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000843 if (posobj == NULL)
844 pos = 0;
845 else {
846 if(PyFloat_Check(posobj)) {
847 PyErr_SetString(PyExc_TypeError, "an integer is required");
848 return NULL;
849 }
Alexandre Vassalotti77250f42008-05-06 19:48:38 +0000850#if defined(HAVE_LARGEFILE_SUPPORT)
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000851 pos = PyLong_AsLongLong(posobj);
Guido van Rossum53807da2007-04-10 19:01:47 +0000852#else
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000853 pos = PyLong_AsLong(posobj);
Guido van Rossum53807da2007-04-10 19:01:47 +0000854#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000855 if (PyErr_Occurred())
856 return NULL;
857 }
Guido van Rossum53807da2007-04-10 19:01:47 +0000858
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000859 if (_PyVerify_fd(fd)) {
860 Py_BEGIN_ALLOW_THREADS
Guido van Rossum53807da2007-04-10 19:01:47 +0000861#if defined(MS_WIN64) || defined(MS_WINDOWS)
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000862 res = _lseeki64(fd, pos, whence);
Guido van Rossum53807da2007-04-10 19:01:47 +0000863#else
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000864 res = lseek(fd, pos, whence);
Guido van Rossum53807da2007-04-10 19:01:47 +0000865#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000866 Py_END_ALLOW_THREADS
867 } else
868 res = -1;
869 if (res < 0)
870 return PyErr_SetFromErrno(PyExc_IOError);
Guido van Rossum53807da2007-04-10 19:01:47 +0000871
Alexandre Vassalotti77250f42008-05-06 19:48:38 +0000872#if defined(HAVE_LARGEFILE_SUPPORT)
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000873 return PyLong_FromLongLong(res);
Alexandre Vassalotti77250f42008-05-06 19:48:38 +0000874#else
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000875 return PyLong_FromLong(res);
Guido van Rossum53807da2007-04-10 19:01:47 +0000876#endif
877}
878
Guido van Rossuma9e20242007-03-08 00:43:48 +0000879static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000880fileio_seek(fileio *self, PyObject *args)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000881{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000882 PyObject *posobj;
883 int whence = 0;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000884
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000885 if (self->fd < 0)
886 return err_closed();
Guido van Rossuma9e20242007-03-08 00:43:48 +0000887
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000888 if (!PyArg_ParseTuple(args, "O|i", &posobj, &whence))
889 return NULL;
Guido van Rossuma9e20242007-03-08 00:43:48 +0000890
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000891 return portable_lseek(self->fd, posobj, whence);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000892}
893
894static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +0000895fileio_tell(fileio *self, PyObject *args)
Guido van Rossuma9e20242007-03-08 00:43:48 +0000896{
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000897 if (self->fd < 0)
898 return err_closed();
Guido van Rossuma9e20242007-03-08 00:43:48 +0000899
Antoine Pitrouae4b4722010-05-05 16:31:07 +0000900 return portable_lseek(self->fd, NULL, 1);
Guido van Rossuma9e20242007-03-08 00:43:48 +0000901}
902
#ifdef HAVE_FTRUNCATE
/* truncate([size]) -> int.
 *
 * Resizes the file to `size` bytes; when `size` is omitted or None the
 * current position (as reported by portable_lseek) is used instead.
 *
 * Returns a new reference to the size object on success.  Returns NULL with
 * an exception set when the file is closed, is not writable, the size cannot
 * be converted, a seek fails, or the truncating call itself fails (IOError
 * built from errno).
 *
 * errno is captured immediately after the truncating call and restored just
 * before PyErr_SetFromErrno(): the calls in between (restoring the file
 * position on Windows, dropping the reference to the size object) are free
 * to overwrite errno, which would make the reported error misleading.
 */
static PyObject *
fileio_truncate(fileio *self, PyObject *args)
{
    PyObject *posobj = NULL;    /* the new size wanted by the user */
#ifndef MS_WINDOWS
    Py_off_t pos;
#endif
    int ret;
    int fd;
    int err;                    /* errno as left by the truncating call */

    fd = self->fd;
    if (fd < 0)
        return err_closed();
    if (!self->writable)
        return err_mode("writing");

    if (!PyArg_ParseTuple(args, "|O", &posobj))
        return NULL;

    if (posobj == Py_None || posobj == NULL) {
        /* Get the current position. */
        posobj = portable_lseek(fd, NULL, 1);
        if (posobj == NULL)
            return NULL;
    }
    else {
        /* From here on we own a reference to posobj on every path. */
        Py_INCREF(posobj);
    }

#ifdef MS_WINDOWS
    /* MS _chsize doesn't work if newsize doesn't fit in 32 bits,
       so don't even try using it. */
    {
        PyObject *oldposobj, *tempposobj;
        HANDLE hFile;

        /* we save the file pointer position */
        oldposobj = portable_lseek(fd, NULL, 1);
        if (oldposobj == NULL) {
            Py_DECREF(posobj);
            return NULL;
        }

        /* we then move to the truncation position */
        tempposobj = portable_lseek(fd, posobj, 0);
        if (tempposobj == NULL) {
            Py_DECREF(oldposobj);
            Py_DECREF(posobj);
            return NULL;
        }
        Py_DECREF(tempposobj);

        /* Truncate.  Note that this may grow the file! */
        Py_BEGIN_ALLOW_THREADS
        errno = 0;
        hFile = (HANDLE)_get_osfhandle(fd);
        ret = hFile == (HANDLE)-1; /* testing for INVALID_HANDLE value */
        if (ret == 0) {
            ret = SetEndOfFile(hFile) == 0;
            if (ret)
                errno = EACCES;
        }
        /* Remember the outcome before the position restore below can
           overwrite errno. */
        err = errno;
        Py_END_ALLOW_THREADS

        /* we restore the file pointer position in any case */
        tempposobj = portable_lseek(fd, oldposobj, 0);
        Py_DECREF(oldposobj);
        if (tempposobj == NULL) {
            Py_DECREF(posobj);
            return NULL;
        }
        Py_DECREF(tempposobj);
    }
#else

#if defined(HAVE_LARGEFILE_SUPPORT)
    pos = PyLong_AsLongLong(posobj);
#else
    pos = PyLong_AsLong(posobj);
#endif
    if (PyErr_Occurred()){
        Py_DECREF(posobj);
        return NULL;
    }

    Py_BEGIN_ALLOW_THREADS
    errno = 0;
    ret = ftruncate(fd, pos);
    err = errno;
    Py_END_ALLOW_THREADS

#endif /* !MS_WINDOWS */

    if (ret != 0) {
        Py_DECREF(posobj);
        /* Report the truncation failure, not whatever ran afterwards. */
        errno = err;
        PyErr_SetFromErrno(PyExc_IOError);
        return NULL;
    }

    return posobj;
}
#endif /* HAVE_FTRUNCATE */
Guido van Rossum53807da2007-04-10 19:01:47 +00001005
1006static char *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +00001007mode_string(fileio *self)
Guido van Rossum53807da2007-04-10 19:01:47 +00001008{
Charles-François Natalidc3044c2012-01-09 22:40:02 +01001009 if (self->created) {
1010 if (self->readable)
1011 return "xb+";
1012 else
1013 return "xb";
1014 }
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001015 if (self->readable) {
1016 if (self->writable)
1017 return "rb+";
1018 else
1019 return "rb";
1020 }
1021 else
1022 return "wb";
Guido van Rossum53807da2007-04-10 19:01:47 +00001023}
Guido van Rossuma9e20242007-03-08 00:43:48 +00001024
1025static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +00001026fileio_repr(fileio *self)
Guido van Rossuma9e20242007-03-08 00:43:48 +00001027{
Martin v. Löwis767046a2011-10-14 15:35:36 +02001028 _Py_IDENTIFIER(name);
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001029 PyObject *nameobj, *res;
Guido van Rossuma9e20242007-03-08 00:43:48 +00001030
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001031 if (self->fd < 0)
1032 return PyUnicode_FromFormat("<_io.FileIO [closed]>");
Antoine Pitrou716c4442009-05-23 19:04:03 +00001033
Martin v. Löwis767046a2011-10-14 15:35:36 +02001034 nameobj = _PyObject_GetAttrId((PyObject *) self, &PyId_name);
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001035 if (nameobj == NULL) {
1036 if (PyErr_ExceptionMatches(PyExc_AttributeError))
1037 PyErr_Clear();
1038 else
1039 return NULL;
1040 res = PyUnicode_FromFormat("<_io.FileIO fd=%d mode='%s'>",
1041 self->fd, mode_string(self));
1042 }
1043 else {
1044 res = PyUnicode_FromFormat("<_io.FileIO name=%R mode='%s'>",
1045 nameobj, mode_string(self));
1046 Py_DECREF(nameobj);
1047 }
1048 return res;
Guido van Rossuma9e20242007-03-08 00:43:48 +00001049}
1050
1051static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +00001052fileio_isatty(fileio *self)
Guido van Rossuma9e20242007-03-08 00:43:48 +00001053{
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001054 long res;
Guido van Rossum53807da2007-04-10 19:01:47 +00001055
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001056 if (self->fd < 0)
1057 return err_closed();
1058 Py_BEGIN_ALLOW_THREADS
1059 res = isatty(self->fd);
1060 Py_END_ALLOW_THREADS
1061 return PyBool_FromLong(res);
Guido van Rossuma9e20242007-03-08 00:43:48 +00001062}
1063
Antoine Pitrou243757e2010-11-05 21:15:39 +00001064static PyObject *
1065fileio_getstate(fileio *self)
1066{
1067 PyErr_Format(PyExc_TypeError,
1068 "cannot serialize '%s' object", Py_TYPE(self)->tp_name);
1069 return NULL;
1070}
1071
Guido van Rossuma9e20242007-03-08 00:43:48 +00001072
1073PyDoc_STRVAR(fileio_doc,
Ross Lagerwall59142db2011-10-31 20:34:46 +02001074"file(name: str[, mode: str][, opener: None]) -> file IO object\n"
Guido van Rossuma9e20242007-03-08 00:43:48 +00001075"\n"
Charles-François Natalidc3044c2012-01-09 22:40:02 +01001076"Open a file. The mode can be 'r', 'w', 'x' or 'a' for reading (default),\n"
Charles-François Natalid612de12012-01-14 11:51:00 +01001077"writing, exclusive creation or appending. The file will be created if it\n"
1078"doesn't exist when opened for writing or appending; it will be truncated\n"
1079"when opened for writing. A `FileExistsError` will be raised if it already\n"
Charles-François Natalidc3044c2012-01-09 22:40:02 +01001080"exists when opened for creating. Opening a file for creating implies\n"
1081"writing so this mode behaves in a similar way to 'w'.Add a '+' to the mode\n"
1082"to allow simultaneous reading and writing. A custom opener can be used by\n"
1083"passing a callable as *opener*. The underlying file descriptor for the file\n"
Ross Lagerwall59142db2011-10-31 20:34:46 +02001084"object is then obtained by calling opener with (*name*, *flags*).\n"
Charles-François Natalidc3044c2012-01-09 22:40:02 +01001085"*opener* must return an open file descriptor (passing os.open as *opener*\n"
1086"results in functionality similar to passing None).");
Guido van Rossuma9e20242007-03-08 00:43:48 +00001087
1088PyDoc_STRVAR(read_doc,
1089"read(size: int) -> bytes. read at most size bytes, returned as bytes.\n"
1090"\n"
1091"Only makes one system call, so less data may be returned than requested\n"
Guido van Rossum7165cb12007-07-10 06:54:34 +00001092"In non-blocking mode, returns None if no data is available.\n"
1093"On end-of-file, returns ''.");
1094
1095PyDoc_STRVAR(readall_doc,
1096"readall() -> bytes. read all data from the file, returned as bytes.\n"
1097"\n"
1098"In non-blocking mode, returns as much as is immediately available,\n"
1099"or None if no data is available. On end-of-file, returns ''.");
Guido van Rossuma9e20242007-03-08 00:43:48 +00001100
1101PyDoc_STRVAR(write_doc,
1102"write(b: bytes) -> int. Write bytes b to file, return number written.\n"
1103"\n"
1104"Only makes one system call, so not all of the data may be written.\n"
1105"The number of bytes actually written is returned.");
1106
1107PyDoc_STRVAR(fileno_doc,
1108"fileno() -> int. \"file descriptor\".\n"
1109"\n"
1110"This is needed for lower-level file interfaces, such the fcntl module.");
1111
1112PyDoc_STRVAR(seek_doc,
1113"seek(offset: int[, whence: int]) -> None. Move to new file position.\n"
1114"\n"
1115"Argument offset is a byte count. Optional argument whence defaults to\n"
1116"0 (offset from start of file, offset should be >= 0); other values are 1\n"
1117"(move relative to current position, positive or negative), and 2 (move\n"
1118"relative to end of file, usually negative, although many platforms allow\n"
1119"seeking beyond the end of a file)."
1120"\n"
1121"Note that not all file objects are seekable.");
1122
Thomas Hellerc6a55ee2007-07-11 12:45:46 +00001123#ifdef HAVE_FTRUNCATE
Guido van Rossuma9e20242007-03-08 00:43:48 +00001124PyDoc_STRVAR(truncate_doc,
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001125"truncate([size: int]) -> None. Truncate the file to at most size bytes.\n"
Guido van Rossuma9e20242007-03-08 00:43:48 +00001126"\n"
Alexandre Vassalotti77250f42008-05-06 19:48:38 +00001127"Size defaults to the current file position, as returned by tell()."
1128"The current file position is changed to the value of size.");
Thomas Hellerc6a55ee2007-07-11 12:45:46 +00001129#endif
Guido van Rossuma9e20242007-03-08 00:43:48 +00001130
1131PyDoc_STRVAR(tell_doc,
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001132"tell() -> int. Current file position");
Guido van Rossuma9e20242007-03-08 00:43:48 +00001133
1134PyDoc_STRVAR(readinto_doc,
Benjamin Peterson9a8082f2009-03-05 00:55:56 +00001135"readinto() -> Same as RawIOBase.readinto().");
Guido van Rossuma9e20242007-03-08 00:43:48 +00001136
1137PyDoc_STRVAR(close_doc,
1138"close() -> None. Close the file.\n"
1139"\n"
1140"A closed file cannot be used for further I/O operations. close() may be\n"
1141"called more than once without error. Changes the fileno to -1.");
1142
1143PyDoc_STRVAR(isatty_doc,
1144"isatty() -> bool. True if the file is connected to a tty device.");
1145
Guido van Rossuma9e20242007-03-08 00:43:48 +00001146PyDoc_STRVAR(seekable_doc,
1147"seekable() -> bool. True if file supports random-access.");
1148
1149PyDoc_STRVAR(readable_doc,
1150"readable() -> bool. True if file was opened in a read mode.");
1151
1152PyDoc_STRVAR(writable_doc,
1153"writable() -> bool. True if file was opened in a write mode.");
1154
1155static PyMethodDef fileio_methods[] = {
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001156 {"read", (PyCFunction)fileio_read, METH_VARARGS, read_doc},
1157 {"readall", (PyCFunction)fileio_readall, METH_NOARGS, readall_doc},
1158 {"readinto", (PyCFunction)fileio_readinto, METH_VARARGS, readinto_doc},
1159 {"write", (PyCFunction)fileio_write, METH_VARARGS, write_doc},
1160 {"seek", (PyCFunction)fileio_seek, METH_VARARGS, seek_doc},
1161 {"tell", (PyCFunction)fileio_tell, METH_VARARGS, tell_doc},
Thomas Hellerc6a55ee2007-07-11 12:45:46 +00001162#ifdef HAVE_FTRUNCATE
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001163 {"truncate", (PyCFunction)fileio_truncate, METH_VARARGS, truncate_doc},
Thomas Hellerc6a55ee2007-07-11 12:45:46 +00001164#endif
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001165 {"close", (PyCFunction)fileio_close, METH_NOARGS, close_doc},
1166 {"seekable", (PyCFunction)fileio_seekable, METH_NOARGS, seekable_doc},
1167 {"readable", (PyCFunction)fileio_readable, METH_NOARGS, readable_doc},
1168 {"writable", (PyCFunction)fileio_writable, METH_NOARGS, writable_doc},
1169 {"fileno", (PyCFunction)fileio_fileno, METH_NOARGS, fileno_doc},
1170 {"isatty", (PyCFunction)fileio_isatty, METH_NOARGS, isatty_doc},
Antoine Pitroue033e062010-10-29 10:38:18 +00001171 {"_dealloc_warn", (PyCFunction)fileio_dealloc_warn, METH_O, NULL},
Antoine Pitrou243757e2010-11-05 21:15:39 +00001172 {"__getstate__", (PyCFunction)fileio_getstate, METH_NOARGS, NULL},
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001173 {NULL, NULL} /* sentinel */
Guido van Rossuma9e20242007-03-08 00:43:48 +00001174};
1175
Guido van Rossum53807da2007-04-10 19:01:47 +00001176/* 'closed' and 'mode' are attributes for backwards compatibility reasons. */
1177
Guido van Rossumb0428152007-04-08 17:44:42 +00001178static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +00001179get_closed(fileio *self, void *closure)
Guido van Rossumb0428152007-04-08 17:44:42 +00001180{
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001181 return PyBool_FromLong((long)(self->fd < 0));
Guido van Rossum53807da2007-04-10 19:01:47 +00001182}
1183
1184static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +00001185get_closefd(fileio *self, void *closure)
Christian Heimesecc42a22008-11-05 19:30:32 +00001186{
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001187 return PyBool_FromLong((long)(self->closefd));
Christian Heimesecc42a22008-11-05 19:30:32 +00001188}
1189
1190static PyObject *
Benjamin Peterson680bf1a2009-06-12 02:07:12 +00001191get_mode(fileio *self, void *closure)
Guido van Rossum53807da2007-04-10 19:01:47 +00001192{
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001193 return PyUnicode_FromString(mode_string(self));
Guido van Rossumb0428152007-04-08 17:44:42 +00001194}
1195
1196static PyGetSetDef fileio_getsetlist[] = {
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001197 {"closed", (getter)get_closed, NULL, "True if the file is closed"},
1198 {"closefd", (getter)get_closefd, NULL,
1199 "True if the file descriptor will be closed"},
1200 {"mode", (getter)get_mode, NULL, "String giving the file mode"},
1201 {NULL},
Guido van Rossumb0428152007-04-08 17:44:42 +00001202};
1203
Guido van Rossuma9e20242007-03-08 00:43:48 +00001204PyTypeObject PyFileIO_Type = {
Antoine Pitrouae4b4722010-05-05 16:31:07 +00001205 PyVarObject_HEAD_INIT(NULL, 0)
1206 "_io.FileIO",
1207 sizeof(fileio),
1208 0,
1209 (destructor)fileio_dealloc, /* tp_dealloc */
1210 0, /* tp_print */
1211 0, /* tp_getattr */
1212 0, /* tp_setattr */
1213 0, /* tp_reserved */
1214 (reprfunc)fileio_repr, /* tp_repr */
1215 0, /* tp_as_number */
1216 0, /* tp_as_sequence */
1217 0, /* tp_as_mapping */
1218 0, /* tp_hash */
1219 0, /* tp_call */
1220 0, /* tp_str */
1221 PyObject_GenericGetAttr, /* tp_getattro */
1222 0, /* tp_setattro */
1223 0, /* tp_as_buffer */
1224 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE
1225 | Py_TPFLAGS_HAVE_GC, /* tp_flags */
1226 fileio_doc, /* tp_doc */
1227 (traverseproc)fileio_traverse, /* tp_traverse */
1228 (inquiry)fileio_clear, /* tp_clear */
1229 0, /* tp_richcompare */
1230 offsetof(fileio, weakreflist), /* tp_weaklistoffset */
1231 0, /* tp_iter */
1232 0, /* tp_iternext */
1233 fileio_methods, /* tp_methods */
1234 0, /* tp_members */
1235 fileio_getsetlist, /* tp_getset */
1236 0, /* tp_base */
1237 0, /* tp_dict */
1238 0, /* tp_descr_get */
1239 0, /* tp_descr_set */
1240 offsetof(fileio, dict), /* tp_dictoffset */
1241 fileio_init, /* tp_init */
1242 PyType_GenericAlloc, /* tp_alloc */
1243 fileio_new, /* tp_new */
1244 PyObject_GC_Del, /* tp_free */
Guido van Rossuma9e20242007-03-08 00:43:48 +00001245};