diff options
author | Guido van Rossum <guido@python.org> | 2007-03-08 00:43:48 (GMT) |
---|---|---|
committer | Guido van Rossum <guido@python.org> | 2007-03-08 00:43:48 (GMT) |
commit | a9e2024b8443959cc906958d161afe9f0d08bc25 (patch) | |
tree | e90d1893c99002ba822e9f7e9b4c41ce79923774 /Modules/_fileio.c | |
parent | 4d0f5a4934854207948115b14b4643a6cb600a0d (diff) | |
download | cpython-a9e2024b8443959cc906958d161afe9f0d08bc25.zip cpython-a9e2024b8443959cc906958d161afe9f0d08bc25.tar.gz cpython-a9e2024b8443959cc906958d161afe9f0d08bc25.tar.bz2 |
Check in Daniel Stutzbach's _fileio.c and test_fileio.py
(see SF#1671314) with small tweaks.
The io module now uses this instead of its own implementation
of the FileIO class, if it can import _fileio.
Diffstat (limited to 'Modules/_fileio.c')
-rw-r--r-- | Modules/_fileio.c | 713 |
1 files changed, 713 insertions, 0 deletions
diff --git a/Modules/_fileio.c b/Modules/_fileio.c new file mode 100644 index 0000000..9ab27c1 --- /dev/null +++ b/Modules/_fileio.c @@ -0,0 +1,713 @@ +/* Author: Daniel Stutzbach */ + +#define PY_SSIZE_T_CLEAN +#include "Python.h" +#include <sys/types.h> +#include <sys/stat.h> +#include <fcntl.h> +#include <stddef.h> /* For offsetof */ + +/* + * Known likely problems: + * + * - Files larger then 2**32-1 + * - Files with unicode filenames + * - Passing numbers greater than 2**32-1 when an integer is expected + * - Making it work on Windows and other oddball platforms + * + * To Do: + * + * - autoconfify header file inclusion + * - Make the ABC RawIO type and inherit from it. + * + * Unanswered questions: + * + * - Add mode, name, and closed properties a la Python 2 file objects? + * - Do we need a (*close)() in the struct like Python 2 file objects, + * for not-quite-ordinary-file objects? + */ + +#ifdef MS_WINDOWS +/* can simulate truncate with Win32 API functions; see file_truncate */ +#define HAVE_FTRUNCATE +#define WIN32_LEAN_AND_MEAN +#include <windows.h> +#endif + +typedef struct { + PyObject_HEAD + int fd; + int own_fd; /* 1 means we should close fd */ + int readable; + int writable; + int seekable; /* -1 means unknown */ + PyObject *weakreflist; +} PyFileIOObject; + +#define PyFileIO_Check(op) (PyObject_TypeCheck((op), &PyFileIO_Type)) + +/* Note: if this function is changed so that it can return a true value, + * then we need a separate function for __exit__ + */ +static PyObject * +fileio_close(PyFileIOObject *self) +{ + if (self->fd >= 0) { + Py_BEGIN_ALLOW_THREADS + errno = 0; + close(self->fd); + Py_END_ALLOW_THREADS + if (errno < 0) { + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + self->fd = -1; + } + + Py_RETURN_NONE; +} + +static PyObject * +fileio_new(PyTypeObject *type, PyObject *args, PyObject *kews) +{ + PyFileIOObject *self; + + assert(type != NULL && type->tp_alloc != NULL); + + self = (PyFileIOObject *) type->tp_alloc(type, 0); + if (self != NULL) { + self->fd = -1; + self->weakreflist = NULL; + self->own_fd = 1; + self->seekable = -1; + } + + return (PyObject *) self; +} + +/* On Unix, open will succeed for directories. + In Python, there should be no file objects referring to + directories, so we need a check. */ + +static int +dircheck(PyFileIOObject* self) +{ +#if defined(HAVE_FSTAT) && defined(S_IFDIR) && defined(EISDIR) + struct stat buf; + if (self->fd < 0) + return 0; + if (fstat(self->fd, &buf) == 0 && S_ISDIR(buf.st_mode)) { +#ifdef HAVE_STRERROR + char *msg = strerror(EISDIR); +#else + char *msg = "Is a directory"; +#endif + PyObject *exc; + PyObject *closeresult = fileio_close(self); + Py_DECREF(closeresult); + + exc = PyObject_CallFunction(PyExc_IOError, "(is)", + EISDIR, msg); + PyErr_SetObject(PyExc_IOError, exc); + Py_XDECREF(exc); + return -1; + } +#endif + return 0; +} + + +static int +fileio_init(PyObject *oself, PyObject *args, PyObject *kwds) +{ + PyFileIOObject *self = (PyFileIOObject *) oself; + static char *kwlist[] = {"filename", "mode", NULL}; + char *name = NULL; + char *mode = "r"; + char *s; + int wideargument = 0; + int ret = 0; + int rwa = 0, plus = 0, append = 0; + int flags = 0; + + assert(PyFileIO_Check(oself)); + if (self->fd >= 0) + { + /* Have to close the existing file first. */ + PyObject *closeresult = fileio_close(self); + if (closeresult == NULL) + return -1; + Py_DECREF(closeresult); + } + +#ifdef Py_WIN_WIDE_FILENAMES + if (GetVersion() < 0x80000000) { /* On NT, so wide API available */ + PyObject *po; + if (PyArg_ParseTupleAndKeywords(args, kwds, "U|s:fileio", + kwlist, &po, &mode)) { + wideargument = 1; + } else { + /* Drop the argument parsing error as narrow + strings are also valid. */ + PyErr_Clear(); + } + + PyErr_SetString(PyExc_NotImplementedError, + "Windows wide filenames are not yet supported"); + goto error; + } +#endif + + if (!wideargument) { + if (!PyArg_ParseTupleAndKeywords(args, kwds, "et|s:fileio", + kwlist, + Py_FileSystemDefaultEncoding, + &name, &mode)) + goto error; + } + + self->readable = self->writable = 0; + s = mode; + while (*s) { + switch (*s++) { + case 'r': + if (rwa) { + bad_mode: + PyErr_SetString(PyExc_ValueError, + "Must have exactly one of read/write/append mode"); + goto error; + } + rwa = 1; + self->readable = 1; + break; + case 'w': + if (rwa) + goto bad_mode; + rwa = 1; + self->writable = 1; + flags |= O_CREAT | O_TRUNC; + break; + case 'a': + if (rwa) + goto bad_mode; + rwa = 1; + self->writable = 1; + flags |= O_CREAT; + append = 1; + break; + case '+': + if (plus) + goto bad_mode; + self->readable = self->writable = 1; + plus = 1; + break; + default: + PyErr_Format(PyExc_ValueError, + "invalid mode: %.200s", mode); + goto error; + } + } + + if (!rwa) + goto bad_mode; + + if (self->readable && self->writable) + flags |= O_RDWR; + else if (self->readable) + flags |= O_RDONLY; + else + flags |= O_WRONLY; + +#ifdef O_BINARY + flags |= O_BINARY; +#endif + + Py_BEGIN_ALLOW_THREADS + errno = 0; + self->fd = open(name, flags, 0666); + Py_END_ALLOW_THREADS + if (self->fd < 0 || dircheck(self) < 0) { + PyErr_SetFromErrnoWithFilename(PyExc_IOError, name); + goto error; + } + + goto done; + + error: + ret = -1; + + done: + PyMem_Free(name); + return ret; +} + +static void +fileio_dealloc(PyFileIOObject *self) +{ + if (self->weakreflist != NULL) + PyObject_ClearWeakRefs((PyObject *) self); + + if (self->fd >= 0 && self->own_fd) { + PyObject *closeresult = fileio_close(self); + if (closeresult == NULL) { +#ifdef HAVE_STRERROR + PySys_WriteStderr("close failed: [Errno %d] %s\n", errno, strerror(errno)); +#else + PySys_WriteStderr("close failed: [Errno %d]\n", errno); +#endif + } else + Py_DECREF(closeresult); + } + + self->ob_type->tp_free((PyObject *)self); +} + +static PyObject * +err_closed(void) +{ + PyErr_SetString(PyExc_ValueError, "I/O operation on closed file"); + return NULL; +} + +static PyObject * +fileio_fileno(PyFileIOObject *self) +{ + if (self->fd < 0) + return err_closed(); + return PyInt_FromLong((long) self->fd); +} + +static PyObject * +fileio_readable(PyFileIOObject *self) +{ + if (self->fd < 0) + return err_closed(); + return PyInt_FromLong((long) self->readable); +} + +static PyObject * +fileio_writable(PyFileIOObject *self) +{ + if (self->fd < 0) + return err_closed(); + return PyInt_FromLong((long) self->writable); +} + +static PyObject * +fileio_seekable(PyFileIOObject *self) +{ + if (self->fd < 0) + return err_closed(); + if (self->seekable < 0) { + int ret; + Py_BEGIN_ALLOW_THREADS + ret = lseek(self->fd, 0, SEEK_CUR); + Py_END_ALLOW_THREADS + if (ret < 0) + self->seekable = 0; + else + self->seekable = 1; + } + return PyInt_FromLong((long) self->seekable); +} + +static PyObject * +fileio_readinto(PyFileIOObject *self, PyObject *args) +{ + char *ptr; + Py_ssize_t n; + + if (self->fd < 0) + return err_closed(); + if (!PyArg_ParseTuple(args, "w#", &ptr, &n)) + return NULL; + + Py_BEGIN_ALLOW_THREADS + errno = 0; + n = read(self->fd, ptr, n); + Py_END_ALLOW_THREADS + if (n < 0) { + if (errno == EAGAIN) + Py_RETURN_NONE; + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + + return PyInt_FromLong(n); +} + +static PyObject * +fileio_read(PyFileIOObject *self, PyObject *args) +{ + char *ptr; + Py_ssize_t n, size; + PyObject *bytes; + + if (self->fd < 0) + return err_closed(); + + if (!PyArg_ParseTuple(args, "i", &size)) + return NULL; + + bytes = PyBytes_FromStringAndSize(NULL, size); + if (bytes == NULL) + return NULL; + ptr = PyBytes_AsString(bytes); + + Py_BEGIN_ALLOW_THREADS + errno = 0; + n = read(self->fd, ptr, size); + Py_END_ALLOW_THREADS + + if (n < 0) { + if (errno == EAGAIN) + Py_RETURN_NONE; + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + + if (n != size) { + if (PyBytes_Resize(bytes, n) < 0) { + Py_DECREF(bytes); + return NULL; + } + } + + return (PyObject *) bytes; +} + +static PyObject * +fileio_write(PyFileIOObject *self, PyObject *args) +{ + Py_ssize_t n; + char *ptr; + + if (self->fd < 0) + return err_closed(); + if (!PyArg_ParseTuple(args, "s#", &ptr, &n)) + return NULL; + + Py_BEGIN_ALLOW_THREADS + errno = 0; + n = write(self->fd, ptr, n); + Py_END_ALLOW_THREADS + + if (n < 0) { + if (errno == EAGAIN) + Py_RETURN_NONE; + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + + return PyInt_FromLong(n); +} + +static PyObject * +fileio_seek(PyFileIOObject *self, PyObject *args) +{ + Py_ssize_t offset; + Py_ssize_t whence = 0; + + if (self->fd < 0) + return err_closed(); + + if (!PyArg_ParseTuple(args, "i|i", &offset, &whence)) + return NULL; + + Py_BEGIN_ALLOW_THREADS + errno = 0; + offset = lseek(self->fd, offset, whence); + Py_END_ALLOW_THREADS + + if (offset < 0) { + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + + Py_RETURN_NONE; +} + +static PyObject * +fileio_tell(PyFileIOObject *self, PyObject *args) +{ + Py_ssize_t offset; + + if (self->fd < 0) + return err_closed(); + + Py_BEGIN_ALLOW_THREADS + errno = 0; + offset = lseek(self->fd, 0, SEEK_CUR); + Py_END_ALLOW_THREADS + + if (offset < 0) { + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + + return PyInt_FromLong(offset); +} + +#ifdef HAVE_FTRUNCATE +static PyObject * +fileio_truncate(PyFileIOObject *self, PyObject *args) +{ + Py_ssize_t length; + int ret; + + if (self->fd < 0) + return err_closed(); + + /* Setup default value */ + Py_BEGIN_ALLOW_THREADS + errno = 0; + length = lseek(self->fd, 0, SEEK_CUR); + Py_END_ALLOW_THREADS + + if (length < 0) { + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + + if (!PyArg_ParseTuple(args, "|i", &length)) + return NULL; + +#ifdef MS_WINDOWS + /* MS _chsize doesn't work if newsize doesn't fit in 32 bits, + so don't even try using it. */ + { + HANDLE hFile; + Py_ssize_t initialpos; + + /* Have to move current pos to desired endpoint on Windows. */ + Py_BEGIN_ALLOW_THREADS + errno = 0; + ret = _portable_fseek(f->f_fp, newsize, SEEK_SET) != 0; + Py_END_ALLOW_THREADS + if (ret) + goto onioerror; + + /* Truncate. Note that this may grow the file! */ + Py_BEGIN_ALLOW_THREADS + errno = 0; + hFile = (HANDLE)_get_osfhandle(fileno(f->f_fp)); + ret = hFile == (HANDLE)-1; + if (ret == 0) { + ret = SetEndOfFile(hFile) == 0; + if (ret) + errno = EACCES; + } + Py_END_ALLOW_THREADS + if (ret) + goto onioerror; + } +#else + Py_BEGIN_ALLOW_THREADS + errno = 0; + ret = ftruncate(self->fd, length); + Py_END_ALLOW_THREADS +#endif /* !MS_WINDOWS */ + + if (ret < 0) { + onioerror: + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + + /* Return to initial position */ + Py_BEGIN_ALLOW_THREADS + errno = 0; + ret = lseek(self->fd, length, SEEK_SET); + Py_END_ALLOW_THREADS + if (ret < 0) + goto onioerror; + + Py_RETURN_NONE; +} +#endif + +static PyObject * +fileio_repr(PyFileIOObject *self) +{ + PyObject *ret = NULL; + + ret = PyString_FromFormat("<%s file at %p>", + self->fd < 0 ? "closed" : "open", + self); + return ret; +} + +static PyObject * +fileio_isatty(PyFileIOObject *self) +{ + long res; + + if (self->fd < 0) + return err_closed(); + Py_BEGIN_ALLOW_THREADS + res = isatty(self->fd); + Py_END_ALLOW_THREADS + return PyBool_FromLong(res); +} + +static PyObject * +fileio_self(PyFileIOObject *self) +{ + if (self->fd < 0) + return err_closed(); + Py_INCREF(self); + return (PyObject *)self; +} + +PyDoc_STRVAR(fileio_doc, +"file(name: str[, mode: str]) -> file IO object\n" +"\n" +"Open a file. The mode can be 'r', 'w' or 'a' for reading (default),\n" +"writing or appending. The file will be created if it doesn't exist\n" +"when opened for writing or appending; it will be truncated when\n" +"opened for writing. Add a '+' to the mode to allow simultaneous\n" +"reading and writing."); + +PyDoc_STRVAR(read_doc, +"read(size: int) -> bytes. read at most size bytes, returned as bytes.\n" +"\n" +"Only makes one system call, so less data may be returned than requested\n" +"In non-blocking mode, returns None if no data is available. On\n" +"end-of-file, returns 0."); + +PyDoc_STRVAR(write_doc, +"write(b: bytes) -> int. Write bytes b to file, return number written.\n" +"\n" +"Only makes one system call, so not all of the data may be written.\n" +"The number of bytes actually written is returned."); + +PyDoc_STRVAR(fileno_doc, +"fileno() -> int. \"file descriptor\".\n" +"\n" +"This is needed for lower-level file interfaces, such the fcntl module."); + +PyDoc_STRVAR(seek_doc, +"seek(offset: int[, whence: int]) -> None. Move to new file position.\n" +"\n" +"Argument offset is a byte count. Optional argument whence defaults to\n" +"0 (offset from start of file, offset should be >= 0); other values are 1\n" +"(move relative to current position, positive or negative), and 2 (move\n" +"relative to end of file, usually negative, although many platforms allow\n" +"seeking beyond the end of a file)." +"\n" +"Note that not all file objects are seekable."); + +PyDoc_STRVAR(truncate_doc, +"truncate([size: int]) -> None. Truncate the file to at most size bytes.\n" +"\n" +"Size defaults to the current file position, as returned by tell()."); + +PyDoc_STRVAR(tell_doc, +"tell() -> int. Current file position"); + +PyDoc_STRVAR(readinto_doc, +"readinto() -> Undocumented. Don't use this; it may go away."); + +PyDoc_STRVAR(close_doc, +"close() -> None. Close the file.\n" +"\n" +"A closed file cannot be used for further I/O operations. close() may be\n" +"called more than once without error. Changes the fileno to -1."); + +PyDoc_STRVAR(isatty_doc, +"isatty() -> bool. True if the file is connected to a tty device."); + +PyDoc_STRVAR(enter_doc, +"__enter__() -> self."); + +PyDoc_STRVAR(exit_doc, +"__exit__(*excinfo) -> None. Closes the file."); + +PyDoc_STRVAR(seekable_doc, +"seekable() -> bool. True if file supports random-access."); + +PyDoc_STRVAR(readable_doc, +"readable() -> bool. True if file was opened in a read mode."); + +PyDoc_STRVAR(writable_doc, +"writable() -> bool. True if file was opened in a write mode."); + +static PyMethodDef fileio_methods[] = { + {"read", (PyCFunction)fileio_read, METH_VARARGS, read_doc}, + {"readinto", (PyCFunction)fileio_readinto, METH_VARARGS, readinto_doc}, + {"write", (PyCFunction)fileio_write, METH_VARARGS, write_doc}, + {"seek", (PyCFunction)fileio_seek, METH_VARARGS, seek_doc}, + {"tell", (PyCFunction)fileio_tell, METH_VARARGS, tell_doc}, + {"truncate", (PyCFunction)fileio_truncate, METH_VARARGS, truncate_doc}, + {"close", (PyCFunction)fileio_close, METH_NOARGS, close_doc}, + {"seekable", (PyCFunction)fileio_seekable, METH_NOARGS, seekable_doc}, + {"readable", (PyCFunction)fileio_readable, METH_NOARGS, readable_doc}, + {"writable", (PyCFunction)fileio_writable, METH_NOARGS, writable_doc}, + {"fileno", (PyCFunction)fileio_fileno, METH_NOARGS, fileno_doc}, + {"isatty", (PyCFunction)fileio_isatty, METH_NOARGS, isatty_doc}, + {"__enter__",(PyCFunction)fileio_self, METH_NOARGS, enter_doc}, + {"__exit__", (PyCFunction)fileio_close, METH_VARARGS, exit_doc}, + {NULL, NULL} /* sentinel */ +}; + +PyTypeObject PyFileIO_Type = { + PyObject_HEAD_INIT(&PyType_Type) + 0, + "FileIO", + sizeof(PyFileIOObject), + 0, + (destructor)fileio_dealloc, /* tp_dealloc */ + 0, /* tp_print */ + 0, /* tp_getattr */ + 0, /* tp_setattr */ + 0, /* tp_compare */ + (reprfunc)fileio_repr, /* tp_repr */ + 0, /* tp_as_number */ + 0, /* tp_as_sequence */ + 0, /* tp_as_mapping */ + 0, /* tp_hash */ + 0, /* tp_call */ + 0, /* tp_str */ + PyObject_GenericGetAttr, /* tp_getattro */ + 0, /* tp_setattro */ + 0, /* tp_as_buffer */ + Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE, /* tp_flags */ + fileio_doc, /* tp_doc */ + 0, /* tp_traverse */ + 0, /* tp_clear */ + 0, /* tp_richcompare */ + offsetof(PyFileIOObject, weakreflist), /* tp_weaklistoffset */ + 0, /* tp_iter */ + 0, /* tp_iternext */ + fileio_methods, /* tp_methods */ + 0, /* tp_members */ + 0, /* tp_getset */ + 0, /* tp_base */ + 0, /* tp_dict */ + 0, /* tp_descr_get */ + 0, /* tp_descr_set */ + 0, /* tp_dictoffset */ + fileio_init, /* tp_init */ + PyType_GenericAlloc, /* tp_alloc */ + fileio_new, /* tp_new */ + PyObject_Del, /* tp_free */ +}; + +static PyMethodDef module_methods[] = { + {NULL, NULL} +}; + +PyMODINIT_FUNC +init_fileio(void) +{ + PyObject *m; /* a module object */ + + m = Py_InitModule3("_fileio", module_methods, + "Fast implementation of io.FileIO."); + if (m == NULL) + return; + if (PyType_Ready(&PyFileIO_Type) < 0) + return; + Py_INCREF(&PyFileIO_Type); + PyModule_AddObject(m, "_FileIO", (PyObject *) &PyFileIO_Type); +} |