summaryrefslogtreecommitdiffstats
path: root/Modules/_fileio.c
diff options
context:
space:
mode:
authorGuido van Rossum <guido@python.org>2007-03-08 00:43:48 (GMT)
committerGuido van Rossum <guido@python.org>2007-03-08 00:43:48 (GMT)
commita9e2024b8443959cc906958d161afe9f0d08bc25 (patch)
treee90d1893c99002ba822e9f7e9b4c41ce79923774 /Modules/_fileio.c
parent4d0f5a4934854207948115b14b4643a6cb600a0d (diff)
downloadcpython-a9e2024b8443959cc906958d161afe9f0d08bc25.zip
cpython-a9e2024b8443959cc906958d161afe9f0d08bc25.tar.gz
cpython-a9e2024b8443959cc906958d161afe9f0d08bc25.tar.bz2
Check in Daniel Stutzbach's _fileio.c and test_fileio.py
(see SF#1671314) with small tweaks. The io module now uses this instead of its own implementation of the FileIO class, if it can import _fileio.
Diffstat (limited to 'Modules/_fileio.c')
-rw-r--r--Modules/_fileio.c713
1 files changed, 713 insertions, 0 deletions
diff --git a/Modules/_fileio.c b/Modules/_fileio.c
new file mode 100644
index 0000000..9ab27c1
--- /dev/null
+++ b/Modules/_fileio.c
@@ -0,0 +1,713 @@
+/* Author: Daniel Stutzbach */
+
+#define PY_SSIZE_T_CLEAN
+#include "Python.h"
+#include <sys/types.h>
+#include <sys/stat.h>
+#include <fcntl.h>
+#include <stddef.h> /* For offsetof */
+
+/*
+ * Known likely problems:
+ *
+ * - Files larger than 2**32-1
+ * - Files with unicode filenames
+ * - Passing numbers greater than 2**32-1 when an integer is expected
+ * - Making it work on Windows and other oddball platforms
+ *
+ * To Do:
+ *
+ * - autoconfify header file inclusion
+ * - Make the ABC RawIO type and inherit from it.
+ *
+ * Unanswered questions:
+ *
+ * - Add mode, name, and closed properties a la Python 2 file objects?
+ * - Do we need a (*close)() in the struct like Python 2 file objects,
+ * for not-quite-ordinary-file objects?
+ */
+
+#ifdef MS_WINDOWS
+/* can simulate truncate with Win32 API functions; see fileio_truncate */
+#define HAVE_FTRUNCATE
+#define WIN32_LEAN_AND_MEAN
+#include <windows.h>
+#endif
+
+typedef struct { /* Instance layout of a FileIO object. */
+ PyObject_HEAD
+ int fd; /* OS-level file descriptor; -1 when no file is open */
+ int own_fd; /* 1 means we should close fd */
+ int readable; /* nonzero if the mode given to __init__ allows reading */
+ int writable; /* nonzero if the mode given to __init__ allows writing */
+ int seekable; /* -1 means unknown */
+ PyObject *weakreflist; /* weak reference list, located via tp_weaklistoffset */
+} PyFileIOObject;
+
+/* Forward declaration: the type object is defined near the end of this file,
+ * but PyFileIO_Check() is expanded earlier (inside an assert in fileio_init),
+ * so the name must already be visible there. */
+extern PyTypeObject PyFileIO_Type;
+
+/* True if op is an instance of FileIO or of one of its subclasses. */
+#define PyFileIO_Check(op) (PyObject_TypeCheck((op), &PyFileIO_Type))
+
+/* Close the underlying file descriptor, if one is open.
+ *
+ * Returns a new reference to None on success (including when the file is
+ * already closed).  Returns NULL with IOError set when close() fails.
+ * In either case self->fd is -1 afterwards.
+ *
+ * Note: if this function is changed so that it can return a true value,
+ * then we need a separate function for __exit__
+ */
+static PyObject *
+fileio_close(PyFileIOObject *self)
+{
+    if (self->fd >= 0) {
+        int fd = self->fd;
+        int rc;
+
+        /* Forget the descriptor before closing it: once close() has been
+           attempted the descriptor must not be used or closed again, even
+           if the call reported an error. */
+        self->fd = -1;
+
+        Py_BEGIN_ALLOW_THREADS
+        errno = 0;
+        rc = close(fd);
+        Py_END_ALLOW_THREADS
+
+        /* Failure is signalled by the return value; errno itself is never
+           negative, so it cannot be used as the test. */
+        if (rc < 0) {
+            PyErr_SetFromErrno(PyExc_IOError);
+            return NULL;
+        }
+    }
+
+    Py_RETURN_NONE;
+}
+
+/* tp_new slot: allocate a FileIO instance in the "closed" state.
+ * The positional and keyword arguments are not examined here; opening the
+ * file is left to fileio_init.  Returns NULL if the allocation fails. */
+static PyObject *
+fileio_new(PyTypeObject *type, PyObject *args, PyObject *kews)
+{
+    PyFileIOObject *obj;
+
+    assert(type != NULL && type->tp_alloc != NULL);
+
+    obj = (PyFileIOObject *) type->tp_alloc(type, 0);
+    if (obj == NULL)
+        return NULL;
+
+    obj->fd = -1;          /* no file open yet */
+    obj->own_fd = 1;
+    obj->seekable = -1;    /* not probed yet */
+    obj->weakreflist = NULL;
+
+    return (PyObject *) obj;
+}
+
+/* On Unix, open will succeed for directories.
+   In Python, there should be no file objects referring to
+   directories, so we need a check.
+
+   Returns 0 if self->fd does not refer to a directory (or if the check is
+   not available on this platform).  Otherwise closes the descriptor, sets
+   an IOError carrying EISDIR and returns -1. */
+
+static int
+dircheck(PyFileIOObject* self)
+{
+#if defined(HAVE_FSTAT) && defined(S_IFDIR) && defined(EISDIR)
+    struct stat buf;
+    if (self->fd < 0)
+        return 0;
+    if (fstat(self->fd, &buf) == 0 && S_ISDIR(buf.st_mode)) {
+#ifdef HAVE_STRERROR
+        char *msg = strerror(EISDIR);
+#else
+        char *msg = "Is a directory";
+#endif
+        PyObject *exc;
+        PyObject *closeresult = fileio_close(self);
+
+        /* fileio_close may return NULL; the EISDIR error raised below is
+           the one worth reporting, so drop any close failure. */
+        if (closeresult == NULL)
+            PyErr_Clear();
+        else
+            Py_DECREF(closeresult);
+
+        exc = PyObject_CallFunction(PyExc_IOError, "(is)",
+                                    EISDIR, msg);
+        /* If building the exception failed, the error raised by
+           PyObject_CallFunction is already set; keep it. */
+        if (exc != NULL) {
+            PyErr_SetObject(PyExc_IOError, exc);
+            Py_DECREF(exc);
+        }
+        return -1;
+    }
+#endif
+    return 0;
+}
+
+
+/* tp_init slot: FileIO(filename[, mode]).
+ *
+ * Closes any file this object already has open, parses the mode string
+ * (exactly one of 'r', 'w', 'a', optionally combined with one '+'), and
+ * opens the file with the corresponding open() flags.
+ *
+ * Returns 0 on success and -1 with an exception set on failure:
+ *   ValueError           - malformed mode string
+ *   IOError              - open() failed, or the path is a directory
+ *   NotImplementedError  - Windows wide-filename build (not yet supported)
+ */
+static int
+fileio_init(PyObject *oself, PyObject *args, PyObject *kwds)
+{
+    PyFileIOObject *self = (PyFileIOObject *) oself;
+    static char *kwlist[] = {"filename", "mode", NULL};
+    char *name = NULL;
+    char *mode = "r";
+    char *s;
+    int wideargument = 0;
+    int ret = 0;
+    int rwa = 0, plus = 0, append = 0;
+    int flags = 0;
+
+    assert(PyFileIO_Check(oself));
+    if (self->fd >= 0) {
+        /* Have to close the existing file first. */
+        PyObject *closeresult = fileio_close(self);
+        if (closeresult == NULL)
+            return -1;
+        Py_DECREF(closeresult);
+    }
+
+#ifdef Py_WIN_WIDE_FILENAMES
+    if (GetVersion() < 0x80000000) { /* On NT, so wide API available */
+        PyObject *po;
+        if (PyArg_ParseTupleAndKeywords(args, kwds, "U|s:fileio",
+                                        kwlist, &po, &mode)) {
+            wideargument = 1;
+        } else {
+            /* Drop the argument parsing error as narrow
+               strings are also valid. */
+            PyErr_Clear();
+        }
+
+        PyErr_SetString(PyExc_NotImplementedError,
+                        "Windows wide filenames are not yet supported");
+        goto error;
+    }
+#endif
+
+    if (!wideargument) {
+        /* "et" yields a newly allocated, encoded copy of the filename in
+           `name`; it is released with PyMem_Free at `done`. */
+        if (!PyArg_ParseTupleAndKeywords(args, kwds, "et|s:fileio",
+                                         kwlist,
+                                         Py_FileSystemDefaultEncoding,
+                                         &name, &mode))
+            goto error;
+    }
+
+    self->readable = self->writable = 0;
+    for (s = mode; *s; s++) {
+        switch (*s) {
+        case 'r':
+            if (rwa)
+                goto bad_mode;
+            rwa = 1;
+            self->readable = 1;
+            break;
+        case 'w':
+            if (rwa)
+                goto bad_mode;
+            rwa = 1;
+            self->writable = 1;
+            flags |= O_CREAT | O_TRUNC;
+            break;
+        case 'a':
+            if (rwa)
+                goto bad_mode;
+            rwa = 1;
+            self->writable = 1;
+            flags |= O_CREAT;
+            append = 1;
+            break;
+        case '+':
+            if (plus)
+                goto bad_mode;
+            self->readable = self->writable = 1;
+            plus = 1;
+            break;
+        default:
+            PyErr_Format(PyExc_ValueError,
+                         "invalid mode: %.200s", mode);
+            goto error;
+        }
+    }
+
+    if (!rwa)
+        goto bad_mode;
+
+    if (self->readable && self->writable)
+        flags |= O_RDWR;
+    else if (self->readable)
+        flags |= O_RDONLY;
+    else
+        flags |= O_WRONLY;
+
+#ifdef O_BINARY
+    flags |= O_BINARY;
+#endif
+
+#ifdef O_APPEND
+    /* Without O_APPEND, mode 'a' would write at offset 0 and overwrite
+       the start of an existing file instead of appending to it. */
+    if (append)
+        flags |= O_APPEND;
+#endif
+
+    Py_BEGIN_ALLOW_THREADS
+    errno = 0;
+    self->fd = open(name, flags, 0666);
+    Py_END_ALLOW_THREADS
+    if (self->fd < 0) {
+        PyErr_SetFromErrnoWithFilename(PyExc_IOError, name);
+        goto error;
+    }
+    /* dircheck() raises its own IOError(EISDIR); do not replace it with
+       one built from whatever errno happens to hold. */
+    if (dircheck(self) < 0)
+        goto error;
+
+    goto done;
+
+ bad_mode:
+    PyErr_SetString(PyExc_ValueError,
+                    "Must have exactly one of read/write/append mode");
+    /* fall through */
+
+ error:
+    ret = -1;
+
+ done:
+    PyMem_Free(name);
+    return ret;
+}
+
+/* tp_dealloc slot: clear weak references, close the descriptor if this
+ * object owns it, and free the object.
+ *
+ * A failing close is reported on stderr.  A destructor must neither raise
+ * nor disturb an exception that is already propagating, so any pending
+ * exception is saved around the close and the close error is cleared. */
+static void
+fileio_dealloc(PyFileIOObject *self)
+{
+    if (self->weakreflist != NULL)
+        PyObject_ClearWeakRefs((PyObject *) self);
+
+    if (self->fd >= 0 && self->own_fd) {
+        PyObject *exc_type, *exc_value, *exc_tb;
+        PyObject *closeresult;
+
+        PyErr_Fetch(&exc_type, &exc_value, &exc_tb);
+
+        closeresult = fileio_close(self);
+        if (closeresult == NULL) {
+#ifdef HAVE_STRERROR
+            PySys_WriteStderr("close failed: [Errno %d] %s\n", errno, strerror(errno));
+#else
+            PySys_WriteStderr("close failed: [Errno %d]\n", errno);
+#endif
+            PyErr_Clear();
+        } else
+            Py_DECREF(closeresult);
+
+        PyErr_Restore(exc_type, exc_value, exc_tb);
+    }
+
+    self->ob_type->tp_free((PyObject *)self);
+}
+
+/* Set ValueError("I/O operation on closed file").  Always returns NULL so
+ * that callers can write `return err_closed();`. */
+static PyObject *
+err_closed(void)
+{
+    PyObject *failure = NULL;
+
+    PyErr_SetString(PyExc_ValueError, "I/O operation on closed file");
+    return failure;
+}
+
+/* fileno(): return the OS-level descriptor as an int; raises ValueError
+ * if the file is closed. */
+static PyObject *
+fileio_fileno(PyFileIOObject *self)
+{
+    if (self->fd >= 0)
+        return PyInt_FromLong((long) self->fd);
+
+    return err_closed();
+}
+
+/* readable(): True if the file was opened in a mode that allows reading.
+ * Raises ValueError if the file is closed.
+ *
+ * Returns a real bool, as the docstring promises and as isatty() does;
+ * bool is a subclass of int, so callers that tested the old 0/1 result
+ * keep working. */
+static PyObject *
+fileio_readable(PyFileIOObject *self)
+{
+    if (self->fd < 0)
+        return err_closed();
+    return PyBool_FromLong((long) self->readable);
+}
+
+/* writable(): True if the file was opened in a mode that allows writing.
+ * Raises ValueError if the file is closed.
+ *
+ * Returns a real bool, as the docstring promises and as isatty() does;
+ * bool is a subclass of int, so callers that tested the old 0/1 result
+ * keep working. */
+static PyObject *
+fileio_writable(PyFileIOObject *self)
+{
+    if (self->fd < 0)
+        return err_closed();
+    return PyBool_FromLong((long) self->writable);
+}
+
+/* seekable(): True if the descriptor supports lseek().
+ * Raises ValueError if the file is closed.
+ *
+ * The answer is probed once with lseek(fd, 0, SEEK_CUR) and cached in
+ * self->seekable (-1 means "not probed yet"). */
+static PyObject *
+fileio_seekable(PyFileIOObject *self)
+{
+    if (self->fd < 0)
+        return err_closed();
+    if (self->seekable < 0) {
+        /* Keep the full off_t: narrowing the position to int could make a
+           large valid offset look negative and report "not seekable". */
+        off_t pos;
+        Py_BEGIN_ALLOW_THREADS
+        pos = lseek(self->fd, 0, SEEK_CUR);
+        Py_END_ALLOW_THREADS
+        self->seekable = (pos < 0) ? 0 : 1;
+    }
+    return PyBool_FromLong((long) self->seekable);
+}
+
+/* readinto(buffer): perform a single read() into a writable buffer.
+ *
+ * Returns the number of bytes read as an int, None if read() failed with
+ * EAGAIN, or NULL with IOError set for any other failure.  Raises
+ * ValueError if the file is closed. */
+static PyObject *
+fileio_readinto(PyFileIOObject *self, PyObject *args)
+{
+    char *buffer;
+    Py_ssize_t count;
+
+    if (self->fd < 0)
+        return err_closed();
+    if (!PyArg_ParseTuple(args, "w#", &buffer, &count))
+        return NULL;
+
+    Py_BEGIN_ALLOW_THREADS
+    errno = 0;
+    count = read(self->fd, buffer, count);
+    Py_END_ALLOW_THREADS
+
+    if (count >= 0)
+        return PyInt_FromLong(count);
+
+    if (errno == EAGAIN)
+        Py_RETURN_NONE;
+
+    PyErr_SetFromErrno(PyExc_IOError);
+    return NULL;
+}
+
+/* read(size): perform a single read() of at most size bytes.
+ *
+ * Returns a bytes object (shorter than size when less data was available,
+ * empty at end-of-file), None if read() failed with EAGAIN, or NULL with
+ * an exception set:
+ *   ValueError - the file is closed, or size is negative
+ *   IOError    - read() failed for a reason other than EAGAIN
+ */
+static PyObject *
+fileio_read(PyFileIOObject *self, PyObject *args)
+{
+    char *ptr;
+    Py_ssize_t n, size;
+    PyObject *bytes;
+
+    if (self->fd < 0)
+        return err_closed();
+
+    /* "n" matches Py_ssize_t; "i" would store only an int and leave the
+       remaining bytes of `size` uninitialised on 64-bit platforms. */
+    if (!PyArg_ParseTuple(args, "n", &size))
+        return NULL;
+    if (size < 0) {
+        PyErr_SetString(PyExc_ValueError,
+                        "read size must not be negative");
+        return NULL;
+    }
+
+    bytes = PyBytes_FromStringAndSize(NULL, size);
+    if (bytes == NULL)
+        return NULL;
+    ptr = PyBytes_AsString(bytes);
+
+    Py_BEGIN_ALLOW_THREADS
+    errno = 0;
+    n = read(self->fd, ptr, size);
+    Py_END_ALLOW_THREADS
+
+    if (n < 0) {
+        /* Release the buffer on every failure path; keep errno intact
+           across the deallocation so the right error is reported. */
+        int err = errno;
+        Py_DECREF(bytes);
+        errno = err;
+        if (err == EAGAIN)
+            Py_RETURN_NONE;
+        PyErr_SetFromErrno(PyExc_IOError);
+        return NULL;
+    }
+
+    if (n != size) {
+        if (PyBytes_Resize(bytes, n) < 0) {
+            Py_DECREF(bytes);
+            return NULL;
+        }
+    }
+
+    return (PyObject *) bytes;
+}
+
+/* write(b): perform a single write() of the given data.
+ *
+ * Returns the number of bytes written as an int, None if write() failed
+ * with EAGAIN, or NULL with IOError set for any other failure.  Raises
+ * ValueError if the file is closed. */
+static PyObject *
+fileio_write(PyFileIOObject *self, PyObject *args)
+{
+    char *data;
+    Py_ssize_t count;
+
+    if (self->fd < 0)
+        return err_closed();
+    if (!PyArg_ParseTuple(args, "s#", &data, &count))
+        return NULL;
+
+    Py_BEGIN_ALLOW_THREADS
+    errno = 0;
+    count = write(self->fd, data, count);
+    Py_END_ALLOW_THREADS
+
+    if (count >= 0)
+        return PyInt_FromLong(count);
+
+    if (errno == EAGAIN)
+        Py_RETURN_NONE;
+
+    PyErr_SetFromErrno(PyExc_IOError);
+    return NULL;
+}
+
+/* seek(offset[, whence]): reposition the descriptor with lseek().
+ *
+ * whence defaults to 0.  Returns None on success, or NULL with an
+ * exception set: ValueError if the file is closed, IOError if lseek()
+ * fails. */
+static PyObject *
+fileio_seek(PyFileIOObject *self, PyObject *args)
+{
+    Py_ssize_t offset;
+    int whence = 0;
+    off_t pos;
+
+    if (self->fd < 0)
+        return err_closed();
+
+    /* The format units must match the C types exactly: "n" stores a
+       Py_ssize_t and "i" stores an int.  Parsing "i" into a Py_ssize_t
+       leaves part of the variable uninitialised on 64-bit platforms. */
+    if (!PyArg_ParseTuple(args, "n|i", &offset, &whence))
+        return NULL;
+
+    Py_BEGIN_ALLOW_THREADS
+    errno = 0;
+    pos = lseek(self->fd, offset, whence);
+    Py_END_ALLOW_THREADS
+
+    if (pos < 0) {
+        PyErr_SetFromErrno(PyExc_IOError);
+        return NULL;
+    }
+
+    Py_RETURN_NONE;
+}
+
+static PyObject *
+fileio_tell(PyFileIOObject *self, PyObject *args)
+{
+ Py_ssize_t offset;
+
+ if (self->fd < 0)
+ return err_closed();
+
+ Py_BEGIN_ALLOW_THREADS
+ errno = 0;
+ offset = lseek(self->fd, 0, SEEK_CUR);
+ Py_END_ALLOW_THREADS
+
+ if (offset < 0) {
+ PyErr_SetFromErrno(PyExc_IOError);
+ return NULL;
+ }
+
+ return PyInt_FromLong(offset);
+}
+
+#ifdef HAVE_FTRUNCATE
+/* truncate([size]): resize the file to size bytes; size defaults to the
+ * current file position.  The file position is the same after the call as
+ * it was before.
+ *
+ * Returns None on success, or NULL with an exception set: ValueError if
+ * the file is closed, IOError if any of the underlying calls fails. */
+static PyObject *
+fileio_truncate(PyFileIOObject *self, PyObject *args)
+{
+    Py_ssize_t length;
+    off_t initialpos;
+    off_t pos;
+    int ret;
+
+    if (self->fd < 0)
+        return err_closed();
+
+    /* Remember the current position: it is both the default length and
+       the position to restore afterwards. */
+    Py_BEGIN_ALLOW_THREADS
+    errno = 0;
+    initialpos = lseek(self->fd, 0, SEEK_CUR);
+    Py_END_ALLOW_THREADS
+
+    if (initialpos < 0)
+        goto onioerror;
+    length = (Py_ssize_t) initialpos;
+
+    /* "n" matches Py_ssize_t; "i" would only overwrite part of it. */
+    if (!PyArg_ParseTuple(args, "|n", &length))
+        return NULL;
+
+#ifdef MS_WINDOWS
+    /* MS _chsize doesn't work if newsize doesn't fit in 32 bits,
+       so don't even try using it. */
+    {
+        HANDLE hFile;
+
+        /* Have to move current pos to desired endpoint on Windows. */
+        Py_BEGIN_ALLOW_THREADS
+        errno = 0;
+        pos = lseek(self->fd, length, SEEK_SET);
+        Py_END_ALLOW_THREADS
+        if (pos < 0)
+            goto onioerror;
+
+        /* Truncate.  Note that this may grow the file! */
+        Py_BEGIN_ALLOW_THREADS
+        errno = 0;
+        hFile = (HANDLE)_get_osfhandle(self->fd);
+        ret = hFile == (HANDLE)-1;
+        if (ret == 0) {
+            ret = SetEndOfFile(hFile) == 0;
+            if (ret)
+                errno = EACCES;
+        }
+        Py_END_ALLOW_THREADS
+        if (ret)
+            goto onioerror;
+    }
+#else
+    Py_BEGIN_ALLOW_THREADS
+    errno = 0;
+    ret = ftruncate(self->fd, length);
+    Py_END_ALLOW_THREADS
+    if (ret < 0)
+        goto onioerror;
+#endif /* !MS_WINDOWS */
+
+    /* Return to initial position.  The result stays in off_t so that a
+       large valid offset is not mistaken for an error. */
+    Py_BEGIN_ALLOW_THREADS
+    errno = 0;
+    pos = lseek(self->fd, initialpos, SEEK_SET);
+    Py_END_ALLOW_THREADS
+    if (pos < 0)
+        goto onioerror;
+
+    Py_RETURN_NONE;
+
+ onioerror:
+    PyErr_SetFromErrno(PyExc_IOError);
+    return NULL;
+}
+#endif
+
+/* tp_repr slot: "<open file at ADDR>" or "<closed file at ADDR>",
+ * depending on whether a descriptor is currently held. */
+static PyObject *
+fileio_repr(PyFileIOObject *self)
+{
+    const char *state;
+
+    if (self->fd < 0)
+        state = "closed";
+    else
+        state = "open";
+
+    return PyString_FromFormat("<%s file at %p>", state, self);
+}
+
+/* isatty(): bool result of isatty() on the descriptor; raises ValueError
+ * if the file is closed. */
+static PyObject *
+fileio_isatty(PyFileIOObject *self)
+{
+    long is_tty;
+
+    if (self->fd < 0)
+        return err_closed();
+
+    Py_BEGIN_ALLOW_THREADS
+    is_tty = isatty(self->fd);
+    Py_END_ALLOW_THREADS
+
+    return PyBool_FromLong(is_tty);
+}
+
+/* __enter__(): return a new reference to self; raises ValueError if the
+ * file is closed. */
+static PyObject *
+fileio_self(PyFileIOObject *self)
+{
+    PyObject *result;
+
+    if (self->fd < 0)
+        return err_closed();
+
+    result = (PyObject *)self;
+    Py_INCREF(result);
+    return result;
+}
+
+/* Docstrings for the FileIO type and its methods. */
+
+PyDoc_STRVAR(fileio_doc,
+"file(name: str[, mode: str]) -> file IO object\n"
+"\n"
+"Open a file. The mode can be 'r', 'w' or 'a' for reading (default),\n"
+"writing or appending. The file will be created if it doesn't exist\n"
+"when opened for writing or appending; it will be truncated when\n"
+"opened for writing. Add a '+' to the mode to allow simultaneous\n"
+"reading and writing.");
+
+PyDoc_STRVAR(read_doc,
+"read(size: int) -> bytes. read at most size bytes, returned as bytes.\n"
+"\n"
+"Only makes one system call, so less data may be returned than requested.\n"
+"In non-blocking mode, returns None if no data is available. On\n"
+"end-of-file, returns an empty bytes object.");
+
+PyDoc_STRVAR(write_doc,
+"write(b: bytes) -> int. Write bytes b to file, return number written.\n"
+"\n"
+"Only makes one system call, so not all of the data may be written.\n"
+"The number of bytes actually written is returned.");
+
+PyDoc_STRVAR(fileno_doc,
+"fileno() -> int. \"file descriptor\".\n"
+"\n"
+"This is needed for lower-level file interfaces, such as the fcntl module.");
+
+PyDoc_STRVAR(seek_doc,
+"seek(offset: int[, whence: int]) -> None. Move to new file position.\n"
+"\n"
+"Argument offset is a byte count. Optional argument whence defaults to\n"
+"0 (offset from start of file, offset should be >= 0); other values are 1\n"
+"(move relative to current position, positive or negative), and 2 (move\n"
+"relative to end of file, usually negative, although many platforms allow\n"
+"seeking beyond the end of a file)."
+"\n"
+"Note that not all file objects are seekable.");
+
+PyDoc_STRVAR(truncate_doc,
+"truncate([size: int]) -> None. Truncate the file to at most size bytes.\n"
+"\n"
+"Size defaults to the current file position, as returned by tell().");
+
+PyDoc_STRVAR(tell_doc,
+"tell() -> int. Current file position");
+
+PyDoc_STRVAR(readinto_doc,
+"readinto() -> Undocumented. Don't use this; it may go away.");
+
+PyDoc_STRVAR(close_doc,
+"close() -> None. Close the file.\n"
+"\n"
+"A closed file cannot be used for further I/O operations. close() may be\n"
+"called more than once without error. Changes the fileno to -1.");
+
+PyDoc_STRVAR(isatty_doc,
+"isatty() -> bool. True if the file is connected to a tty device.");
+
+PyDoc_STRVAR(enter_doc,
+"__enter__() -> self.");
+
+PyDoc_STRVAR(exit_doc,
+"__exit__(*excinfo) -> None. Closes the file.");
+
+PyDoc_STRVAR(seekable_doc,
+"seekable() -> bool. True if file supports random-access.");
+
+PyDoc_STRVAR(readable_doc,
+"readable() -> bool. True if file was opened in a read mode.");
+
+PyDoc_STRVAR(writable_doc,
+"writable() -> bool. True if file was opened in a write mode.");
+
+static PyMethodDef fileio_methods[] = {
+ {"read", (PyCFunction)fileio_read, METH_VARARGS, read_doc},
+ {"readinto", (PyCFunction)fileio_readinto, METH_VARARGS, readinto_doc},
+ {"write", (PyCFunction)fileio_write, METH_VARARGS, write_doc},
+ {"seek", (PyCFunction)fileio_seek, METH_VARARGS, seek_doc},
+ {"tell", (PyCFunction)fileio_tell, METH_VARARGS, tell_doc},
+ {"truncate", (PyCFunction)fileio_truncate, METH_VARARGS, truncate_doc},
+ {"close", (PyCFunction)fileio_close, METH_NOARGS, close_doc},
+ {"seekable", (PyCFunction)fileio_seekable, METH_NOARGS, seekable_doc},
+ {"readable", (PyCFunction)fileio_readable, METH_NOARGS, readable_doc},
+ {"writable", (PyCFunction)fileio_writable, METH_NOARGS, writable_doc},
+ {"fileno", (PyCFunction)fileio_fileno, METH_NOARGS, fileno_doc},
+ {"isatty", (PyCFunction)fileio_isatty, METH_NOARGS, isatty_doc},
+ {"__enter__",(PyCFunction)fileio_self, METH_NOARGS, enter_doc},
+ {"__exit__", (PyCFunction)fileio_close, METH_VARARGS, exit_doc},
+ {NULL, NULL} /* sentinel */
+};
+
+/* Type object for FileIO.  The type pointer in the header is left NULL and
+ * is filled in by PyType_Ready() in init_fileio: the address of
+ * PyType_Type is not a constant initializer on every platform. */
+PyTypeObject PyFileIO_Type = {
+    PyObject_HEAD_INIT(NULL)
+    0,                                  /* ob_size */
+    "FileIO",                           /* tp_name */
+    sizeof(PyFileIOObject),             /* tp_basicsize */
+    0,                                  /* tp_itemsize */
+    (destructor)fileio_dealloc,         /* tp_dealloc */
+    0,                                  /* tp_print */
+    0,                                  /* tp_getattr */
+    0,                                  /* tp_setattr */
+    0,                                  /* tp_compare */
+    (reprfunc)fileio_repr,              /* tp_repr */
+    0,                                  /* tp_as_number */
+    0,                                  /* tp_as_sequence */
+    0,                                  /* tp_as_mapping */
+    0,                                  /* tp_hash */
+    0,                                  /* tp_call */
+    0,                                  /* tp_str */
+    PyObject_GenericGetAttr,            /* tp_getattro */
+    0,                                  /* tp_setattro */
+    0,                                  /* tp_as_buffer */
+    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE, /* tp_flags */
+    fileio_doc,                         /* tp_doc */
+    0,                                  /* tp_traverse */
+    0,                                  /* tp_clear */
+    0,                                  /* tp_richcompare */
+    offsetof(PyFileIOObject, weakreflist), /* tp_weaklistoffset */
+    0,                                  /* tp_iter */
+    0,                                  /* tp_iternext */
+    fileio_methods,                     /* tp_methods */
+    0,                                  /* tp_members */
+    0,                                  /* tp_getset */
+    0,                                  /* tp_base */
+    0,                                  /* tp_dict */
+    0,                                  /* tp_descr_get */
+    0,                                  /* tp_descr_set */
+    0,                                  /* tp_dictoffset */
+    fileio_init,                        /* tp_init */
+    PyType_GenericAlloc,                /* tp_alloc */
+    fileio_new,                         /* tp_new */
+    PyObject_Del,                       /* tp_free */
+};
+
+/* The module defines no functions of its own; the table holds only the
+ * terminating sentinel. */
+static PyMethodDef module_methods[] = {
+    {NULL, NULL}    /* sentinel */
+};
+
+/* Module initialisation: create the "_fileio" module, finalise the FileIO
+ * type and publish it in the module as "_FileIO".  Returns early, leaving
+ * whatever exception was raised, if any step fails. */
+PyMODINIT_FUNC
+init_fileio(void)
+{
+    PyObject *m; /* a module object */
+
+    m = Py_InitModule3("_fileio", module_methods,
+                       "Fast implementation of io.FileIO.");
+    if (m == NULL)
+        return;
+    if (PyType_Ready(&PyFileIO_Type) < 0)
+        return;
+
+    /* PyModule_AddObject steals the reference only on success; give it
+       back if the insertion fails so the count stays balanced. */
+    Py_INCREF(&PyFileIO_Type);
+    if (PyModule_AddObject(m, "_FileIO", (PyObject *) &PyFileIO_Type) < 0)
+        Py_DECREF(&PyFileIO_Type);
+}