summaryrefslogtreecommitdiffstats
path: root/Lib/wave.py
diff options
context:
space:
mode:
Diffstat (limited to 'Lib/wave.py')
-rw-r--r--Lib/wave.py559
1 files changed, 559 insertions, 0 deletions
diff --git a/Lib/wave.py b/Lib/wave.py
new file mode 100644
index 0000000..5d1a1c1
--- /dev/null
+++ b/Lib/wave.py
@@ -0,0 +1,559 @@
+# Stuff to parse WAVE files.
+#
+# Usage.
+#
+# Reading WAVE files:
+# f = wave.open(file, 'r')
+# where file is either the name of a file or an open file pointer.
+# The open file pointer must have methods read(), seek(), and close().
+# When the setpos() and rewind() methods are not used, the seek()
+# method is not necessary.
+#
+# This returns an instance of a class with the following public methods:
+# getnchannels() -- returns number of audio channels (1 for
+# mono, 2 for stereo)
+# getsampwidth() -- returns sample width in bytes
+# getframerate() -- returns sampling frequency
+# getnframes() -- returns number of audio frames
+# getcomptype() -- returns compression type ('NONE' for AIFF files)
+# getcompname() -- returns human-readable version of
+# compression type ('not compressed' for AIFF files)
+# getparams() -- returns a tuple consisting of all of the
+# above in the above order
+# getmarkers() -- returns None (for compatibility with the
+# aifc module)
+# getmark(id) -- raises an error since the mark does not
+# exist (for compatibility with the aifc module)
+# readframes(n) -- returns at most n frames of audio
+# rewind() -- rewind to the beginning of the audio stream
+# setpos(pos) -- seek to the specified position
+# tell() -- return the current position
+# close() -- close the instance (make it unusable)
+# The position returned by tell() and the position given to setpos()
+# are compatible and have nothing to do with the actual postion in the
+# file.
+# The close() method is called automatically when the class instance
+# is destroyed.
+#
+# Writing WAVE files:
+# f = wave.open(file, 'w')
+# where file is either the name of a file or an open file pointer.
+# The open file pointer must have methods write(), tell(), seek(), and
+# close().
+#
+# This returns an instance of a class with the following public methods:
+# setnchannels(n) -- set the number of channels
+# setsampwidth(n) -- set the sample width
+# setframerate(n) -- set the frame rate
+# setnframes(n) -- set the number of frames
+# setcomptype(type, name)
+# -- set the compression type and the
+# human-readable compression type
+# setparams(nchannels, sampwidth, framerate, nframes, comptype, compname)
+# -- set all parameters at once
+# tell() -- return current position in output file
+# writeframesraw(data)
+# -- write audio frames without pathing up the
+# file header
+# writeframes(data)
+# -- write audio frames and patch up the file header
+# close() -- patch up the file header and close the
+# output file
+# You should set the parameters before the first writeframesraw or
+# writeframes. The total number of frames does not need to be set,
+# but when it is set to the correct value, the header does not have to
+# be patched up.
+# It is best to first set all parameters, perhaps possibly the
+# compression type, and then write audio frames using writeframesraw.
+# When all frames have been written, either call writeframes('') or
+# close() to patch up the sizes in the header.
+# The close() method is called automatically when the class instance
+# is destroyed.
+
+import __builtin__
+
+Error = 'wave.Error'
+
+WAVE_FORMAT_PCM = 0x0001
+
+_array_fmts = None, 'b', 'h', None, 'l'
+
+def _read_long(file):
+ x = 0L
+ for i in range(4):
+ byte = file.read(1)
+ if byte == '':
+ raise EOFError
+ x = x + (ord(byte) << (8 * i))
+ if x >= 0x80000000L:
+ x = x - 0x100000000L
+ return int(x)
+
+def _read_ulong(file):
+ x = 0L
+ for i in range(4):
+ byte = file.read(1)
+ if byte == '':
+ raise EOFError
+ x = x + (ord(byte) << (8 * i))
+ return x
+
+def _read_short(file):
+ x = 0
+ for i in range(2):
+ byte = file.read(1)
+ if byte == '':
+ raise EOFError
+ x = x + (ord(byte) << (8 * i))
+ if x >= 0x8000:
+ x = x - 0x10000
+ return x
+
+def _write_short(f, x):
+ d, m = divmod(x, 256)
+ f.write(chr(m))
+ f.write(chr(d))
+
+def _write_long(f, x):
+ if x < 0:
+ x = x + 0x100000000L
+ for i in range(4):
+ d, m = divmod(x, 256)
+ f.write(chr(int(m)))
+ x = d
+
+class Chunk:
+ def __init__(self, file):
+ self.file = file
+ self.chunkname = self.file.read(4)
+ if len(self.chunkname) < 4:
+ raise EOFError
+ self.chunksize = _read_long(self.file)
+ self.size_read = 0
+ self.offset = self.file.tell()
+
+ def rewind(self):
+ self.file.seek(self.offset, 0)
+ self.size_read = 0
+
+ def setpos(self, pos):
+ if pos < 0 or pos > self.chunksize:
+ raise RuntimeError
+ self.file.seek(self.offset + pos, 0)
+ self.size_read = pos
+
+ def read(self, length):
+ if self.size_read >= self.chunksize:
+ return ''
+ if length > self.chunksize - self.size_read:
+ length = self.chunksize - self.size_read
+ data = self.file.read(length)
+ self.size_read = self.size_read + len(data)
+ return data
+
+ def skip(self):
+ try:
+ self.file.seek(self.chunksize - self.size_read, 1)
+ except RuntimeError:
+ while self.size_read < self.chunksize:
+ dummy = self.read(8192)
+ if not dummy:
+ raise EOFError
+
+class Wave_read:
+ # Variables used in this class:
+ #
+ # These variables are available to the user though appropriate
+ # methods of this class:
+ # _file -- the open file with methods read(), close(), and seek()
+ # set through the __init__() method
+ # _nchannels -- the number of audio channels
+ # available through the getnchannels() method
+ # _nframes -- the number of audio frames
+ # available through the getnframes() method
+ # _sampwidth -- the number of bytes per audio sample
+ # available through the getsampwidth() method
+ # _framerate -- the sampling frequency
+ # available through the getframerate() method
+ # _comptype -- the AIFF-C compression type ('NONE' if AIFF)
+ # available through the getcomptype() method
+ # _compname -- the human-readable AIFF-C compression type
+ # available through the getcomptype() method
+ # _soundpos -- the position in the audio stream
+ # available through the tell() method, set through the
+ # setpos() method
+ #
+ # These variables are used internally only:
+ # _fmt_chunk_read -- 1 iff the FMT chunk has been read
+ # _data_seek_needed -- 1 iff positioned correctly in audio
+ # file for readframes()
+ # _data_chunk -- instantiation of a chunk class for the DATA chunk
+ # _framesize -- size of one frame in the file
+
+ access _file, _nchannels, _nframes, _sampwidth, _framerate, \
+ _comptype, _compname, _soundpos, \
+ _fmt_chunk_read, _data_seek_needed, \
+ _data_chunk, _framesize: private
+
+ def initfp(self, file):
+ self._file = file
+ self._convert = None
+ self._soundpos = 0
+ form = self._file.read(4)
+ if form != 'RIFF':
+ raise Error, 'file does not start with RIFF id'
+ formlength = _read_long(self._file)
+ if formlength <= 0:
+ raise Error, 'invalid FORM chunk data size'
+ formdata = self._file.read(4)
+ formlength = formlength - 4
+ if formdata != 'WAVE':
+ raise Error, 'not a WAVE file'
+ self._fmt_chunk_read = 0
+ while formlength > 0:
+ self._data_seek_needed = 1
+ chunk = Chunk(self._file)
+ if chunk.chunkname == 'fmt ':
+ self._read_fmt_chunk(chunk)
+ self._fmt_chunk_read = 1
+ elif chunk.chunkname == 'data':
+ if not self._fmt_chunk_read:
+ raise Error, 'data chunk before fmt chunk'
+ self._data_chunk = chunk
+ self._nframes = chunk.chunksize / self._framesize
+ self._data_seek_needed = 0
+ formlength = formlength - 8 - chunk.chunksize
+ if formlength > 0:
+ chunk.skip()
+ if not self._fmt_chunk_read or not self._data_chunk:
+ raise Error, 'fmt chunk and/or data chunk missing'
+
+ def __init__(self, f):
+ if type(f) == type(''):
+ f = __builtin__.open(f, 'r')
+ # else, assume it is an open file object already
+ self.initfp(f)
+
+ def __del__(self):
+ if self._file:
+ self.close()
+
+ #
+ # User visible methods.
+ #
+ def getfp(self):
+ return self._file
+
+ def rewind(self):
+ self._data_seek_needed = 1
+ self._soundpos = 0
+
+ def close(self):
+ self._file = None
+
+ def tell(self):
+ return self._soundpos
+
+ def getnchannels(self):
+ return self._nchannels
+
+ def getnframes(self):
+ return self._nframes
+
+ def getsampwidth(self):
+ return self._sampwidth
+
+ def getframerate(self):
+ return self._framerate
+
+ def getcomptype(self):
+ return self._comptype
+
+ def getcompname(self):
+ return self._compname
+
+ def getparams(self):
+ return self.getnchannels(), self.getsampwidth(), \
+ self.getframerate(), self.getnframes(), \
+ self.getcomptype(), self.getcompname()
+
+ def getmarkers(self):
+ return None
+
+ def getmark(self, id):
+ raise Error, 'no marks'
+
+ def setpos(self, pos):
+ if pos < 0 or pos > self._nframes:
+ raise Error, 'position not in range'
+ self._soundpos = pos
+ self._data_seek_needed = 1
+
+ def readframes(self, nframes):
+ if self._data_seek_needed:
+ self._data_chunk.rewind()
+ pos = self._soundpos * self._framesize
+ if pos:
+ self._data_chunk.setpos(pos)
+ self._data_seek_needed = 0
+ if nframes == 0:
+ return ''
+ if self._sampwidth > 1:
+ # unfortunately the fromfile() method does not take
+ # something that only looks like a file object, so
+ # we have to reach into the innards of the chunk object
+ import array
+ data = array.array(_array_fmts[self._sampwidth])
+ nitems = nframes * self._nchannels
+ if nitems * self._sampwidth > self._data_chunk.chunksize - self._data_chunk.size_read:
+ nitems = (self._data_chunk.chunksize - self._data_chunk.size_read) / self._sampwidth
+ data.fromfile(self._data_chunk.file, nitems)
+ self._data_chunk.size_read = self._data_chunk.size_read + nitems * self._sampwidth
+ data.byteswap()
+ data = data.tostring()
+ else:
+ data = self._data_chunk.read(nframes * self._framesize)
+ if self._convert and data:
+ data = self._convert(data)
+ self._soundpos = self._soundpos + len(data) / (self._nchannels * self._sampwidth)
+ return data
+
+ #
+ # Internal methods.
+ #
+ access *: private
+
+ def _read_fmt_chunk(self, chunk):
+ wFormatTag = _read_short(chunk)
+ self._nchannels = _read_short(chunk)
+ self._framerate = _read_long(chunk)
+ dwAvgBytesPerSec = _read_long(chunk)
+ wBlockAlign = _read_short(chunk)
+ if wFormatTag == WAVE_FORMAT_PCM:
+ self._sampwidth = (_read_short(chunk) + 7) / 8
+ else:
+ raise Error, 'unknown format'
+ self._framesize = self._nchannels * self._sampwidth
+ self._comptype = 'NONE'
+ self._compname = 'not compressed'
+
+class Wave_write:
+ # Variables used in this class:
+ #
+ # These variables are user settable through appropriate methods
+ # of this class:
+ # _file -- the open file with methods write(), close(), tell(), seek()
+ # set through the __init__() method
+ # _comptype -- the AIFF-C compression type ('NONE' in AIFF)
+ # set through the setcomptype() or setparams() method
+ # _compname -- the human-readable AIFF-C compression type
+ # set through the setcomptype() or setparams() method
+ # _nchannels -- the number of audio channels
+ # set through the setnchannels() or setparams() method
+ # _sampwidth -- the number of bytes per audio sample
+ # set through the setsampwidth() or setparams() method
+ # _framerate -- the sampling frequency
+ # set through the setframerate() or setparams() method
+ # _nframes -- the number of audio frames written to the header
+ # set through the setnframes() or setparams() method
+ #
+ # These variables are used internally only:
+ # _datalength -- the size of the audio samples written to the header
+ # _nframeswritten -- the number of frames actually written
+ # _datawritten -- the size of the audio samples actually written
+
+ access _file, _comptype, _compname, _nchannels, _sampwidth, \
+ _framerate, _nframes, _nframeswritten, \
+ _datalength, _datawritten: private
+
+ def __init__(self, f):
+ if type(f) == type(''):
+ f = __builtin__.open(f, 'w')
+ self.initfp(f)
+
+ def initfp(self, file):
+ self._file = file
+ self._convert = None
+ self._nchannels = 0
+ self._sampwidth = 0
+ self._framerate = 0
+ self._nframes = 0
+ self._nframeswritten = 0
+ self._datawritten = 0
+ self._datalength = 0
+
+ def __del__(self):
+ if self._file:
+ self.close()
+
+ #
+ # User visible methods.
+ #
+ def setnchannels(self, nchannels):
+ if self._datawritten:
+ raise Error, 'cannot change parameters after starting to write'
+ if nchannels < 1:
+ raise Error, 'bad # of channels'
+ self._nchannels = nchannels
+
+ def getnchannels(self):
+ if not self._nchannels:
+ raise Error, 'number of channels not set'
+ return self._nchannels
+
+ def setsampwidth(self, sampwidth):
+ if self._datawritten:
+ raise Error, 'cannot change parameters after starting to write'
+ if sampwidth < 1 or sampwidth > 4:
+ raise Error, 'bad sample width'
+ self._sampwidth = sampwidth
+
+ def getsampwidth(self):
+ if not self._sampwidth:
+ raise Error, 'sample width not set'
+ return self._sampwidth
+
+ def setframerate(self, framerate):
+ if self._datawritten:
+ raise Error, 'cannot change parameters after starting to write'
+ if framerate <= 0:
+ raise Error, 'bad frame rate'
+ self._framerate = framerate
+
+ def getframerate(self):
+ if not self._framerate:
+ raise Error, 'frame rate not set'
+ return self._framerate
+
+ def setnframes(self, nframes):
+ if self._datawritten:
+ raise Error, 'cannot change parameters after starting to write'
+ self._nframes = nframes
+
+ def getnframes(self):
+ return self._nframeswritten
+
+ def setcomptype(self, comptype, compname):
+ if self._datawritten:
+ raise Error, 'cannot change parameters after starting to write'
+ if comptype not in ('NONE',):
+ raise Error, 'unsupported compression type'
+ self._comptype = comptype
+ self._compname = compname
+
+ def getcomptype(self):
+ return self._comptype
+
+ def getcompname(self):
+ return self._compname
+
+ def setparams(self, (nchannels, sampwidth, framerate, nframes, comptype, compname)):
+ if self._datawritten:
+ raise Error, 'cannot change parameters after starting to write'
+ self.setnchannels(nchannels)
+ self.setsampwidth(sampwidth)
+ self.setframerate(framerate)
+ self.setnframes(nframes)
+ self.setcomptype(comptype, compname)
+
+ def getparams(self):
+ if not self._nchannels or not self._sampwidth or not self._framerate:
+ raise Error, 'not all parameters set'
+ return self._nchannels, self._sampwidth, self._framerate, \
+ self._nframes, self._comptype, self._compname
+
+ def setmark(self, id, pos, name):
+ raise Error, 'setmark() not supported'
+
+ def getmark(self, id):
+ raise Error, 'no marks'
+
+ def getmarkers(self):
+ return None
+
+ def tell(self):
+ return self._nframeswritten
+
+ def writeframesraw(self, data):
+ self._ensure_header_written(len(data))
+ nframes = len(data) / (self._sampwidth * self._nchannels)
+ if self._convert:
+ data = self._convert(data)
+ if self._sampwidth > 1:
+ import array
+ data = array.array(_array_fmts[self._sampwidth], data)
+ data.byteswap()
+ data.tofile(self._file)
+ self._datawritten = self._datawritten + len(data) * self._sampwidth
+ else:
+ self._file.write(data)
+ self._datawritten = self._datawritten + len(data)
+ self._nframeswritten = self._nframeswritten + nframes
+
+ def writeframes(self, data):
+ self.writeframesraw(data)
+ if self._datalength != self._datawritten:
+ self._patchheader()
+
+ def close(self):
+ self._ensure_header_written(0)
+ if self._datalength != self._datawritten:
+ self._patchheader()
+ self._file.flush()
+ self._file = None
+
+ #
+ # Internal methods.
+ #
+ access *: private
+
+ def _ensure_header_written(self, datasize):
+ if not self._datawritten:
+ if not self._nchannels:
+ raise Error, '# channels not specified'
+ if not self._sampwidth:
+ raise Error, 'sample width not specified'
+ if not self._framerate:
+ raise Error, 'sampling rate not specified'
+ self._write_header(datasize)
+
+ def _write_header(self, initlength):
+ self._file.write('RIFF')
+ if not self._nframes:
+ self._nframes = initlength / (self._nchannels * self._sampwidth)
+ self._datalength = self._nframes * self._nchannels * self._sampwidth
+ self._form_length_pos = self._file.tell()
+ _write_long(self._file, 36 + self._datalength)
+ self._file.write('WAVE')
+ self._file.write('fmt ')
+ _write_long(self._file, 16)
+ _write_short(self._file, WAVE_FORMAT_PCM)
+ _write_short(self._file, self._nchannels)
+ _write_long(self._file, self._framerate)
+ _write_long(self._file, self._nchannels * self._framerate * self._sampwidth)
+ _write_short(self._file, self._nchannels * self._sampwidth)
+ _write_short(self._file, self._sampwidth * 8)
+ self._file.write('data')
+ self._data_length_pos = self._file.tell()
+ _write_long(self._file, self._datalength)
+
+ def _patchheader(self):
+ if self._datawritten == self._datalength:
+ return
+ curpos = self._file.tell()
+ self._file.seek(self._form_length_pos, 0)
+ _write_long(36 + self._datawritten)
+ self._file.seek(self._data_length_pos, 0)
+ _write_long(self._file, self._datawritten)
+ self._file.seek(curpos, 0)
+ self._datalength = self._datawritten
+
+def open(f, mode):
+ if mode == 'r':
+ return Wave_read(f)
+ elif mode == 'w':
+ return Wave_write(f)
+ else:
+ raise Error, "mode must be 'r' or 'w'"
+
+openfp = open # B/W compatibility