Description
An audio manager.
Pulse-code modulation (PCM) is a method used to digitally represent
sampled analog signals. A PCM signal is a sequence of digital audio
samples containing the data providing the necessary information to
reconstruct the original analog signal. Each sample represents the
amplitude of the signal at a specific point in time, and the samples
are uniformly spaced in time.
The amplitude is the only information explicitly stored in the sample.
A PCM stream has two basic properties that determine the stream's
fidelity to the original analog signal: the sampling rate, which is the
number of times per second that samples are taken; and the bit depth,
which determines the number of possible digital values that can be used
to represent each sample.
For speech analysis, recommended sampling rate are 16000 (for automatic
analysis) or 48000 (for manual analysis); and recommended sample depths
are 16 per sample.
These variables are user gettable through appropriate methods:
- nchannels -- the number of audio channels
- framerate -- the sampling frequency
- sampwidth -- the number of bytes per audio sample (1, 2 or 4)
- nframes -- the number of frames
- params -- parameters of the wave file
- filename -- the name of the wave file
The audiofp member is assigned by the IO classes (WaveIO only).
It is expected that it can access the following methods:
- readframes()
- writeframes()
- getsampwidth()
- getframerate()
- getnframes()
- getnchannels()
- setpos()
- tell()
- rewind()
Public functions
set
Set from another AudioPCM() instance.
It can be set either with an audio file pointer, or a list of
channels or both.
Parameters
- other: (AudioPCM) the other AudioPCM to set
View Source
def set(self, other):
"""Set from another AudioPCM() instance.
It can be set either with an audio file pointer, or a list of
channels or both.
:param other: (AudioPCM) the other AudioPCM to set
"""
self._audio_fp = other.get_audiofp()
self._channels = other.get_channels()
get_channels
Return the list of uploaded channels.
Returns
View Source
def get_channels(self):
"""Return the list of uploaded channels.
:return: (list) channels
"""
return self._channels
get_audiofp
Return the audio file pointer.
Returns
View Source
def get_audiofp(self):
"""Return the audio file pointer.
:return: audio file pointer
"""
return self._audio_fp
remove_channel
Remove a channel from the list of uploaded channels.
Parameters
- channel: (Channel) the channel to remove
View Source
def remove_channel(self, channel):
"""Remove a channel from the list of uploaded channels.
:param channel: (Channel) the channel to remove
"""
self._channels.remove(channel)
pop_channel
Pop a channel at the position given from the list of uploaded channels.
Parameters
- idx: (int) the index of the channel to remove
View Source
def pop_channel(self, idx):
"""Pop a channel at the position given from the list of uploaded channels.
:param idx: (int) the index of the channel to remove
"""
idx = int(idx)
self._channels.pop(idx)
insert_channel
Insert a channel at the position given in the list of uploaded channels.
Parameters
- idx: (int) the index where the channel has to be inserted
- channel: (Channel) the channel to insert
View Source
def insert_channel(self, idx, channel):
"""Insert a channel at the position given in the list of uploaded channels.
:param idx: (int) the index where the channel has to be inserted
:param channel: (Channel) the channel to insert
"""
idx = int(idx)
self._channels.insert(idx, channel)
get_channel
Get an uploaded channel.
Parameters
- idx: (int) the index of the channel to return
Returns
View Source
def get_channel(self, idx):
"""Get an uploaded channel.
:param idx: (int) the index of the channel to return
:returns: (Channel)
"""
idx = int(idx)
return self._channels[idx]
append_channel
Append a channel to the list of uploaded channels.
Parameters
- channel: (Channel) the channel to append
Returns
View Source
def append_channel(self, channel):
"""Append a channel to the list of uploaded channels.
:param channel: (Channel) the channel to append
:return: index of the channel
"""
self._channels.append(channel)
return len(self._channels) - 1
extract_channel
Extract a channel from the Audio File Pointer.
Append the channel into the list of channels.
Frames are stored into a Channel() instance.
Index of the channel in the audio file:
0 = 1st channel (left); 1 = 2nd channel (right); 2 = 3rd channel...
Parameters
- index: (int) The index of the channel to extract
Returns
- the index of the Channel() in the list
View Source
def extract_channel(self, index=0):
"""Extract a channel from the Audio File Pointer.
Append the channel into the list of channels.
Frames are stored into a Channel() instance.
Index of the channel in the audio file:
0 = 1st channel (left); 1 = 2nd channel (right); 2 = 3rd channel...
:param index: (int) The index of the channel to extract
:return: the index of the Channel() in the list
"""
if self._audio_fp is None:
raise AudioError
index = int(index)
if index < 0:
raise ChannelIndexError(index)
nc = self.get_nchannels()
self.seek(0)
data = self.read_frames(self.get_nframes())
if nc == 0:
raise AudioDataError
if index + 1 > nc:
raise ChannelIndexError(index)
if nc == 1:
channel = Channel(self.get_framerate(), self.get_sampwidth(), data)
return self.append_channel(channel)
frames = b''
sw = self.get_sampwidth()
for i in range(index * sw, len(data), nc * sw):
frames += data[i:i + sw]
channel = Channel(self.get_framerate(), self.get_sampwidth(), frames)
return self.append_channel(channel)
extract_channels
Extract all channels from the Audio File Pointer.
Append the extracted channels to the list of channels.
View Source
def extract_channels(self):
"""Extract all channels from the Audio File Pointer.
Append the extracted channels to the list of channels.
"""
if self._audio_fp is None:
raise AudioError
nc = self.get_nchannels()
sw = self.get_sampwidth()
self.seek(0)
data = self.read_frames(self.get_nframes())
if nc == 0:
raise AudioDataError
for index in range(nc):
frames = b''
for i in range(index * sw, len(data), nc * sw):
frames = frames + data[i:i + sw]
channel = Channel(self.get_framerate(), self.get_sampwidth(), frames)
self.append_channel(channel)
read
Read all frames of the audio file.
Returns
View Source
def read(self):
"""Read all frames of the audio file.
:return: (str) frames
"""
return self.read_frames(self.get_nframes())
read_frames
Read n frames from the audio file.
Parameters
- nframes: (int) the number of frames to read
Returns
View Source
def read_frames(self, nframes):
"""Read n frames from the audio file.
:param nframes: (int) the number of frames to read
:return: (str) frames
"""
if self._audio_fp is None:
raise AudioError
return self._audio_fp.readframes(nframes)
read_samples
Read the samples from the audio file.
Parameters
- nframes: (int) the number of frames to read
Returns
- (list of list) list of samples of each channel
View Source
def read_samples(self, nframes):
"""Read the samples from the audio file.
:param nframes: (int) the number of frames to read
:return: (list of list) list of samples of each channel
"""
if self._audio_fp is None:
raise AudioError
nframes = int(nframes)
return AudioConverter().unpack_data(self.read_frames(nframes), self.get_sampwidth(), self.get_nchannels())
get_sampwidth
Return the sample width of the Audio File Pointer.
Returns
- (int) sample width of the audio file
View Source
def get_sampwidth(self):
"""Return the sample width of the Audio File Pointer.
:return: (int) sample width of the audio file
"""
if self._audio_fp is None:
if len(self._channels) > 0:
return self._channels[0].get_sampwidth()
else:
raise AudioDataError
return self._audio_fp.getsampwidth()
get_framerate
Return the frame rate of the Audio File Pointer.
Returns
- (int) frame rate of the audio file
View Source
def get_framerate(self):
"""Return the frame rate of the Audio File Pointer.
:return: (int) frame rate of the audio file
"""
if self._audio_fp is None:
if len(self._channels) > 0:
return self._channels[0].get_framerate()
else:
raise AudioDataError
return self._audio_fp.getframerate()
get_nframes
Return the number of frames of the Audio File Pointer.
Returns
- (int) number of frames of the audio file
View Source
def get_nframes(self):
"""Return the number of frames of the Audio File Pointer.
:return: (int) number of frames of the audio file
"""
if self._audio_fp is None:
if len(self._channels) > 0:
return self._channels[0].get_nframes()
else:
raise AudioDataError
return self._audio_fp.getnframes()
get_nchannels
Return the number of channels of the Audio File Pointer.
Returns
- (int) number of channels of the audio file
View Source
def get_nchannels(self):
"""Return the number of channels of the Audio File Pointer.
:return: (int) number of channels of the audio file
"""
if self._audio_fp is None:
if len(self._channels) > 0:
return len(self._channels)
else:
raise AudioDataError
return self._audio_fp.getnchannels()
get_duration
Return the duration of the Audio File Pointer.
Returns
- (float) duration of the audio file (in seconds)
View Source
def get_duration(self):
"""Return the duration of the Audio File Pointer.
:return: (float) duration of the audio file (in seconds)
"""
if self._audio_fp is None:
if len(self._channels) > 0:
return self._channels[0].get_duration()
else:
raise AudioDataError
return float(self.get_nframes()) / float(self.get_framerate())
rms
Return the root-mean-square of the whole file.
Returns
- (float) rms of the audio file
View Source
def rms(self):
"""Return the root-mean-square of the whole file.
:return: (float) rms of the audio file
"""
pos = self.tell()
self.seek(0)
a = AudioFrames(self.read_frames(self.get_nframes()), self.get_sampwidth(), self.get_nchannels())
self.seek(pos)
return a.rms()
clipping_rate
Return the clipping rate of the frames.
Parameters
- factor: (float) An interval to be more precise on clipping rate. It will consider that all frames outside the interval are clipped. Factor has to be between 0 and 1.
Returns
View Source
def clipping_rate(self, factor):
"""Return the clipping rate of the frames.
:param factor: (float) An interval to be more precise on clipping rate.
It will consider that all frames outside the interval are clipped.
Factor has to be between 0 and 1.
:return: (float)
"""
pos = self.tell()
self.seek(0)
a = AudioFrames(self.read_frames(self.get_nframes()), self.get_sampwidth())
self.seek(pos)
return a.clipping_rate(factor)
seek
Fix the reader pointer position.
Parameters
- pos: (int) the position to set.
View Source
def seek(self, pos):
"""Fix the reader pointer position.
:param pos: (int) the position to set.
"""
if self._audio_fp is None:
raise AudioError
try:
self._audio_fp.setpos(pos)
except:
raise Exception('pos {} not in range (0, {}).'.format(pos, self.get_nframes()))
tell
Get the reader pointer position.
Returns
- (int) the current position
View Source
def tell(self):
"""Get the reader pointer position.
:return: (int) the current position
"""
if self._audio_fp is None:
raise AudioError
return self._audio_fp.tell()
rewind
Set reader position at the beginning of the file.
View Source
def rewind(self):
"""Set reader position at the beginning of the file."""
if self._audio_fp is None:
raise AudioError
return self._audio_fp.rewind()
verify_channels
Check that the uploaded channels have the same parameters.
Check the frame rate, sample width and number of frames.
Returns
View Source
def verify_channels(self):
"""Check that the uploaded channels have the same parameters.
Check the frame rate, sample width and number of frames.
:return: (bool)
"""
mixer = ChannelMixer()
f = 1.0 / len(self._channels)
for c in self._channels:
mixer.append_channel(c, f)
try:
mixer.check_channels()
except MixChannelError:
return False
return True
open
Open an audio file.
Parameters
View Source
def open(self, filename):
"""Open an audio file."""
name = self.__class__.__name__
raise NotImplementedError('{:s} does not support open().'.format(name))
save
Save an audio file.
Parameters
View Source
def save(self, filename):
"""Save an audio file."""
name = self.__class__.__name__
raise NotImplementedError('{:s} does not support save().'.format(name))
save_fragments
Save a fragment of an audio file.
Parameters
View Source
def save_fragments(self, filename):
"""Save a fragment of an audio file."""
name = self.__class__.__name__
raise NotImplementedError('{:s} does not support save_fragments().'.format(name))
close
Close the audio file.
View Source
def close(self):
"""Close the audio file."""
if self._audio_fp is None:
raise AudioError
self._audio_fp.close()
self._audio_fp = None