Created
May 21, 2020 14:29
-
-
Save kepler62f/9d5836a1eff8b372ddf6de43b5b74d95 to your computer and use it in GitHub Desktop.
Record audio stream from a microphone to wav files (with overlaps) using pyaudio
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
from datetime import datetime | |
import pyaudio | |
import wave | |
class MicRecorder(): | |
''' | |
A recorder class for recording audio stream from a microphone to WAV files. | |
Uses non-blocking callback threads to get audio stream but uses a list | |
to save chunks of stream to file | |
output_path: string, folder to output wave files | |
channels: integer, 1 mono, 2 stereo | |
rate: integer, microphone sampling rate (hertz) | |
frames_per_buffer: integer, | |
clip_duration: integer, how long each audio clip should be (seconds) | |
overlap: integer, overlap between consecutive clips (seconds, between 0 and clip_duration) | |
Example: | |
from micrecorder import MicRecorder | |
rec = MicRecorder('./audio-clips', overlap=2) | |
rec.start_recording() | |
''' | |
def __init__(self, output_path, channels=1, rate=16000, frames_per_buffer=1024, clip_duration=4, overlap=0): | |
self.output_path = output_path | |
self.channels = channels | |
self.rate = rate | |
self.frames_per_buffer = frames_per_buffer | |
self.clip_duration = clip_duration | |
self.overlap = overlap | |
self._pa = pyaudio.PyAudio() | |
self._stream = None | |
self.frames = [] | |
def start_recording(self): | |
fps = int(self.rate / self.frames_per_buffer * self.clip_duration) | |
self._stream = self._pa.open(format=pyaudio.paInt16, | |
channels=self.channels, | |
rate=self.rate, | |
input=True, | |
frames_per_buffer=self.frames_per_buffer, | |
stream_callback=self.get_callback()) | |
print('Begin recording...') | |
self._stream.start_stream() | |
try: | |
while True: | |
if len(self.frames) > fps: | |
clip = [] | |
for i in range(0, fps): | |
clip.append(self.frames[i]) | |
fname = ''.join([self.output_path, '/clip-', datetime.utcnow().strftime('%Y%m%d%H%M%S'), '.wav']) | |
wavefile = self._prepare_file(fname) | |
wavefile.writeframes(b''.join(clip)) | |
wavefile.close() | |
self.frames = self.frames[(self.clip_duration - self.overlap - 1):] | |
except KeyboardInterrupt as e: | |
print('Terminating recording...', end='') | |
self.stop_recording() | |
print('OK') | |
def stop_recording(self): | |
self._stream.stop_stream() | |
def get_callback(self): | |
def callback(in_data, frame_count, time_info, status): | |
self.frames.append(in_data) | |
return in_data, pyaudio.paContinue | |
return callback | |
def _prepare_file(self, filename, mode='wb'): | |
wavefile = wave.open(filename, mode) | |
wavefile.setnchannels(self.channels) | |
wavefile.setsampwidth(self._pa.get_sample_size(pyaudio.paInt16)) | |
wavefile.setframerate(self.rate) | |
return wavefile |
Add a break
after line 56 to prevent an infinite loop.
In line 56,
While slicing list of frames, indexes refer to frames not to seconds.
Yet here slicing is done with clip duration and overlap which both are expressed in seconds.
Compensate it with " * fps" to get actual frame index.
Also " - 1" in calculation is implicitly adding one second overlap, which is not what I would expect from setting overlap to 0.
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Maybe consider setting default output path to current directory