Skip to content

Instantly share code, notes, and snippets.

@kepler62f
Created May 21, 2020 14:29
Show Gist options
  • Save kepler62f/9d5836a1eff8b372ddf6de43b5b74d95 to your computer and use it in GitHub Desktop.
Save kepler62f/9d5836a1eff8b372ddf6de43b5b74d95 to your computer and use it in GitHub Desktop.
Record audio stream from a microphone to wav files (with overlaps) using pyaudio
from datetime import datetime
import pyaudio
import wave
class MicRecorder():
'''
A recorder class for recording audio stream from a microphone to WAV files.
Uses non-blocking callback threads to get audio stream but uses a list
to save chunks of stream to file
output_path: string, folder to output wave files
channels: integer, 1 mono, 2 stereo
rate: integer, microphone sampling rate (hertz)
frames_per_buffer: integer,
clip_duration: integer, how long each audio clip should be (seconds)
overlap: integer, overlap between consecutive clips (seconds, between 0 and clip_duration)
Example:
from micrecorder import MicRecorder
rec = MicRecorder('./audio-clips', overlap=2)
rec.start_recording()
'''
def __init__(self, output_path, channels=1, rate=16000, frames_per_buffer=1024, clip_duration=4, overlap=0):
self.output_path = output_path
self.channels = channels
self.rate = rate
self.frames_per_buffer = frames_per_buffer
self.clip_duration = clip_duration
self.overlap = overlap
self._pa = pyaudio.PyAudio()
self._stream = None
self.frames = []
def start_recording(self):
fps = int(self.rate / self.frames_per_buffer * self.clip_duration)
self._stream = self._pa.open(format=pyaudio.paInt16,
channels=self.channels,
rate=self.rate,
input=True,
frames_per_buffer=self.frames_per_buffer,
stream_callback=self.get_callback())
print('Begin recording...')
self._stream.start_stream()
try:
while True:
if len(self.frames) > fps:
clip = []
for i in range(0, fps):
clip.append(self.frames[i])
fname = ''.join([self.output_path, '/clip-', datetime.utcnow().strftime('%Y%m%d%H%M%S'), '.wav'])
wavefile = self._prepare_file(fname)
wavefile.writeframes(b''.join(clip))
wavefile.close()
self.frames = self.frames[(self.clip_duration - self.overlap - 1):]
except KeyboardInterrupt as e:
print('Terminating recording...', end='')
self.stop_recording()
print('OK')
def stop_recording(self):
self._stream.stop_stream()
def get_callback(self):
def callback(in_data, frame_count, time_info, status):
self.frames.append(in_data)
return in_data, pyaudio.paContinue
return callback
def _prepare_file(self, filename, mode='wb'):
wavefile = wave.open(filename, mode)
wavefile.setnchannels(self.channels)
wavefile.setsampwidth(self._pa.get_sample_size(pyaudio.paInt16))
wavefile.setframerate(self.rate)
return wavefile
@creeper6530
Copy link

Maybe consider setting default output path to current directory

@dgusoff
Copy link

dgusoff commented Dec 8, 2023

Add a break after line 56 to prevent an infinite loop.

@MrHubert1710
Copy link

In line 56,
While slicing list of frames, indexes refer to frames not to seconds.
Yet here slicing is done with clip duration and overlap which both are expressed in seconds.
Compensate it with " * fps" to get actual frame index.
Also " - 1" in calculation is implicitly adding one second overlap, which is not what I would expect from setting overlap to 0.

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment