Adam-D-Lewis · June 19, 2023 16:18
diff --git a/voice_type.py b/voice_type.py
 # POC Type with your voice script
 # You may also need to install the additional dependencies: portaudio flac

 from pathlib import Path
 import speech_recognition as sr
 import pyaudio
 from pynput.keyboard import Controller
 from threading import Thread
 import wave

 # Directory containing this script; the notification sound and the error log
 # are looked up relative to it.
 BASE_DIR = Path(__file__).resolve().parent

 def type_text(text):
    """Type ``text`` through a pynput keyboard controller, then press Enter.

    Every character is sent as its own press/release pair.

    Args:
        text: The string to type.
    """
    # Local import: Key lives in the same pynput module the file already
    # imports Controller from.
    from pynput.keyboard import Key

    keyboard = Controller()

    for char in text:
        keyboard.press(char)
        keyboard.release(char)

    # Submit with the dedicated Enter key instead of the raw '\n' character;
    # pynput maps '\n' to Enter only inside Controller.type(), not in
    # press()/release().
    keyboard.press(Key.enter)
    keyboard.release(Key.enter)


 def play_audio(filename):
    """Play a WAV file through a PyAudio output stream.

    Returns once every frame of the file has been written to the stream.
    The file, the stream and the PortAudio interface are released even if
    playback fails part-way through.

    Args:
        filename: Path of the WAV file to play.
    """
    chunk_frames = 1024  # frames read from the file per write to the stream

    # wave.open() supports the context-manager protocol, so the file is
    # closed on every exit path.
    with wave.open(filename, 'rb') as wav:
        pa = pyaudio.PyAudio()
        try:
            # Sample format, channel count and rate all come from the WAV
            # header so the stream matches the file.
            stream = pa.open(
                format=pa.get_format_from_width(wav.getsampwidth()),
                channels=wav.getnchannels(),
                rate=wav.getframerate(),
                output=True,
            )
            try:
                data = wav.readframes(chunk_frames)
                # readframes() returns b'' once the file is exhausted.
                while data:
                    stream.write(data)
                    data = wav.readframes(chunk_frames)
                stream.stop_stream()
            finally:
                stream.close()
        finally:
            pa.terminate()

 def make_sound_thread():
    """Build (without starting) a thread that plays the notification sound.

    Returns:
        An unstarted ``Thread`` whose target is ``play_audio`` called with the
        path of ``start-record.wav`` inside ``BASE_DIR``.
    """
    wav_path = BASE_DIR.joinpath('start-record.wav')
    return Thread(target=play_audio, args=(str(wav_path),))

 def main():
    """Record one utterance, transcribe it, and type the result.

    Starts the notification sound, records from the microphone with
    ``Recognizer.listen``, passes the audio to ``recognize_google`` and
    types the recognized text via ``type_text``. Recognition failures are
    printed and appended to ``error_log.txt`` in ``BASE_DIR`` instead of
    propagating.
    """
    r = sr.Recognizer()

    # Keep the microphone open only while recording; recognition and typing
    # work on the captured audio and do not need the device.
    with sr.Microphone() as source:
        make_sound_thread().start()

        # If background noise is a problem, call
        # r.adjust_for_ambient_noise(source) here before listening.
        print("Listening...")
        audio = r.listen(source)
    print('done listening')

    try:
        text = r.recognize_google(audio)
    except (sr.UnknownValueError, sr.RequestError) as e:
        # UnknownValueError: the audio was unintelligible.
        # RequestError: the recognition request itself failed.
        make_sound_thread().start()
        if isinstance(e, sr.UnknownValueError):
            print("Unable to recognize speech")
        else:
            print("Speech recognition request failed:", e)
        # Include the exception type: str(e) alone is often empty, which
        # would leave blank lines in the log.
        with open(BASE_DIR.joinpath('error_log.txt'), "a") as error_file:
            error_file.write(type(e).__name__ + ': ' + str(e) + '\n')
    else:
        print("Detected Speech:", text)
        type_text(text)

 # Run the voice-typing flow only when this file is executed as a script.
 if __name__ == "__main__":
    main()
	# POC Type with your voice script
	# You may also need to install the additional dependencies: portaudio flac

	from pathlib import Path
	import speech_recognition as sr
	import pyaudio
	from pynput.keyboard import Controller
	from threading import Thread
	import wave

	# Directory containing this script; the notification sound and the error log
	# are looked up relative to it.
	BASE_DIR = Path(__file__).resolve().parent

	def type_text(text):
	    """Type ``text`` through a pynput keyboard controller, then press Enter.

	    Every character is sent as its own press/release pair.

	    Args:
	        text: The string to type.
	    """
	    # Local import: Key lives in the same pynput module the file already
	    # imports Controller from.
	    from pynput.keyboard import Key

	    keyboard = Controller()

	    for char in text:
	        keyboard.press(char)
	        keyboard.release(char)

	    # Submit with the dedicated Enter key instead of the raw '\n' character;
	    # pynput maps '\n' to Enter only inside Controller.type(), not in
	    # press()/release().
	    keyboard.press(Key.enter)
	    keyboard.release(Key.enter)


	def play_audio(filename):
	    """Play a WAV file through a PyAudio output stream.

	    Returns once every frame of the file has been written to the stream.
	    The file, the stream and the PortAudio interface are released even if
	    playback fails part-way through.

	    Args:
	        filename: Path of the WAV file to play.
	    """
	    chunk_frames = 1024  # frames read from the file per write to the stream

	    # wave.open() supports the context-manager protocol, so the file is
	    # closed on every exit path.
	    with wave.open(filename, 'rb') as wav:
	        pa = pyaudio.PyAudio()
	        try:
	            # Sample format, channel count and rate all come from the WAV
	            # header so the stream matches the file.
	            stream = pa.open(
	                format=pa.get_format_from_width(wav.getsampwidth()),
	                channels=wav.getnchannels(),
	                rate=wav.getframerate(),
	                output=True,
	            )
	            try:
	                data = wav.readframes(chunk_frames)
	                # readframes() returns b'' once the file is exhausted.
	                while data:
	                    stream.write(data)
	                    data = wav.readframes(chunk_frames)
	                stream.stop_stream()
	            finally:
	                stream.close()
	        finally:
	            pa.terminate()

	def make_sound_thread():
	    """Build (without starting) a thread that plays the notification sound.

	    Returns:
	        An unstarted ``Thread`` whose target is ``play_audio`` called with the
	        path of ``start-record.wav`` inside ``BASE_DIR``.
	    """
	    sound_file_path = str(BASE_DIR.joinpath('start-record.wav'))
	    return Thread(target=play_audio, args=(sound_file_path,))

	def main():
	    """Record one utterance, transcribe it, and type the result.

	    Starts the notification sound, records from the microphone with
	    ``Recognizer.listen``, passes the audio to ``recognize_google`` and
	    types the recognized text via ``type_text``. Recognition failures are
	    printed and appended to ``error_log.txt`` in ``BASE_DIR`` instead of
	    propagating.
	    """
	    r = sr.Recognizer()

	    # Keep the microphone open only while recording; recognition and typing
	    # work on the captured audio and do not need the device.
	    with sr.Microphone() as source:
	        make_sound_thread().start()

	        # If background noise is a problem, call
	        # r.adjust_for_ambient_noise(source) here before listening.
	        print("Listening...")
	        audio = r.listen(source)
	    print('done listening')

	    try:
	        text = r.recognize_google(audio)
	    except (sr.UnknownValueError, sr.RequestError) as e:
	        # UnknownValueError: the audio was unintelligible.
	        # RequestError: the recognition request itself failed.
	        make_sound_thread().start()
	        if isinstance(e, sr.UnknownValueError):
	            print("Unable to recognize speech")
	        else:
	            print("Speech recognition request failed:", e)
	        # Include the exception type: str(e) alone is often empty, which
	        # would leave blank lines in the log.
	        with open(BASE_DIR.joinpath('error_log.txt'), "a") as error_file:
	            error_file.write(type(e).__name__ + ': ' + str(e) + '\n')
	    else:
	        print("Detected Speech:", text)
	        type_text(text)

	# Run the voice-typing flow only when this file is executed as a script.
	if __name__ == "__main__":
	    main()