mherwig · December 11, 2015 23:18 · mherwig · Feb 13, 2014
diff --git a/simple-voice-control.sh b/simple-voice-control.sh
 #!/bin/bash
 #
 # Author: Mike Herwig
 # Description:
 # Simple voice control demonstration using Google's Speech API

 # Language code appended to the recognition URL. It is kept in its own
 # variable because LANG is the locale environment variable: assigning "en"
 # to it would change the locale of every command this script launches.
 SPEECH_LANG="en"

 # Speech recognition endpoint the recorded audio is POSTed to.
 API="http://www.google.com/speech-api/v1/recognize?lang=$SPEECH_LANG"

 # Spoken phrases the script reacts to.
 CMD_LIST_DIRECTORY="list directory"
 CMD_WHOAMI="who am i"


 # Record 3 seconds of audio with arecord, encode it to out.flac (overwriting
 # any existing file), then POST that file to $API and keep the response body
 # in JSON. wget's log output goes to /dev/null so only the body is captured.
 # The upload is chained with && so that a failed recording/encoding step does
 # not send a stale or missing out.flac.
 JSON=$(
 	arecord -f cd -t wav -d 3 -r 16000 \
 		| flac - -f --best --sample-rate 16000 -o out.flac \
 		&& wget -O - -o /dev/null --post-file out.flac \
 			--header="Content-Type: audio/x-flac; rate=16000" "$API"
 )

 # Pull the recognised phrase out of the raw response held in $JSON.
 # The response is handled positionally rather than with a JSON parser:
 # braces are dropped, the text is split on commas, the third piece is split
 # on colons, and its third colon-field (double quotes removed) is the result.
 # $JSON is passed quoted so the shell never word-splits or glob-expands it
 # (an unquoted "*" in the response would be replaced by file names).
 UTTERANCE=$(printf '%s' "$JSON" | awk '
 	# Join multi-line input into a single record.
 	{ doc = (NR > 1 ? doc " " : "") $0 }
 	END {
 		gsub(/[{}]/, "", doc)
 		split(doc, pieces, ",")
 		split(pieces[3], fields, ":")
 		gsub(/"/, "", fields[3])
 		print fields[3]
 	}')

 echo "utterance: $UTTERANCE"
 echo ""

 # Run the action whose phrase equals the whole utterance (case-insensitive).
 # grep's exit status alone says whether a line matched, so no count is needed.
 if grep -qi "^$CMD_LIST_DIRECTORY$" <<<"$UTTERANCE"; then
 	ls .
 elif grep -qi "^$CMD_WHOAMI$" <<<"$UTTERANCE"; then
 	whoami
 fi
diff --git a/VoiceControl.sh b/VoiceControl.sh
 #!/bin/bash
 #
 # Author: Mike Herwig
 # Description:
 # Updated voice control demonstration using Google's Speech API.
 # The main difference from the previous script I uploaded to my Gist is that it now uses sox for recording
 # and only records your voice to disk when sox detects sound.
 # Dependencies: sox, wget

 # Language code appended to the recognition URL. It is kept in its own
 # variable because LANG is the locale environment variable: assigning "en"
 # to it would change the locale of every command this script launches.
 SPEECH_LANG="en"

 # Speech recognition endpoint the recorded audio is POSTed to.
 API="http://www.google.com/speech-api/v1/recognize?lang=$SPEECH_LANG"

 # Spoken phrases the script reacts to.
 CMD_LIST_DIRECTORY="list directory"
 CMD_WHOAMI="who am i"

 # Record one spoken command into /tmp/cmdrecording.flac using sox's `rec`.
 # The `silence` effect arguments are what gate the recording on sound; per
 # the sox manual they start capture after 0.1 s above a 3% level and stop
 # after 3.0 s below it (NOTE(review): confirm against the installed sox).
 # Returns: the exit status of `rec`.
 waitForCommand() {
 	local recording=/tmp/cmdrecording.flac

 	rec "$recording" \
 		rate 32k \
 		silence 1 0.1 3% 1 3.0 3%
 }

 # POST /tmp/cmdrecording.flac to $API and store the response body in the
 # global JSON. wget's log is sent to /dev/null so only the body is captured.
 # Globals: API (read), JSON (written)
 # Returns: the exit status of wget.
 speechToJSON() {
 	local -a request=(
 		-O -
 		-o /dev/null
 		--post-file /tmp/cmdrecording.flac
 		--header="Content-Type: audio/x-flac; rate=32000"
 		"$API"
 	)

 	JSON=$(wget "${request[@]}")
 }

 # Extract the recognised phrase from the raw response held in $JSON.
 #
 # Globals:
 #   JSON      (read)    response text to parse
 #   UTTERANCE (written) extracted text, or empty when the field is missing
 # Outputs:
 #   "utterance: <text>" followed by a blank line on stdout
 #
 # The response is handled positionally rather than with a JSON parser:
 # braces are dropped, the text is split on commas, the third piece is split
 # on colons, and its third colon-field (double quotes removed) is the result.
 # $JSON is passed quoted so the shell never word-splits or glob-expands it
 # (an unquoted "*" in the response would be replaced by file names).
 function getUtterance {
 	UTTERANCE=$(printf '%s' "$JSON" | awk '
 		# Join multi-line input into a single record.
 		{ doc = (NR > 1 ? doc " " : "") $0 }
 		END {
 			gsub(/[{}]/, "", doc)
 			split(doc, pieces, ",")
 			split(pieces[3], fields, ":")
 			gsub(/"/, "", fields[3])
 			print fields[3]
 		}')

 	echo "utterance: $UTTERANCE"
 	echo ""
 }

 # Main loop: record a command, send it for recognition, then run the action
 # whose phrase equals the whole utterance (case-insensitive).
 while true; do
 	# Forget the previous result first. If recording or recognition fails,
 	# getUtterance is skipped, and without this reset the last recognised
 	# command would be executed again.
 	UTTERANCE=""
 	waitForCommand && speechToJSON && getUtterance

 	if grep -qi "^$CMD_LIST_DIRECTORY$" <<<"$UTTERANCE"; then
 		ls .
 	elif grep -qi "^$CMD_WHOAMI$" <<<"$UTTERANCE"; then
 		whoami
 	fi

 	#sleep 1
 done
	#!/bin/bash
	#
	# Author: Mike Herwig
	# Description:
	# Simple voice control demonstration using Google's Speech API

	# Language code appended to the recognition URL. It is kept in its own
	# variable because LANG is the locale environment variable: assigning "en"
	# to it would change the locale of every command this script launches.
	SPEECH_LANG="en"

	# Speech recognition endpoint the recorded audio is POSTed to.
	API="http://www.google.com/speech-api/v1/recognize?lang=$SPEECH_LANG"

	# Spoken phrases the script reacts to.
	CMD_LIST_DIRECTORY="list directory"
	CMD_WHOAMI="who am i"


	# Record 3 seconds of audio with arecord, encode it to out.flac, then POST
	# that file to $API and keep the response body in JSON. The pipes are real
	# pipeline operators here; written as "\|" the shell would pass a literal
	# "|" argument instead of connecting the commands. The upload is chained
	# with && so a failed recording does not send a stale or missing out.flac.
	JSON=$(
		arecord -f cd -t wav -d 3 -r 16000 \
			| flac - -f --best --sample-rate 16000 -o out.flac \
			&& wget -O - -o /dev/null --post-file out.flac \
				--header="Content-Type: audio/x-flac; rate=16000" "$API"
	)

	# Pull the recognised phrase out of the response positionally: drop braces,
	# split on commas, split the third piece on colons, and take its third
	# colon-field with double quotes removed. $JSON is quoted so the shell does
	# not word-split or glob-expand it.
	UTTERANCE=$(printf '%s' "$JSON" | awk '
		# Join multi-line input into a single record.
		{ doc = (NR > 1 ? doc " " : "") $0 }
		END {
			gsub(/[{}]/, "", doc)
			split(doc, pieces, ",")
			split(pieces[3], fields, ":")
			gsub(/"/, "", fields[3])
			print fields[3]
		}')

	echo "utterance: $UTTERANCE"
	echo ""

	# Run the action whose phrase equals the whole utterance (case-insensitive).
	if grep -qi "^$CMD_LIST_DIRECTORY$" <<<"$UTTERANCE"; then
		ls .
	elif grep -qi "^$CMD_WHOAMI$" <<<"$UTTERANCE"; then
		whoami
	fi