mherwig/VoiceControl.sh

## simple-voice-control.sh
#!/bin/bash
#
# Author: Mike Herwig
# Description:
# Simple voice control demonstration using Google's Speech API

# Language code sent to the recognizer through the "lang" query parameter.
# Deliberately not named LANG: LANG is the locale variable that bash and every
# child process (grep, sed, awk, wget, ...) consult, and a bare "en" is normally
# not an installed locale name.
SPEECH_LANG="en"

# Endpoint the recorded audio is POSTed to.
API="http://www.google.com/speech-api/v1/recognize?lang=$SPEECH_LANG"

# Spoken phrases the script reacts to (matched case-insensitively).
CMD_LIST_DIRECTORY="list directory"
CMD_WHOAMI="who am i"


# Record with arecord (-d 3), encode the audio into out.flac in the current
# directory, then POST that file to $API.
# Anything either command writes to stdout is captured in JSON; wget prints
# the response body there because of "-O -".
JSON=$(
	arecord -f cd -t wav -d 3 -r 16000 | flac - -f --best --sample-rate 16000 -o out.flac
	wget -O - -o /dev/null --post-file out.flac --header="Content-Type: audio/x-flac; rate=16000" "$API"
)

# Print the recognized text contained in the recognizer response given as $1.
#
# The response is flattened to one line and its braces are removed. The text is
# whatever follows the second ':' inside the third comma-separated field, with
# double quotes stripped. Nothing is printed if that field has fewer than two
# colons.
#
# $1 is always expanded quoted: unquoted it would be word-split and
# glob-expanded, so a "*" in the response would turn into file names.
# Only the field prefix up to the second colon is removed, so a colon inside
# the recognized text itself is preserved.
function extractUtterance {
	printf '%s' "$1" \
		| tr '\n' ' ' \
		| sed -e 's/[{}]//g' \
		| awk -F, '{ text = $3; if (sub(/^[^:]*:[^:]*:/, "", text)) print text; exit }' \
		| sed -e 's/"//g'
}

UTTERANCE=$(extractUtterance "$JSON")

echo "utterance: $UTTERANCE"
echo ""

# Run the shell command mapped to the recognized phrase, if any.
# Each phrase is used as an anchored, case-insensitive grep pattern; the first
# phrase that matches wins.
if echo "$UTTERANCE" | grep -qi "^$CMD_LIST_DIRECTORY$"; then
	ls .
elif echo "$UTTERANCE" | grep -qi "^$CMD_WHOAMI$"; then
	whoami
fi

## VoiceControl.sh
#!/bin/bash
#
# Author: Mike Herwig
# Description:
# Updated voice control demonstration using Google's Speech API.
# The main difference from the previous script I uploaded to my Gist is that it now uses sox for recording
# and only records your voice to disk once sox detects sound.
# Dependencies: sox, wget

# Language code sent to the recognizer through the "lang" query parameter.
# Deliberately not named LANG: LANG is the locale variable that bash and every
# child process (rec, wget, grep, sed, awk, ...) consult, and a bare "en" is
# normally not an installed locale name.
SPEECH_LANG="en"

# Endpoint the recorded audio is POSTed to.
API="http://www.google.com/speech-api/v1/recognize?lang=$SPEECH_LANG"

# Spoken phrases the script reacts to (matched case-insensitively).
CMD_LIST_DIRECTORY="list directory"
CMD_WHOAMI="who am i"

# Record one spoken command into /tmp/cmdrecording.flac using sox's `rec`.
# The trailing `silence` effect arguments control when recording starts and
# stops. NOTE(review): presumably "start once input exceeds 3% for 0.1 s, stop
# after 3.0 s below 3%" - confirm against the sox manual.
# Returns: the exit status of rec.
waitForCommand() {
	local -a recordArgs=(
		/tmp/cmdrecording.flac
		rate 32k
		silence 1 0.1 3% 1 3.0 3%
	)
	rec "${recordArgs[@]}"
}

# POST /tmp/cmdrecording.flac to $API and keep the response.
# Globals:  API (read), JSON (written: whatever wget prints on stdout)
# Returns:  the exit status of wget
speechToJSON() {
	local -a request=(
		-O - -o /dev/null
		--post-file /tmp/cmdrecording.flac
		--header="Content-Type: audio/x-flac; rate=32000"
		"$API"
	)
	JSON=$(wget "${request[@]}")
}

# Extract the recognized text from the recognizer response and report it.
#
# The response is flattened to one line and its braces are removed. The text is
# whatever follows the second ':' inside the third comma-separated field, with
# double quotes stripped. UTTERANCE is empty if that field has fewer than two
# colons.
#
# Globals:  JSON (read), UTTERANCE (written)
# Outputs:  "utterance: <text>" followed by an empty line on stdout
function getUtterance {
	# $JSON is expanded quoted: unquoted it would be word-split and
	# glob-expanded, so a "*" in the response would turn into file names.
	# Only the prefix up to the second colon is removed from the field, so a
	# colon inside the recognized text itself is preserved.
	UTTERANCE=$(printf '%s' "$JSON" \
		| tr '\n' ' ' \
		| sed -e 's/[{}]//g' \
		| awk -F, '{ text = $3; if (sub(/^[^:]*:[^:]*:/, "", text)) print text; exit }' \
		| sed -e 's/"//g')

	echo "utterance: $UTTERANCE"
	echo ""
}

# Main loop: wait for a spoken command, transcribe it, and run the matching
# action. Repeats until the script is interrupted.
while true; do
	# Forget the previous phrase first. If recording, upload or parsing fails,
	# getUtterance never runs and the old value would otherwise be matched -
	# and its command executed - a second time.
	UTTERANCE=""

	if ! { waitForCommand && speechToJSON && getUtterance; }; then
		continue
	fi

	# Each phrase is used as an anchored, case-insensitive grep pattern.
	if echo "$UTTERANCE" | grep -qi "^$CMD_LIST_DIRECTORY$"; then
		ls .
	elif echo "$UTTERANCE" | grep -qi "^$CMD_WHOAMI$"; then
		whoami
	fi

	#sleep 1
done
	#!/bin/bash
	#
	# Author: Mike Herwig
	# Description:
	# Simple voice control demonstration using Google's Speech API

	# Language code sent to the recognizer through the "lang" query parameter.
	# Deliberately not named LANG: LANG is the locale variable that bash and
	# every child process (grep, sed, awk, wget, ...) consult, and a bare "en"
	# is normally not an installed locale name.
	SPEECH_LANG="en"

	# Endpoint the recorded audio is POSTed to.
	API="http://www.google.com/speech-api/v1/recognize?lang=$SPEECH_LANG"

	# Spoken phrases the script reacts to (matched case-insensitively).
	CMD_LIST_DIRECTORY="list directory"
	CMD_WHOAMI="who am i"


	# Record with arecord (-d 3), encode the audio into out.flac in the current
	# directory, then POST that file to $API.
	# The "|" must be a real, unescaped pipe: written as "\|" it is handed to
	# arecord as a literal argument and flac never runs.
	# Anything either command writes to stdout is captured in JSON; wget prints
	# the response body there because of "-O -".
	JSON=$(
		arecord -f cd -t wav -d 3 -r 16000 | flac - -f --best --sample-rate 16000 -o out.flac
		wget -O - -o /dev/null --post-file out.flac --header="Content-Type: audio/x-flac; rate=16000" "$API"
	)

	# Print the recognized text contained in the recognizer response given as $1.
	#
	# The response is flattened to one line and its braces are removed. The text
	# is whatever follows the second ':' inside the third comma-separated field,
	# with double quotes stripped. Nothing is printed if that field has fewer
	# than two colons.
	#
	# The stages are joined with real pipes: written as "\|" the sed/awk
	# commands are merely echoed as text. $1 is expanded quoted so it is not
	# word-split or glob-expanded, and only the prefix up to the second colon is
	# removed so a colon inside the recognized text itself is preserved.
	function extractUtterance {
		printf '%s' "$1" \
			| tr '\n' ' ' \
			| sed -e 's/[{}]//g' \
			| awk -F, '{ text = $3; if (sub(/^[^:]*:[^:]*:/, "", text)) print text; exit }' \
			| sed -e 's/"//g'
	}

	UTTERANCE=$(extractUtterance "$JSON")

	echo "utterance: $UTTERANCE"
	echo ""

	# Run the shell command mapped to the recognized phrase, if any.
	# Each phrase is used as an anchored, case-insensitive grep pattern. The
	# pipe into grep must be unescaped: with "\|" echo just prints the grep
	# command as text and no phrase can ever match.
	if echo "$UTTERANCE" | grep -qi "^$CMD_LIST_DIRECTORY$"; then
		ls .
	elif echo "$UTTERANCE" | grep -qi "^$CMD_WHOAMI$"; then
		whoami
	fi