-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsample_wave.py
60 lines (48 loc) · 2.38 KB
/
sample_wave.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
#!/usr/bin/env python2.7
import houndify
import sys
import time
import wave
# Command-line configuration: client credentials and the WAV file to stream.
# Exit with a usage message instead of an IndexError traceback when one of
# the three required arguments is missing.
if len(sys.argv) < 4:
    sys.exit("Usage: %s <client ID> <client key> <wav file>" % sys.argv[0])

CLIENT_ID = sys.argv[1]
CLIENT_KEY = sys.argv[2]
AUDIO_FILE = sys.argv[3]

# Number of frames requested from the WAV file per readframes() call.
BUFFER_SIZE = 512
#
# Simplest HoundListener; just print out what we receive.
# You can use these callbacks to interact with your UI.
#
class MyListener(houndify.HoundListener):
    """Listener that prints every callback payload it receives."""

    def onPartialTranscript(self, transcript):
        """Print the partial transcript, prefixed with a label."""
        message = "Partial transcript: " + transcript
        print(message)

    def onFinalResponse(self, response):
        """Print the string form of the final response."""
        message = "Final response: " + str(response)
        print(message)

    def onError(self, err):
        """Print the string form of the reported error."""
        message = "Error: " + str(err)
        print(message)
# Build the streaming client from the command-line credentials, using a
# fixed user id, then attach a fixed latitude/longitude to the client.
client = houndify.StreamingHoundClient(
    CLIENT_ID,
    CLIENT_KEY,
    "test_user",
)
client.setLocation(37.388309, -121.973968)
## Uncomment the lines below to see an example of using a custom
## grammar for matching. Use the file 'turnthelightson.wav' to try it.
# clientMatches = [ {
# "Expression" : '([1/100 ("can"|"could"|"will"|"would")."you"].[1/10 "please"].("turn"|"switch"|(1/100 "flip"))."on".["the"].("light"|"lights").[1/20 "for"."me"].[1/20 "please"])|([1/100 ("can"|"could"|"will"|"would")."you"].[1/10 "please"].[100 ("turn"|"switch"|(1/100 "flip"))].["the"].("light"|"lights")."on".[1/20 "for"."me"].[1/20 "please"])|((("i".("want"|"like"))|((("i".["would"])|("i\'d")).("like"|"want"))).["the"].("light"|"lights").["turned"|"switched"|("to"."go")|(1/100"flipped")]."on".[1/20"please"])"',
# "Result" : { "Intent" : "TURN_LIGHT_ON" },
# "SpokenResponse" : "Ok, I\'m turning the lights on.",
# "SpokenResponseLong" : "Ok, I\'m turning the lights on.",
# "WrittenResponse" : "Ok, I\'m turning the lights on.",
# "WrittenResponseLong" : "Ok, I\'m turning the lights on."
# } ]
# client.setHoundRequestInfo('ClientMatches', clientMatches)
# Open the WAV file, check that its format matches what the messages below
# describe as required, then stream it to the client in BUFFER_SIZE-frame
# chunks.
audio = wave.open(AUDIO_FILE)
try:
    # Report every format problem at once, then stop. The messages refer to
    # AUDIO_FILE (the previously used name `fname` was never defined, so any
    # failed check raised NameError instead of printing the message).
    format_ok = True
    if audio.getsampwidth() != 2:
        print("%s: wrong sample width (must be 16-bit)" % AUDIO_FILE)
        format_ok = False
    if audio.getframerate() not in (8000, 16000):
        print("%s: unsupported sampling frequency (must be either 8 or 16 khz)" % AUDIO_FILE)
        format_ok = False
    if audio.getnchannels() != 1:
        print("%s: must be single channel (mono)" % AUDIO_FILE)
        format_ok = False
    if not format_ok:
        sys.exit(1)

    client.setSampleRate(audio.getframerate())
    client.start(MyListener())

    # Playback duration of one chunk: 512 frames at 16 kHz is 0.032 s.
    # Deriving it from the frame rate keeps 8 kHz files at real-time pace too.
    chunk_seconds = BUFFER_SIZE / float(audio.getframerate())

    while True:
        samples = audio.readframes(BUFFER_SIZE)
        if not samples:
            # End of file: nothing left to send.
            break
        if client.fill(samples):
            # A truthy return from fill() ends streaming early
            # (presumably the service needs no more audio -- confirm in SDK).
            break
        time.sleep(chunk_seconds)  # simulate real-time so we can see the partial transcripts

    result = client.finish()  # returns either final response or error
finally:
    # Always release the file handle, including on early exit or error.
    audio.close()