Added simple continuous mode (Under Development)

JamezQ · Mar 24, 2013 · cf5d1dd · cf5d1dd
1 parent 1d1655e
commit cf5d1dd
Show file tree

Hide file tree

Showing 8 changed files with 143 additions and 3 deletions.
diff --git a/Microphone/pycmd_nocmd b/Microphone/pycmd_nocmd
diff --git a/PEOPLE_WANT.txt b/PEOPLE_WANT.txt
@@ -9,11 +9,11 @@ show me my recent documents
 navigate to some place
 directions to some place
 
-whats my ip - BmanDesigns
+whats my ip - BmanDesigns (Done)
 
 where am I
 
-who am I - BmanDesigns
+who am I - BmanDesigns (Done)
 
 ifconfig
 

diff --git a/Recognition/bin/UserInformation b/Recognition/bin/UserInformation
diff --git a/Recognition/config/plugins.db b/Recognition/config/plugins.db
diff --git a/Recognition/modes/main.dic b/Recognition/modes/main.dic
@@ -1,3 +1,9 @@
+#PLUGIN: UserInformation
+<<w,W>hat's,<w,W>hats,<w,W>hat is> my <i,I><p,P>
+  UserInformation ip
+<<w,W>hat's,<w,W>hats,<w,W>hat is> my name
+  UserInformation name
+#END
 #PLUGIN: Gmail
 <d,D>o <i,I> have new <mail,messages,email>
   Gmail unread

diff --git a/continue b/continue
@@ -0,0 +1,134 @@
+#!/usr/bin/python
+
+# Open a microphone stream with PyAudio and monitor its loudness; ./hotkey is run when a stretch of sound is followed by silence.
+
+import pyaudio
+import struct
+import math
+import os
+
+INITIAL_TAP_THRESHOLD = 0.010  # starting value stored in TapTester.tap_threshold
+FORMAT = pyaudio.paInt16  # sample format passed to the stream; get_rms unpacks the data as 16-bit shorts
+SHORT_NORMALIZE = (1.0/32768.0)  # scales a signed 16-bit sample to roughly -1.0..1.0
+CHANNELS = 2  # channel count passed to the input stream
+RATE = 44100  # sample rate passed to the input stream
+INPUT_BLOCK_TIME = 0.05  # duration of one analysis block (presumably seconds, since it is multiplied by RATE)
+INPUT_FRAMES_PER_BLOCK = int(RATE*INPUT_BLOCK_TIME)  # frames requested per stream read
+# if we get this many noisy blocks in a row, increase the threshold
+# NOTE(review): nothing in the visible code references OVERSENSITIVE
+OVERSENSITIVE = 15.0/INPUT_BLOCK_TIME                    
+# if we get this many quiet blocks in a row, decrease the threshold
+# NOTE(review): nothing in the visible code references UNDERSENSITIVE
+UNDERSENSITIVE = 120.0/INPUT_BLOCK_TIME 
+# if the noise was longer than this many blocks, it's not a 'tap'
+# (in the visible code this only seeds TapTester.noisycount)
+MAX_TAP_BLOCKS = 0.15/INPUT_BLOCK_TIME
+
+def get_rms( block ):
+	# RMS amplitude is defined as the square root of the 
+	# mean over time of the square of the amplitude.
+	# so we need to convert this string of bytes into 
+	# a string of 16-bit samples...
+
+	# we will get one short out for each 
+	# two chars in the string.
+	count = len(block)/2
+	format = "%dh"%(count)
+	shorts = struct.unpack( format, block )
+
+	# iterate over the block.
+	sum_squares = 0.0
+	for sample in shorts:
+		# sample is a signed short in +/- 32768. 
+		# normalize it to 1.0
+		n = sample * SHORT_NORMALIZE
+		sum_squares += n*n
+
+	return math.sqrt( sum_squares / count )
+
+class TapTester(object):
+	def __init__(self):
+		self.pa = pyaudio.PyAudio()
+		self.stream = self.open_mic_stream()
+		self.tap_threshold = INITIAL_TAP_THRESHOLD
+		self.noisycount = MAX_TAP_BLOCKS+1 
+		self.quietcount = 0 
+		self.errorcount = 0
+		self.trigger = True
+		self.switchmiddle = False
+		self.switchon = False
+		self.switchoff = True
+
+	def stop(self):
+		self.stream.close()
+
+	def find_input_device(self):
+		device_index = None            
+		for i in range( self.pa.get_device_count() ):     
+			devinfo = self.pa.get_device_info_by_index(i)   
+			print( "Device %d: %s"%(i,devinfo["name"]) )
+
+			for keyword in ["mic","input"]:
+				if keyword in devinfo["name"].lower():
+				    print( "Found an input: device %d - %s"%(i,devinfo["name"]) )
+				    device_index = i
+				    return device_index
+
+		if device_index == None:
+			print( "No preferred input found; using default input device." )
+
+		return device_index
+
+	def open_mic_stream( self ):
+		device_index = self.find_input_device()
+
+		stream = self.pa.open(   format = FORMAT,
+				                 channels = CHANNELS,
+				                 rate = RATE,
+				                 input = True,
+				                 input_device_index = device_index,
+				                 frames_per_buffer = INPUT_FRAMES_PER_BLOCK)
+
+		return stream
+
+
+	def listen(self):
+		try:
+			block = self.stream.read(INPUT_FRAMES_PER_BLOCK)
+		except IOError, e:
+			# dammit. 
+			self.errorcount += 1
+			print( "(%d) Error recording: %s"%(self.errorcount,e) )
+			self.noisycount = 1
+			return
+
+		amplitude = get_rms( block )
+		amp2 = amplitude*1000
+		#print self.noisycount, self.quietcount
+		if amp2 > 2.0:
+			self.noisycount += 1
+			self.quietcount = 0
+		else:
+			self.noisycount = 0
+			self.quietcount += 1
+		if self.noisycount > 20:
+			if self.switchoff:
+				print "Switch On"
+				self.switchon = True
+			self.switchoff = False
+		if self.quietcount > 5:
+			if self.switchon and self.switchmiddle == False:
+				print "Switch Middle"
+				os.system("./hotkey")
+				self.quietcount = 0
+				self.switchmiddle = True
+			if self.quietcount > 30:
+				if self.switchon and self.switchmiddle:
+					print "Switch Off"
+					os.system("./hotkey")
+				self.switchon = False
+				self.switchmiddle = False
+				self.switchoff = True
+
+if __name__ == "__main__":
+	tt = TapTester()
+
+	for i in range(1000):
+		tt.listen()
diff --git a/result.json b/result.json
@@ -1 +1 @@
-{"status":0,"id":"b0ebf735610f34e9fcd10bf212d4e596-1","hypotheses":[{"utterance":"play bulletproof","confidence":0.9345257}]}
+{"status":0,"id":"7c8c98f3772cedd147af8603258fd7be-1","hypotheses":[{"utterance":"open Firefox","confidence":0.959115}]}
diff --git a/speech.flac b/speech.flac