From 54cf720f8b0396fa21b15a09f751d20dc8b5cb26 Mon Sep 17 00:00:00 2001
From: Matthew Scholefield <matthew3311999@gmail.com>
Date: Thu, 23 Jun 2016 16:03:47 -0500
Subject: [PATCH] Added timeout override to listener and fixed bug with it
 previously the listner's behavior would be influenced by the buffer size.
 Now, however, it is not since the noise is increased by a factor of the
 seconds per buffer.

---
 mycroft/client/speech/mic.py | 20 +++++++++++++++-----
 1 file changed, 15 insertions(+), 5 deletions(-)

diff --git a/mycroft/client/speech/mic.py b/mycroft/client/speech/mic.py
index cb98af8c2c..f6d1a5f3d8 100644
--- a/mycroft/client/speech/mic.py
+++ b/mycroft/client/speech/mic.py
@@ -126,12 +126,16 @@ class ResponsiveRecognizer(speech_recognition.Recognizer):
 
     # The minimum seconds of noise before a
     # phrase can be considered complete
-    MIN_LOUD_SEC_PER_PHRASE = 0.2
+    MIN_LOUD_SEC_PER_PHRASE = 0.1
 
     # The maximum length a phrase can be recorded,
     # provided there is noise the entire time
     RECORDING_TIMEOUT = 30.0
 
+    # The maximum time it will continue to record silence
+    # when not enough noise has been detected
+    RECORDING_TIMEOUT_WITH_SILENCE = 3.0
+
     # Time between pocketsphinx checks for the wake word
     SEC_BETWEEN_WW_CHECKS = 0.2
 
@@ -167,17 +171,17 @@ class ResponsiveRecognizer(speech_recognition.Recognizer):
         num_loud_chunks = 0
         noise = 0
 
-        max_noise = 20
+        max_noise = 25
         min_noise = 0
 
         def increase_noise(level):
             if level < max_noise:
-                return level + 2
+                return level + 200 * sec_per_buffer
             return level
 
         def decrease_noise(level):
             if level > min_noise:
-                return level - 1
+                return level - 100 * sec_per_buffer
             return level
 
         # Smallest number of loud chunks required to return
@@ -187,6 +191,9 @@ class ResponsiveRecognizer(speech_recognition.Recognizer):
         max_chunks = int(self.RECORDING_TIMEOUT / sec_per_buffer)
         num_chunks = 0
 
+        # Will return if exceeded this even if there's not enough loud chunks
+        max_chunks_of_silence = int(self.RECORDING_TIMEOUT_WITH_SILENCE/sec_per_buffer)
+
         # bytearray to store audio in
         byte_data = '\0' * source.SAMPLE_WIDTH
 
@@ -205,7 +212,10 @@ class ResponsiveRecognizer(speech_recognition.Recognizer):
                 noise = decrease_noise(noise)
                 self.adjust_threshold(energy, sec_per_buffer)
 
-            if noise <= min_noise and num_loud_chunks > min_loud_chunks:
+            was_loud_enough = num_loud_chunks > min_loud_chunks
+            quiet_enough = noise <= min_noise
+            recorded_too_much_silence = num_chunks > max_chunks_of_silence
+            if quiet_enough and (was_loud_enough or recorded_too_much_silence):
                 phrase_complete = True
 
         return byte_data