163 lines
4.9 KiB
Python
163 lines
4.9 KiB
Python
# Copyright 2017 Mycroft AI Inc.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
#
|
|
import re
|
|
import time
|
|
from threading import Lock
|
|
|
|
from mycroft.configuration import Configuration
|
|
from mycroft.metrics import report_timing, Stopwatch
|
|
from mycroft.tts import TTSFactory
|
|
from mycroft.util import create_signal, check_for_signal
|
|
from mycroft.util.log import LOG
|
|
from mycroft.messagebus.message import Message
|
|
|
|
# Shared module state. Everything set to None here is filled in by init():
#   ws       - message bus connection
#   config   - result of Configuration.get()
#   tts      - TTS backend created by TTSFactory
#   tts_hash - fingerprint of the 'tts' config section, compared in
#              mute_and_speak() to decide whether the backend is recreated
# TODO:18.02 - Rename "ws" to "messagebus"
ws = config = tts = tts_hash = None

# Held by handle_speak() for the whole duration of one "speak" message.
lock = Lock()

# time.time() value recorded by handle_stop(); handle_speak() compares it
# with the moment it started speaking to abort the remaining chunks.
_last_stop_signal = 0
|
|
|
|
|
|
def _start_listener(message):
    """
    Force Mycroft to start listening (as if 'Hey Mycroft' was spoken).

    Used as a message bus callback; the only action taken is raising the
    'startListening' signal.

    Args:
        message: the triggering bus message (not used)
    """
    create_signal('startListening')
|
|
|
|
|
|
def handle_speak(event):
    """
    Handle "speak" message.

    Speaks event.data['utterance'] while holding the module lock and
    reports how long the speech handling took.

    Args:
        event: bus message; reads event.context (optional 'ident' entry)
               and event.data ('utterance', optional 'expect_response')
    """
    global _last_stop_signal

    config = Configuration.get()
    Configuration.init(ws)

    # Conversation ID, falling back to 'unknown' when the context has none
    context = event.context
    ident = context['ident'] if context and 'ident' in context else 'unknown'

    with lock:
        timer = Stopwatch()
        timer.start()
        utterance = event.data['utterance']

        if event.data.get('expect_response', False):
            # When expect_response is requested, the listener will be
            # restarted at the end of the next bit of spoken audio.
            ws.once('recognizer_loop:audio_output_end', _start_listener)

        # This is a bit of a hack for Picroft.  The analog audio on a Pi
        # blocks for 30 seconds fairly often, so we don't want to break on
        # periods (decreasing the chance of encountering the block).  But we
        # will keep the split for non-Picroft installs since it gives user
        # feedback faster on longer phrases.  Utterances containing
        # <...> tags are never split either.
        #
        # TODO: Remove or make an option?  This is really a hack, anyway,
        # so we likely will want to get rid of this when not running on Mimic
        platform = config.get('enclosure', {}).get('platform')
        split_sentences = (platform != "picroft" and
                           not re.search('<[^>]*>', utterance))

        if not split_sentences:
            mute_and_speak(utterance, ident)
        else:
            began = time.time()
            sentences = re.split(
                r'(?<!\w\.\w.)(?<![A-Z][a-z]\.)(?<=\.|\?)\s', utterance)
            for sentence in sentences:
                try:
                    mute_and_speak(sentence, ident)
                except KeyboardInterrupt:
                    raise
                except Exception:
                    LOG.error('Error in mute_and_speak', exc_info=True)
                # Drop the remaining sentences once a stop arrived after we
                # started, or when the 'buttonPress' signal is present.
                if _last_stop_signal > began:
                    break
                if check_for_signal('buttonPress'):
                    break

        timer.stop()
    report_timing(ident, 'speech', timer,
                  {'utterance': utterance, 'tts': tts.__class__.__name__})
|
|
|
|
|
|
def mute_and_speak(utterance, ident):
    """
    Start speaking the utterance using the selected tts backend.

    Before speaking, the 'tts' section of the configuration is compared
    with the fingerprint stored in tts_hash; when they differ the current
    backend's playback thread is stopped and a new backend is created.
    (NOTE(review): mic muting is presumably done inside the TTS backend;
    it is not visible in this function.)

    Args:
        utterance: The sentence to be spoken
        ident:     Ident tying the utterance to the source query
    """
    global tts
    global tts_hash

    # Fingerprint the config once, so a change that lands while the new
    # backend is being created is still detected on the next call.
    current_hash = hash(str(config.get('tts', '')))

    # update TTS object if configuration has changed
    if tts_hash != current_hash:
        # Stop the old playback thread, if a backend exists at all
        if tts:
            tts.playback.stop()
            tts.playback.join()
        # Create new tts instance
        tts = TTSFactory.create()
        tts.init(ws)
        tts_hash = current_hash

    LOG.info("Speak: " + utterance)
    try:
        tts.execute(utterance, ident)
    except Exception as e:
        # Best effort: a failing backend is logged, never propagated
        LOG.error('TTS execution failed ({})'.format(repr(e)))
|
|
|
|
|
|
def handle_stop(event):
    """
    Handle stop message.

    Does nothing unless the "isSpeaking" signal is present.  Otherwise the
    stop time is recorded, the TTS playback queue and visemes are cleared
    and "mycroft.stop.handled" is emitted on the bus.

    Args:
        event: the triggering bus message (not used)
    """
    global _last_stop_signal

    if not check_for_signal("isSpeaking", -1):
        return

    # Timestamp lets handle_speak() notice the stop between chunks
    _last_stop_signal = time.time()

    playback = tts.playback
    playback.clear_queue()
    playback.clear_visimes()

    ws.emit(Message("mycroft.stop.handled", {"by": "TTS"}))
|
|
|
|
|
|
def init(websocket):
    """
    Start speech related handlers.

    Stores the message bus connection, loads the configuration, registers
    the stop / speak / listen handlers and creates the initial TTS backend.

    Args:
        websocket: message bus client; handlers are registered through its
                   on() method and it is passed to Configuration.init()
                   and tts.init()
    """
    global ws
    global tts
    global tts_hash
    global config

    ws = websocket
    Configuration.init(ws)
    config = Configuration.get()

    ws.on('mycroft.stop', handle_stop)
    ws.on('mycroft.audio.speech.stop', handle_stop)
    ws.on('speak', handle_speak)
    ws.on('mycroft.mic.listen', _start_listener)

    tts = TTSFactory.create()
    tts.init(ws)
    # Store the fingerprint in exactly the form mute_and_speak() compares
    # against.  Keeping the raw config value here would never equal the
    # hash, forcing a needless backend teardown/recreate on the first
    # utterance.
    tts_hash = hash(str(config.get('tts', '')))
|
|
|
|
|
|
def shutdown():
    """
    Stop the TTS playback thread and wait for it to finish.

    Does nothing when no TTS backend is set.
    """
    if not tts:
        return

    playback = tts.playback
    playback.stop()
    playback.join()
|