dragonfly-grammars/kaldi_dfly_loader_plus_gui.py

"""
Command-module loader for Kaldi.

This script is based on 'dfly-loader-wsr.py' written by Christo Butcher and
has been adapted to work with the Kaldi engine instead.

This script can be used to look for Dragonfly command-modules for use with
the Kaldi engine. It scans the directory it's in and loads any ``_*.py`` it
finds.
"""

# TODO Have a simple GUI for pausing, resuming, cancelling and stopping
# recognition, etc

from __future__ import print_function

import logging
import os.path
import os
import sys

import six

from dragonfly import get_engine
from dragonfly import Grammar, MappingRule, Function, Dictation, FuncContext
from dragonfly.loader import CommandModuleDirectory
from dragonfly.log import setup_log

# --------------------------------------------------------------------------
# Set up basic logging.

if False:
    # Debugging logging for reporting trouble
    logging.basicConfig(level=10)
    logging.getLogger('grammar.decode').setLevel(20)
    logging.getLogger('grammar.begin').setLevel(20)
    logging.getLogger('compound').setLevel(20)
    logging.getLogger('kaldi.compiler').setLevel(10)
else:
    setup_log()


# --------------------------------------------------------------------------
# User notification / rudimentary UI. MODIFY AS DESIRED

# For message in ('sleep', 'wake')
def notify(message):
    if message == 'sleep':
        K = "sleeping"
        os.system('echo "{0}" | festival --tts'.format(K))
        print("Sleeping...")
        # get_engine().speak("Sleeping")
    elif message == 'wake':
        print("Awake...")
        K = "I have awakened"
        os.system('echo "{0}" | festival --tts'.format(K))
        # get_engine().speak("Awake")


# --------------------------------------------------------------------------
# Sleep/wake grammar. (This can be unused or removed if you don't want it.)

sleeping = False

def load_sleep_wake_grammar(initial_awake):
    sleep_grammar = Grammar("sleep")

    def sleep(force=False):
        global sleeping
        if not sleeping or force:
            sleeping = True
            sleep_grammar.set_exclusiveness(True)
        notify('sleep')

    def wake(force=False):
        global sleeping
        if sleeping or force:
            sleeping = False
            sleep_grammar.set_exclusiveness(False)
        notify('wake')

    class SleepRule(MappingRule):
        mapping = {
            "wake up":  Function(wake) + Function(lambda: get_engine().start_saving_adaptation_state()),
            "snore":   Function(lambda: get_engine().stop_saving_adaptation_state()) + Function(sleep),
            "halt listening":   Function(lambda: get_engine().stop_saving_adaptation_state()) + Function(sleep),
        }
    sleep_grammar.add_rule(SleepRule())

    sleep_noise_rule = MappingRule(
        name = "sleep_noise_rule",
        mapping = { "<text>": Function(lambda text: False and print(text)) },
        extras = [ Dictation("text") ],
        context = FuncContext(lambda: sleeping),
    )
    sleep_grammar.add_rule(sleep_noise_rule)

    sleep_grammar.load()

    if initial_awake:
        wake(force=True)
    else:
        sleep(force=True)


# --------------------------------------------------------------------------
# Main event driving loop.

def main():
    logging.basicConfig(level=logging.INFO)

    try:
        path = os.path.dirname(__file__)
    except NameError:
        # The "__file__" name is not always available, for example
        # when this module is run from PythonWin.  In this case we
        # simply use the current working directory.
        path = os.getcwd()
        __file__ = os.path.join(path, "kaldi_module_loader_plus.py")

    # Set any configuration options here as keyword arguments.
    # See Kaldi engine documentation for all available options and more info.
    engine = get_engine('kaldi',
        model_dir='kaldi_model',  # default model directory
        # vad_aggressiveness=3,  # default aggressiveness of VAD
        # vad_padding_start_ms=150,  # default ms of required silence before VAD
        # vad_padding_end_ms=150,  # default ms of required silence after VAD
        # vad_complex_padding_end_ms=500,  # default ms of required silence after VAD for complex utterances
        # input_device_index=None,  # set to an int to choose a non-default microphone
        # lazy_compilation=True,  # set to True to parallelize & speed up loading
        # retain_dir=None,  # set to a writable directory path to retain recognition metadata and/or audio data
        # retain_audio=None,  # set to True to retain speech data wave files in the retain_dir (if set)
    )

    # Call connect() now that the engine configuration is set.
    engine.connect()

    # Load grammars.
    load_sleep_wake_grammar(True)
    directory = CommandModuleDirectory(path, excludes=[__file__])
    directory.load()

    # Define recognition callback functions.
    def on_begin():
        print("Speech start detected.")

    def on_recognition(words):
        message = u"Recognized: %s" % u" ".join(words)

        # This only seems to be an issue with Python 2.7 on Windows.
        if six.PY2:
            encoding = sys.stdout.encoding or "ascii"
            message = message.encode(encoding, errors='replace')
        print(message)

    def on_failure():
        print("Sorry, what was that?")

    # Start the engine's main recognition loop
    engine.prepare_for_recognition()
    try:
        print("Listening...")
        engine.do_recognition(on_begin, on_recognition, on_failure)
    except KeyboardInterrupt:
        pass


if __name__ == "__main__":
    main()
added readme,md modified gerammars to work better on linux 2022-02-10 07:19:17 -06:00			`"""`
			`Command-module loader for Kaldi.`

			`This script is based on 'dfly-loader-wsr.py' written by Christo Butcher and`
			`has been adapted to work with the Kaldi engine instead.`

			`This script can be used to look for Dragonfly command-modules for use with`
			the Kaldi engine. It scans the directory it's in and loads any ``_*.py`` it
			`finds.`
			`"""`

			`# TODO Have a simple GUI for pausing, resuming, cancelling and stopping`
			`# recognition, etc`

			`from __future__ import print_function`

			`import logging`
			`import os.path`
			`import os`
			`import sys`

			`import six`

			`from dragonfly import get_engine`
			`from dragonfly import Grammar, MappingRule, Function, Dictation, FuncContext`
			`from dragonfly.loader import CommandModuleDirectory`
			`from dragonfly.log import setup_log`

			`# --------------------------------------------------------------------------`
			`# Set up basic logging.`

			`if False:`
			`# Debugging logging for reporting trouble`
			`logging.basicConfig(level=10)`
			`logging.getLogger('grammar.decode').setLevel(20)`
			`logging.getLogger('grammar.begin').setLevel(20)`
			`logging.getLogger('compound').setLevel(20)`
			`logging.getLogger('kaldi.compiler').setLevel(10)`
			`else:`
			`setup_log()`


			`# --------------------------------------------------------------------------`
			`# User notification / rudimentary UI. MODIFY AS DESIRED`

			`# For message in ('sleep', 'wake')`
			`def notify(message):`
			`if message == 'sleep':`
			`K = "sleeping"`
			`os.system('echo "{0}" \| festival --tts'.format(K))`
			`print("Sleeping...")`
			`# get_engine().speak("Sleeping")`
			`elif message == 'wake':`
			`print("Awake...")`
			`K = "I have awakened"`
			`os.system('echo "{0}" \| festival --tts'.format(K))`
			`# get_engine().speak("Awake")`


			`# --------------------------------------------------------------------------`
			`# Sleep/wake grammar. (This can be unused or removed if you don't want it.)`

			`sleeping = False`

			`def load_sleep_wake_grammar(initial_awake):`
			`sleep_grammar = Grammar("sleep")`

			`def sleep(force=False):`
			`global sleeping`
			`if not sleeping or force:`
			`sleeping = True`
			`sleep_grammar.set_exclusiveness(True)`
			`notify('sleep')`

			`def wake(force=False):`
			`global sleeping`
			`if sleeping or force:`
			`sleeping = False`
			`sleep_grammar.set_exclusiveness(False)`
			`notify('wake')`

			`class SleepRule(MappingRule):`
			`mapping = {`
			`"wake up": Function(wake) + Function(lambda: get_engine().start_saving_adaptation_state()),`
			`"snore": Function(lambda: get_engine().stop_saving_adaptation_state()) + Function(sleep),`
			`"halt listening": Function(lambda: get_engine().stop_saving_adaptation_state()) + Function(sleep),`
			`}`
			`sleep_grammar.add_rule(SleepRule())`

			`sleep_noise_rule = MappingRule(`
			`name = "sleep_noise_rule",`
			`mapping = { "<text>": Function(lambda text: False and print(text)) },`
			`extras = [ Dictation("text") ],`
			`context = FuncContext(lambda: sleeping),`
			`)`
			`sleep_grammar.add_rule(sleep_noise_rule)`

			`sleep_grammar.load()`

			`if initial_awake:`
			`wake(force=True)`
			`else:`
			`sleep(force=True)`


			`# --------------------------------------------------------------------------`
			`# Main event driving loop.`

			`def main():`
			`logging.basicConfig(level=logging.INFO)`

			`try:`
			`path = os.path.dirname(__file__)`
			`except NameError:`
			`# The "__file__" name is not always available, for example`
			`# when this module is run from PythonWin. In this case we`
			`# simply use the current working directory.`
			`path = os.getcwd()`
			`__file__ = os.path.join(path, "kaldi_module_loader_plus.py")`

			`# Set any configuration options here as keyword arguments.`
			`# See Kaldi engine documentation for all available options and more info.`
			`engine = get_engine('kaldi',`
			`model_dir='kaldi_model', # default model directory`
			`# vad_aggressiveness=3, # default aggressiveness of VAD`
			`# vad_padding_start_ms=150, # default ms of required silence before VAD`
			`# vad_padding_end_ms=150, # default ms of required silence after VAD`
			`# vad_complex_padding_end_ms=500, # default ms of required silence after VAD for complex utterances`
			`# input_device_index=None, # set to an int to choose a non-default microphone`
			`# lazy_compilation=True, # set to True to parallelize & speed up loading`
			`# retain_dir=None, # set to a writable directory path to retain recognition metadata and/or audio data`
			`# retain_audio=None, # set to True to retain speech data wave files in the retain_dir (if set)`
			`)`

			`# Call connect() now that the engine configuration is set.`
			`engine.connect()`

			`# Load grammars.`
			`load_sleep_wake_grammar(True)`
			`directory = CommandModuleDirectory(path, excludes=[__file__])`
			`directory.load()`

			`# Define recognition callback functions.`
			`def on_begin():`
			`print("Speech start detected.")`

			`def on_recognition(words):`
			`message = u"Recognized: %s" % u" ".join(words)`

			`# This only seems to be an issue with Python 2.7 on Windows.`
			`if six.PY2:`
			`encoding = sys.stdout.encoding or "ascii"`
			`message = message.encode(encoding, errors='replace')`
			`print(message)`

			`def on_failure():`
			`print("Sorry, what was that?")`

			`# Start the engine's main recognition loop`
			`engine.prepare_for_recognition()`
			`try:`
			`print("Listening...")`
			`engine.do_recognition(on_begin, on_recognition, on_failure)`
			`except KeyboardInterrupt:`
			`pass`


			`if __name__ == "__main__":`
			`main()`