dragonfire/sr/decoder_test.py from DragonComputer/Dragonfire

dragonfire/sr/decoder_test.py
Summary

Maintainability

0 mins
Test Coverage

Issues
# -*- coding: UTF-8 -*-

from __future__ import print_function
from __future__ import absolute_import
import unittest
from gi.repository import GObject
import _thread as thread  # Low-level threading API (Python 3.x)
import logging
from dragonfire.sr.decoder import DecoderPipeline
import time
import pyaudio  # Provides Python bindings for PortAudio, the cross platform audio API

import pytest

CHUNK = 8000  # Smallest unit of audio. 1024 bytes
FORMAT = pyaudio.paInt16  # Data format
CHANNELS = 1  # Number of channels
RATE = 16000  # Bit Rate of audio stream / Frame Rate
THRESHOLD = 1000  # Threshhold value for detecting stimulant
RECORD_SECONDS = 10


class DecoderPipelineTests(unittest.TestCase):
    def __init__(self, *args, **kwargs):
        super(DecoderPipelineTests, self).__init__(*args, **kwargs)
        logging.basicConfig(level=logging.INFO)

    @classmethod
    def setUpClass(cls):
        # voxforge/tri2b_mmi_b0.05 model:
        decoder_conf = {
            "model": "models/english/final.mdl",
            "lda-mat": "models/english/final.mat",
            "word-syms": "models/english/words.txt",
            "fst": "models/english/HCLG.fst",
            "silence-phones": "6"
        }
        cls.decoder_pipeline = DecoderPipeline({"decoder": decoder_conf})
        cls.words = []
        cls.finished = False

        cls.decoder_pipeline.set_word_handler(cls.word_getter)
        cls.decoder_pipeline.set_eos_handler(cls.set_finished, cls.finished)

        loop = GObject.MainLoop()
        thread.start_new_thread(loop.run, ())

    @classmethod
    def word_getter(cls, word):
        cls.words.append(word)

    @classmethod
    def set_finished(cls, finished):
        cls.finished = finished

    def setUp(self):
        self.__class__.words = []
        self.__class__.finished = False

    @pytest.mark.skip(reason="Kaldi is deprecated.")
    def testRecognize(self):
        self.decoder_pipeline.init_request(
            "recognize",
            "audio/x-raw, layout=(string)interleaved, rate=(int)16000, format=(string)S16LE, channels=(int)1"
        )
        p = pyaudio.PyAudio()  # Create a PyAudio session
        # Create a stream
        stream = p.open(
            format=FORMAT,
            channels=CHANNELS,
            rate=RATE,
            input=True,
            output=True,
            frames_per_buffer=CHUNK)

        data = stream.read(CHUNK)  # Get first data frame from the microphone
        for i in range(0, int(RATE / CHUNK * RECORD_SECONDS)):
            data = stream.read(CHUNK)  # Read a new chunk from the stream
            stream.write(data, CHUNK)
            # time.sleep(0.25)
            self.decoder_pipeline.process_data(data)

        stream.stop_stream()
        stream.close()
        p.terminate()

        self.decoder_pipeline.end_request()
        while not self.finished:
            time.sleep(1)
        print(self.words)

    @pytest.mark.skip(reason="Kaldi is deprecated.")
    def testWav(self):
        self.decoder_pipeline.init_request("testWav", "")
        f = open("tests/ten_digits.wav", "rb")
        for block in iter(lambda: f.read(16000 * 2 * 2 / 4), ""):
            time.sleep(0.25)
            self.decoder_pipeline.process_data(block)

        self.decoder_pipeline.end_request()

        while not self.finished:
            time.sleep(1)
        self.assertEqual([
            'ONE', 'TWO', 'THREE', 'FOUR', 'FIVE', 'SIX', 'SEVEN', 'EIGHT',
            '<#s>'
        ], self.words)


def main():
    unittest.main()


if __name__ == '__main__':
    main()