human/human/audio_mal_handler.py

#encoding = utf8
import logging
import queue
import time

from threading import Thread, Event
from eventbus import EventBus

import numpy as np

from human_handler import AudioHandler
from utils import melspectrogram, SyncQueue

logger = logging.getLogger(__name__)


class AudioMalHandler(AudioHandler):
    """Audio handler that turns queued audio frames into mel-spectrogram chunks.

    Frames pushed through :meth:`on_handle` are stored in a ``SyncQueue``.
    A background thread repeatedly drains that queue, forwards every raw
    frame to ``on_next_handle`` with index ``0`` and, once enough frames
    are buffered, forwards a list of mel chunks with index ``1``.
    """

    def __init__(self, context, handler):
        """Register for the 'stop' event and start the worker thread.

        Args:
            context: Object providing ``batch_size``, ``sample_rate`` and
                ``fps`` (read here) plus ``stride_left_size`` and
                ``stride_right_size`` (read by the worker through
                ``self._context``; presumably stored by the base class --
                TODO confirm).
            handler: Passed unchanged to the base-class constructor.
        """
        super().__init__(context, handler)

        EventBus().register('stop', self._on_stop)

        self._queue = SyncQueue(context.batch_size, "AudioMalHandler_queue")

        # Everything the worker thread reads must exist before the thread
        # starts; otherwise _on_run/_run_step can hit AttributeError.
        self.frames = []
        self.chunk = context.sample_rate // context.fps
        self._is_running = True

        self._exit_event = Event()
        self._exit_event.set()
        self._thread = Thread(target=self._on_run, name="AudioMalHandlerThread")
        self._thread.start()
        logger.info("AudioMalHandler init")

    def __del__(self):
        EventBus().unregister('stop', self._on_stop)

    def _on_stop(self, *args, **kwargs):
        """EventBus callback for the 'stop' event; arguments are ignored."""
        self.stop()

    def on_message(self, message):
        """Delegate the message to the base-class implementation."""
        super().on_message(message)

    def on_handle(self, stream, index):
        """Queue one audio frame for the worker thread; ``index`` is unused."""
        self._queue.put(stream)

    def _on_run(self):
        """Worker loop: run steps until the exit event is cleared or stop() is called."""
        logger.info('chunk2mal run')
        while self._exit_event.is_set() and self._is_running:
            self._run_step()
            time.sleep(0.02)

        logger.info('chunk2mal exit')

    def _run_step(self):
        """Consume one batch of frames and emit the corresponding mel chunks.

        Reads ``batch_size * 2`` frames, forwarding each one downstream with
        index 0. If more frames are buffered than the combined left/right
        stride, computes the mel spectrogram of the whole buffer, slices it
        into windows of 16 columns and forwards the list with index 1.
        Afterwards only the last ``stride_left_size + stride_right_size``
        frames are kept in the buffer.
        """
        context = self._context
        for _ in range(context.batch_size * 2):
            frame, frame_type = self.get_audio_frame()
            self.frames.append(frame)
            self.on_next_handle((frame, frame_type), 0)

        if not self._is_running:
            return

        stride_total = context.stride_left_size + context.stride_right_size
        # Not enough buffered context yet: do not compute features.
        if len(self.frames) <= stride_total:
            return

        inputs = np.concatenate(self.frames)  # [N * chunk]
        mel = melspectrogram(inputs)
        mel_len = len(mel[0])

        # Skip the left stride.
        # NOTE(review): 80 / 50 presumably converts a frame count into mel
        # columns (80 mel columns/s vs. 50 frames/s) -- confirm.
        left = max(0, context.stride_left_size * 80 / 50)
        mel_idx_multiplier = 80. * 2 / context.fps
        mel_step_size = 16

        # One mel chunk per two non-stride frames.
        chunk_limit = (len(self.frames) - stride_total) / 2
        mel_chunks = []
        i = 0
        while i < chunk_limit and self._is_running:
            start_idx = int(left + i * mel_idx_multiplier)
            if start_idx + mel_step_size > mel_len:
                # Window would run past the end: take the last full window.
                mel_chunks.append(mel[:, mel_len - mel_step_size:])
            else:
                mel_chunks.append(mel[:, start_idx: start_idx + mel_step_size])
            i += 1
        self.on_next_handle(mel_chunks, 1)

        # Discard the old part to save memory. A zero stride needs an explicit
        # branch because frames[-0:] is the whole list, which would keep
        # every frame forever.
        self.frames = self.frames[-stride_total:] if stride_total else []

    def get_audio_frame(self):
        """Return the next ``(frame, type_)`` pair.

        ``type_`` is 0 for a frame taken from the queue. If the queue's
        ``get`` raises ``queue.Empty``, a zero-filled float32 frame of
        ``self.chunk`` samples is returned with ``type_`` 1.
        """
        try:
            frame = self._queue.get()
            type_ = 0
        except queue.Empty:
            frame = np.zeros(self.chunk, dtype=np.float32)
            type_ = 1
        return frame, type_

    def stop(self):
        """Ask the worker loop to exit and wait for the thread to finish."""
        logger.info('stop')
        self._is_running = False
        if self._exit_event is None:
            return

        self._exit_event.clear()
        if self._thread.is_alive():
            self._thread.join()
        logger.info('chunk2mal stop')

    def pause_talk(self):
        """Drop all frames still waiting in the queue."""
        print('AudioMalHandler pause_talk', self._queue.size())
        self._queue.clear()
modify audio mal handler 2024-10-15 13:00:24 +00:00			`#encoding = utf8`
			`import logging`
			`import queue`
			`import time`
modify render sync 2024-11-01 12:38:57 +00:00
modify add event bus 2024-11-06 03:11:53 +00:00			`from threading import Thread, Event`
			`from eventbus import EventBus`
modify audio mal handler 2024-10-15 13:00:24 +00:00
			`import numpy as np`

modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`from human_handler import AudioHandler`
modify use sync queue 2024-10-29 10:09:26 +00:00			`from utils import melspectrogram, SyncQueue`
modify audio mal handler 2024-10-15 13:00:24 +00:00
			`logger = logging.getLogger(__name__)`


			`class AudioMalHandler(AudioHandler):`
			`def __init__(self, context, handler):`
			`super().__init__(context, handler)`

modify add event bus 2024-11-06 03:11:53 +00:00			`EventBus().register('stop', self._on_stop)`

modify render sync 2024-11-01 12:38:57 +00:00			`self._queue = SyncQueue(context.batch_size, "AudioMalHandler_queue")`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`self._exit_event = Event()`
modify render sync 2024-11-01 12:38:57 +00:00			`self._thread = Thread(target=self._on_run, name="AudioMalHandlerThread")`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`self._exit_event.set()`
			`self._thread.start()`

			`self.frames = []`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`self.chunk = context.sample_rate // context.fps`
modify stop sync 2024-11-06 12:31:23 +00:00			`self._is_running = True`
modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`logger.info("AudioMalHandler init")`
modify audio mal handler 2024-10-15 13:00:24 +00:00
modify add event bus 2024-11-06 03:11:53 +00:00			`def __del__(self):`
			`EventBus().unregister('stop', self._on_stop)`

			`def _on_stop(self, args, *kwargs):`
			`self.stop()`

modify render vidoe async 2024-10-25 00:23:55 +00:00			`def on_message(self, message):`
modify use sync queue 2024-10-29 10:09:26 +00:00			`super().on_message(message)`
modify render vidoe async 2024-10-25 00:23:55 +00:00
modify audio mal handler 2024-10-15 13:00:24 +00:00			`def on_handle(self, stream, index):`
modify render sync 2024-11-01 12:38:57 +00:00			`# print('AudioMalHandler on_handle', index)`
modify audio handle 2024-10-16 11:04:12 +00:00			`self._queue.put(stream)`
modify audio mal handler 2024-10-15 13:00:24 +00:00
			`def _on_run(self):`
			`logging.info('chunk2mal run')`
modify stop sync 2024-11-06 12:31:23 +00:00			`while self._exit_event.is_set() and self._is_running:`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`self._run_step()`
modify render vidoe async 2024-10-25 00:23:55 +00:00			`time.sleep(0.02)`
modify audio mal handler 2024-10-15 13:00:24 +00:00
			`logging.info('chunk2mal exit')`

			`def _run_step(self):`
add temp commit 2024-10-31 00:15:49 +00:00			`count = 0`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`for _ in range(self._context.batch_size * 2):`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`frame, _type = self.get_audio_frame()`
			`self.frames.append(frame)`
modify audio handle 2024-10-16 11:04:12 +00:00			`self.on_next_handle((frame, _type), 0)`
add temp commit 2024-10-31 00:15:49 +00:00			`count = count + 1`
modify stop sync 2024-11-06 12:31:23 +00:00
			`if self._is_running is False:`
			`return`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`# context not enough, do not run network.`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`if len(self.frames) <= self._context.stride_left_size + self._context.stride_right_size:`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`return`

modify render sync 2024-11-01 12:38:57 +00:00			`# print('AudioMalHandler _run_step', count)`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`inputs = np.concatenate(self.frames) # [N * chunk]`
add audio inferance handler and about codes 2024-10-16 00:01:11 +00:00			`mel = melspectrogram(inputs)`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`# print(mel.shape[0],mel.shape,len(mel[0]),len(self.frames))`
			`# cut off stride`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`left = max(0, self._context.stride_left_size * 80 / 50)`
add temp commit 2024-10-30 12:07:04 +00:00			`right = min(len(mel[0]), len(mel[0]) - self._context.stride_right_size * 80 / 50)`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`mel_idx_multiplier = 80. * 2 / self._context.fps`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`mel_step_size = 16`
			`i = 0`
			`mel_chunks = []`
modify stop sync 2024-11-06 12:31:23 +00:00			`while i < (len(self.frames) - self._context.stride_left_size - self._context.stride_right_size) / 2\`
			`and self._is_running:`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`start_idx = int(left + i * mel_idx_multiplier)`
			`# print(start_idx)`
			`if start_idx + mel_step_size > len(mel[0]):`
			`mel_chunks.append(mel[:, len(mel[0]) - mel_step_size:])`
			`else:`
			`mel_chunks.append(mel[:, start_idx: start_idx + mel_step_size])`
			`i += 1`
modify audio handle 2024-10-16 11:04:12 +00:00			`self.on_next_handle(mel_chunks, 1)`
modify audio mal handler 2024-10-15 13:00:24 +00:00
			`# discard the old part to save memory`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`self.frames = self.frames[-(self._context.stride_left_size + self._context.stride_right_size):]`
modify audio mal handler 2024-10-15 13:00:24 +00:00
			`def get_audio_frame(self):`
			`try:`
modify render sync 2024-11-01 12:38:57 +00:00			`# print('AudioMalHandler get_audio_frame')`
use pygame to render 2024-11-04 13:44:51 +00:00			`frame = self._queue.get()`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`type_ = 0`
			`except queue.Empty:`
			`frame = np.zeros(self.chunk, dtype=np.float32)`
			`type_ = 1`
modify render sync 2024-11-01 12:38:57 +00:00			`# print('AudioMalHandler get_audio_frame type:', type_)`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`return frame, type_`

			`def stop(self):`
			`logging.info('stop')`
modify stop sync 2024-11-06 12:31:23 +00:00			`self._is_running = False`
modify audio mal handler 2024-10-15 13:00:24 +00:00			`if self._exit_event is None:`
			`return`

			`self._exit_event.clear()`
			`if self._thread.is_alive():`
			`self._thread.join()`
			`logging.info('chunk2mal stop')`
modify pause talk 2024-10-19 19:28:49 +00:00
			`def pause_talk(self):`
modify render delay 2024-10-31 13:38:35 +00:00			`print('AudioMalHandler pause_talk', self._queue.size())`
modify use sync queue 2024-10-29 10:09:26 +00:00			`self._queue.clear()`