modify ipc

2024-12-05 00:47:17 +08:00 · 2024-12-05 00:47:17 +08:00 · 322ff33c84
commit 322ff33c84
parent 2a2a3cd349
12 changed files with 117 additions and 21 deletions
--- a/human/init.py
+++ b/human/init.py
@ -4,4 +4,5 @@ from .human_context import HumanContext
 from .audio_mal_handler import AudioMalHandler
 from .audio_inference_handler import AudioInferenceHandler
 from .audio_inference_onnx_handler import AudioInferenceOnnxHandler
+from .huaman_status import HumanStatusEnum, HumanStatus
 from .human_render import HumanRender
--- a/human/audio_inference_handler.py
+++ b/human/audio_inference_handler.py
@ -6,10 +6,12 @@ import time
 from queue import Queue
 from threading import Event, Thread

+import cv2
 import numpy as np
 import torch

 from eventbus import EventBus
+from human import HumanStatus
 from human_handler import AudioHandler
 from utils import load_model, mirror_index, get_device, SyncQueue

@ -67,12 +69,13 @@ class AudioInferenceHandler(AudioHandler):
        logger.info("Model loaded")

        face_list_cycle = self._context.face_list_cycle
-
        length = len(face_list_cycle)
        index = 0
        count = 0
        count_time = 0
        logger.info('start inference')
+        silence_length = 133
+        human_status = HumanStatus(length, silence_length)

        device = get_device()
        logger.info(f'use device:{device}')
@ -107,11 +110,13 @@ class AudioInferenceHandler(AudioHandler):
                    for i in range(batch_size):
                        if not self._is_running:
                            break
-                        self.on_next_handle((None, mirror_index(length, index), audio_frames[i * 2:i * 2 + 2]),
-                                            0)
+                        # self.on_next_handle((None, mirror_index(silence_length, index),
+                        self.on_next_handle((None, human_status.get_index(),
+                                             audio_frames[i * 2:i * 2 + 2]), 0)
                        index = index + 1
                else:
                    logger.info(f'infer======= {current_text}')
+                    human_status.try_to_talk()
                    t = time.perf_counter()
                    img_batch = []
                    # for i in range(batch_size):
--- a/human/audio_inference_onnx_handler.py
+++ b/human/audio_inference_onnx_handler.py
@ -5,7 +5,9 @@ import queue
 import time
 from threading import Event, Thread

- # from gfpgan import GFPGANer
+import cv2
+
+# from gfpgan import GFPGANer
 from eventbus import EventBus
 from human_handler import AudioHandler
 from utils import load_model, mirror_index, get_device, SyncQueue
@ -93,9 +95,9 @@ class AudioInferenceOnnxHandler(AudioHandler):
        gfpgan_model = load_gfpgan_model(gfpgan_model_path)

        face_list_cycle = self._context.face_list_cycle
-
-
        length = len(face_list_cycle)
+        for i in range(length):
+            cv2.imwrite(f'face_{i}.png', face_list_cycle[i])
        index = 0
        count = 0
        count_time = 0
@ -157,18 +159,6 @@ class AudioInferenceOnnxHandler(AudioHandler):
                    onnx_out = model_g.run(onnx_names, onnx_input)[0]
                    pred = onnx_out

-                    # onnxruntime_inputs = {"audio_seqs__0": mel_batch, }
-                    # onnxruntime_names = [output.name for output in model_a.get_outputs()]
-                    # embeddings = model_a.run(onnxruntime_names, onnxruntime_inputs)[0]
-                    #
-                    # onnxruntime_inputs = {"audio_embedings__0": embeddings, "img_seqs__1": img_batch}
-                    # onnxruntime_names = [output.name for output in model_g.get_outputs()]
-                    #
-                    # start_model = time.time()
-                    # onnxruntime_output = model_g.run(onnxruntime_names, onnxruntime_inputs)[0]
-                    # end_model = time.time()
-                    # pred = onnxruntime_output
-
                    count_time += (time.perf_counter() - t)
                    count += batch_size

--- a/human/huaman_status.py
+++ b/human/huaman_status.py
@ -0,0 +1,36 @@
+#encoding = utf8
+
+import logging
+
+
+from enum import Enum
+
+
+class HumanStatusEnum(Enum):
+    silence = 1
+    talking = 2
+
+
+class HumanStatus:
+    def __init__(self, total_frames=0, last_silence_frame=0):
+        self._status = HumanStatusEnum.silence
+        self._total_frames = total_frames
+        self._last_silence_frame = last_silence_frame
+        self._current_frame = 0
+
+    def get_status(self):
+        return self._status
+
+    def set_status(self, status):
+        self._status = status
+        return self._status
+
+    def try_to_talk(self):
+        if self._status == HumanStatusEnum.silence:
+            if self._current_frame - self._last_silence_frame < 0:
+                return False
+            self._status = HumanStatusEnum.talking
+        return True
+
+    def get_index(self):
+        return self._total_frames
--- a/ipc/ipc.dll
+++ b/ipc/ipc.dll
--- a/ipc/ipc.exp
+++ b/ipc/ipc.exp
--- a/ipc/ipc.lib
+++ b/ipc/ipc.lib
--- a/ipc/ipc.pdb
+++ b/ipc/ipc.pdb
--- a/ipc/ipc_mem.py
+++ b/ipc/ipc_mem.py
@ -0,0 +1,62 @@
+#encoding = utf8
+
+import logging
+import os
+
+from ctypes import *
+
+current = os.path.dirname(__file__)
+dynamic_path = os.path.join(current, 'ipc.dll')
+
+
+class IPCMem:
+    def __init__(self, sender, receiver):
+        self.__ipc_obj = WinDLL(dynamic_path)
+        print(self.__ipc_obj)
+        if self.__ipc_obj is not None:
+            self.__ipc_obj.initialize.argtypes = [c_char_p, c_char_p]
+            self.__ipc_obj.initialize.restype = c_bool
+            print('IPCUtil init', sender.encode('utf-8'), receiver.encode('utf-8'))
+            self.__init = self.__ipc_obj.initialize(sender.encode('utf-8'), receiver.encode('utf-8'))
+            print('IPCUtil init', self.__init)
+
+    def __del__(self):
+        print('IPCUtil __del__')
+        if self.__ipc_obj is None:
+            return
+        if self.__init:
+            self.__ipc_obj.uninitialize()
+
+    def listen(self):
+        if not self.__init:
+            return False
+        self.__ipc_obj.listen.restype = c_bool
+        return self.__ipc_obj.listen()
+
+    def send_text(self, data):
+        if not self.__init:
+            return False
+        self.__ipc_obj.send.argtypes = [c_char_p, c_uint]
+        self.__ipc_obj.send.restype = c_bool
+        send_data = data.encode('utf-8')
+        send_len = len(send_data) + 1
+        if not self.__ipc_obj.send(send_data, send_len):
+            self.__ipc_obj.reConnect()
+        return True
+
+    def send_binary(self, data, size):
+        if not self.__init:
+            return False
+        self.__ipc_obj.send.argtypes = [c_char_p, c_uint]
+        self.__ipc_obj.send.restype = c_bool
+        data_ptr = cast(data, c_char_p)
+        return self.__ipc_obj.send(data_ptr, size)
+
+    def set_reader_callback(self, callback):
+        if not self.__init:
+            return False
+        CALLBACK_TYPE = CFUNCTYPE(None, c_char_p, c_uint)
+        self.c_callback = CALLBACK_TYPE(callback)  # Store the callback to prevent garbage collection
+        self.__ipc_obj.setReaderCallback.argtypes = [CALLBACK_TYPE]
+        self.__ipc_obj.setReaderCallback.restype = c_bool
+        return self.__ipc_obj.setReaderCallback(self.c_callback)
--- a/ipc/ipc_util.py
+++ b/ipc/ipc_util.py
@ -38,7 +38,7 @@ class IPCUtil:
        self.__ipc_obj.send.restype = c_bool
        send_data = data.encode('utf-8')
        send_len = len(send_data) + 1
-        if not self.__ipc_obj.send(send_data, send_len):
+        if not self.__ipc_obj.trySend(send_data, send_len):
            self.__ipc_obj.reConnect()
        return True

@ -48,7 +48,7 @@ class IPCUtil:
        self.__ipc_obj.send.argtypes = [c_char_p, c_uint]
        self.__ipc_obj.send.restype = c_bool
        data_ptr = cast(data, c_char_p)
-        return self.__ipc_obj.send(data_ptr, size)
+        return self.__ipc_obj.trySend(data_ptr, size)

    def set_reader_callback(self, callback):
        if not self.__init:
--- a/main.py
+++ b/main.py
@ -15,4 +15,5 @@ if __name__ == '__main__':
    logger.info('------------start------------')
    render = IpcRender()
    render.run()
+    render.stop()
    logger.info('------------finish------------')
--- a/ui/ipc_render.py
+++ b/ui/ipc_render.py
@ -64,7 +64,8 @@ class IpcRender:
        logger.info('ipc render exit')

    def stop(self):
-        pass
+        if self._human_context is not None:
+            self._human_context.stop()

    def on_render(self, image):
        self._queue.put(image)