modify render and ncnn asr to ask

This commit is contained in:
jiegeaiai 2024-11-25 01:03:29 +08:00
parent 7ae1432312
commit 7c1104a9ac
4 changed files with 62 additions and 53 deletions

View File

@@ -63,15 +63,6 @@ class SherpaNcnnAsr(AsrBase):
logger.info(f'_recognize_loop')
print(f'_recognize_loop')
while self._stop_event.is_set():
logger.info(f'_recognize_loop000')
self._notify_complete('介绍中国5000年历史文学')
logger.info(f'_recognize_loop111')
segment_id += 1
time.sleep(150)
logger.info(f'_recognize_loop222')
logger.info(f'_recognize_loop exit')
'''
with sd.InputStream(channels=1, dtype="float32", samplerate=self._sample_rate) as s:
while self._stop_event.is_set():
samples, _ = s.read(self._samples_per_read) # a blocking read
@@ -94,3 +85,13 @@ class SherpaNcnnAsr(AsrBase):
self._recognizer.reset()
'''
while self._stop_event.is_set():
logger.info(f'_recognize_loop000')
self._notify_complete('介绍中国5000年历史文学')
logger.info(f'_recognize_loop111')
segment_id += 1
time.sleep(150)
logger.info(f'_recognize_loop222')
logger.info(f'_recognize_loop exit')
'''
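The net effect of the two hunks above is that the hard-coded test loop in _recognize_loop moves from before the commented-out sd.InputStream microphone code to after it: while _stop_event is set, the recognizer reports the fixed phrase '介绍中国5000年历史文学' (roughly, "introduce China's 5,000 years of history and literature") every 150 seconds instead of doing real recognition. A minimal sketch of the resulting behaviour, using only the names visible in the diff (the AsrBase plumbing around it is assumed):

import threading
import time


class StubAsr:
    # Sketch of the stubbed loop above; not the project's actual class.
    def __init__(self, notify):
        self._stop_event = threading.Event()
        self._stop_event.set()          # the loop runs while the event is set
        self._notify_complete = notify

    def _recognize_loop(self):
        segment_id = 0
        while self._stop_event.is_set():
            # Emit a fixed test utterance instead of reading the microphone.
            self._notify_complete('介绍中国5000年历史文学')
            segment_id += 1
            time.sleep(150)             # one fake "recognition" every 150 s

Calling StubAsr(print)._recognize_loop() would print the phrase every 150 seconds until _stop_event is cleared from another thread.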

View File

@@ -48,7 +48,7 @@ class HumanRender(AudioHandler):
logging.info('human render run')
while self._exit_event.is_set() and self._is_running:
self._run_step()
delay = 0.03
delay = 0.04
time.sleep(delay)
logging.info('human render exit')
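The only functional change in this file is the per-step delay, raised from 0.03 s to 0.04 s, which slows the render loop from roughly 33 to 25 iterations per second. A fixed time.sleep(delay) also ignores however long _run_step() itself takes, so the effective rate ends up somewhat lower; a small illustrative sketch (hypothetical helper, not part of this commit) that subtracts the step time from the sleep:

import time


def paced_loop(run_step, keep_running, interval=0.04):
    # Aim for ~1/interval steps per second by sleeping only for whatever
    # time is left in the interval after run_step() returns.
    next_tick = time.perf_counter()
    while keep_running():
        run_step()
        next_tick += interval
        time.sleep(max(0.0, next_tick - time.perf_counter()))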

View File

@@ -9,23 +9,6 @@ import numpy as np
from .base_render import BaseRender
def img_warp_back_inv_m(img, img_to, inv_m):
h_up, w_up, c = img_to.shape
t = time.perf_counter()
mask = np.ones_like(img).astype(np.float32)
inv_mask = cv2.warpAffine(mask, inv_m, (w_up, h_up))
inv_img = cv2.warpAffine(img, inv_m, (w_up, h_up))
mask_indices = inv_mask == 1
print(f'time1: {time.perf_counter() - t}')
if 4 == c:
t = time.perf_counter()
img_to[:, :, :3][mask_indices] = inv_img[mask_indices]
print(f'time2: {time.perf_counter() - t}')
else:
img_to[inv_mask == 1] = inv_img[inv_mask == 1]
return img_to
class VideoRender(BaseRender):
def __init__(self, play_clock, context, human_render):
super().__init__(play_clock, context, 'Video')
@@ -33,27 +16,8 @@ class VideoRender(BaseRender):
self.index = 0
def render(self, frame, ps):
res_frame, idx, type_ = frame
if type_ == 0:
combine_frame = self._context.frame_list_cycle[idx]
else:
bbox = self._context.coord_list_cycle[idx]
combine_frame = copy.deepcopy(self._context.frame_list_cycle[idx])
af = self._context.align_frames[idx]
inv_m = self._context.inv_m_frames[idx]
y1, y2, x1, x2 = bbox
try:
t = time.perf_counter()
res_frame = cv2.resize(res_frame.astype(np.uint8), (x2 - x1, y2 - y1))
af[y1:y2, x1:x2] = res_frame
combine_frame = img_warp_back_inv_m(af, combine_frame, inv_m)
print(time.perf_counter() - t)
except Exception as e:
logging.error(f'resize error:{e}')
return
image = combine_frame
# image = cv2.cvtColor(image, cv2.COLOR_BGRA2RGBA)
if self._human_render is not None:
self._human_render.put_image(image)
self._human_render.put_image(frame)
# image = cv2.cvtColor(image, cv2.COLOR_BGRA2RGBA)
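Taken together, these hunks strip the warp-back and compositing work out of VideoRender: render() now forwards the raw (res_frame, idx, type_) tuple untouched to put_image(), and the removed img_warp_back_inv_m plus the bbox/resize logic reappear as render_image() in the pygame UI module in the next file. Reconstructed from the diff, the class now reads roughly as below; lines outside the hunks, such as the _human_render assignment, are assumed rather than shown:

from .base_render import BaseRender


class VideoRender(BaseRender):
    def __init__(self, play_clock, context, human_render):
        super().__init__(play_clock, context, 'Video')
        self._human_render = human_render   # assumed, not visible in the hunk
        self.index = 0

    def render(self, frame, ps):
        # frame is the raw (res_frame, idx, type_) tuple; compositing is now
        # deferred to render_image() on the UI side.
        if self._human_render is not None:
            self._human_render.put_image(frame)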

View File

@@ -1,6 +1,8 @@
#encoding = utf8
import copy
import logging
import os
import time
from queue import Queue
import cv2
@@ -15,17 +17,54 @@ logger = logging.getLogger(__name__)
current_file_path = os.path.dirname(os.path.abspath(__file__))
def img_warp_back_inv_m(img, img_to, inv_m):
h_up, w_up, c = img_to.shape
mask = np.ones_like(img).astype(np.float32)
inv_mask = cv2.warpAffine(mask, inv_m, (w_up, h_up))
inv_img = cv2.warpAffine(img, inv_m, (w_up, h_up))
mask_indices = inv_mask == 1
if 4 == c:
img_to[:, :, :3][mask_indices] = inv_img[mask_indices]
else:
img_to[inv_mask == 1] = inv_img[inv_mask == 1]
return img_to
def render_image(context, frame):
res_frame, idx, type_ = frame
if type_ == 0:
combine_frame = context.frame_list_cycle[idx]
else:
bbox = context.coord_list_cycle[idx]
combine_frame = copy.deepcopy(context.frame_list_cycle[idx])
af = context.align_frames[idx]
inv_m = context.inv_m_frames[idx]
y1, y2, x1, x2 = bbox
try:
t = time.perf_counter()
res_frame = cv2.resize(res_frame.astype(np.uint8), (x2 - x1, y2 - y1))
af[y1:y2, x1:x2] = res_frame
combine_frame = img_warp_back_inv_m(af, combine_frame, inv_m)
except Exception as e:
logging.error(f'resize error:{e}')
return
image = combine_frame
return image
class PyGameUI:
def __init__(self):
self._human_context = None
self._queue = None
self.screen_ = pygame.display.set_mode((800, 600), HWSURFACE | DOUBLEBUF | RESIZABLE)
self.screen_ = pygame.display.set_mode((1920, 1080), HWSURFACE | DOUBLEBUF | RESIZABLE)
self.clock = pygame.time.Clock()
background = os.path.join(current_file_path, '..', 'data', 'background', 'background.jpg')
logger.info(f'background: {background}')
self._background = pygame.image.load(background).convert()
self.background_display_ = pygame.transform.scale(self._background, (800, 600))
self.background_display_ = pygame.transform.scale(self._background, (1920, 1080))
self._human_image = None
self.running = True
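Both the window and the scaled background jump from 800x600 to 1920x1080 in this hunk. Because the size is hard-coded in two places, an illustrative sketch (not part of this commit) that reads the size back from the created window keeps the two from drifting apart:

import os

import pygame
from pygame.locals import DOUBLEBUF, HWSURFACE, RESIZABLE

pygame.init()
screen = pygame.display.set_mode((1920, 1080), HWSURFACE | DOUBLEBUF | RESIZABLE)
# Placeholder path standing in for the data/background/background.jpg lookup above.
background_path = os.path.join('data', 'background', 'background.jpg')
background = pygame.image.load(background_path).convert()
# Scale to whatever size the window actually ended up with.
background_display = pygame.transform.scale(background, screen.get_size())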
@@ -48,7 +87,7 @@ class PyGameUI:
self.screen_.blit(self.background_display_, (0, 0))
self._update_human()
if self._human_image is not None:
self.screen_.blit(self._human_image, (0, -200))
self.screen_.blit(self._human_image, (760, -300))
fps = self.clock.get_fps()
pygame.display.set_caption('fps:{:.2f}'.format(fps))
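The human image is now blitted at a fixed (760, -300) offset tuned for the new 1920-wide window. An illustrative alternative (not in this commit) is to centre the overlay horizontally from the surface widths, so the offset survives future resolution changes:

def blit_centered(screen, overlay, y=-300):
    # Hypothetical helper: centre the overlay horizontally instead of
    # hard-coding x=760 for a 1920-pixel-wide window.
    x = (screen.get_width() - overlay.get_width()) // 2
    screen.blit(overlay, (x, y))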
@@ -59,7 +98,12 @@ class PyGameUI:
def _update_human(self):
if self._queue.empty():
return
if self._queue.qsize() > 5:
print('render queue is slower')
image = self._queue.get()
image = render_image(self._human_context, image)
color_format = "RGB"
if 4 == image.shape[2]:
color_format = "RGBA"
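The hunk ends right after a format string ('RGB' or 'RGBA') is picked from the frame's channel count, alongside the new warning when more than five frames are queued. The step that presumably follows, turning the composited numpy frame into a pygame surface, is not shown; a hedged sketch of that conversion, assuming the standard pygame.image.frombuffer API and that the frame is already in the expected channel order:

import numpy as np
import pygame


def to_surface(image: np.ndarray, color_format: str) -> pygame.Surface:
    # frombuffer expects (width, height), while numpy frames are (height, width, channels).
    h, w = image.shape[:2]
    return pygame.image.frombuffer(image.tobytes(), (w, h), color_format)

The commented-out cv2.cvtColor lines elsewhere in the diff suggest the frames may still be in OpenCV's BGR/BGRA order, so whether a colour conversion is needed before blitting depends on code outside this hunk.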