human/ui.py

#encoding = utf8
import json
import logging
import os
import queue
from logging import handlers
import tkinter
import tkinter.messagebox
from queue import Queue

import customtkinter
import cv2
import requests
import winsound
from PIL import Image, ImageTk

from playsound import playsound

from audio_render import AudioRender
# from Human import Human
from human import HumanContext
from utils import config_logging

# from tts.EdgeTTS import EdgeTTS

logger = logging.getLogger(__name__)

customtkinter.set_appearance_mode("System")  # Modes: "System" (standard), "Dark", "Light"
customtkinter.set_default_color_theme("green")  # Themes: "blue" (standard), "green", "dark-blue"


class App(customtkinter.CTk):
    def __init__(self):
        super().__init__()

        self._tts_url = 'http://localhost:8080'

        # configure window
        self.title("TTS demo")
        self.geometry(f"{1100}x{580}")

        self.grid_columnconfigure(1, weight=1)
        self.grid_rowconfigure((0, 1), weight=1)

        self.image_frame = customtkinter.CTkFrame(self, corner_radius=10)
        self.image_frame.grid(row=0, column=0, rowspan=2, columnspan=3,
                                padx=(20, 20), pady=(20, 0), sticky="nsew")
        self.image_frame.grid_rowconfigure(0, weight=1)
        self.logo_label = customtkinter.CTkLabel(self.image_frame, text="CustomTkinter",
                                                 font=customtkinter.CTkFont(size=20, weight="bold"))
        # self.logo_label.grid(row=0, column=0, padx=20, pady=(20, 10))

        self.entry = customtkinter.CTkEntry(self, placeholder_text="输入内容")
        self.entry.insert(0, "大家好，测试虚拟数字人。")
        self.entry.grid(row=2, column=0, columnspan=2, padx=(20, 0), pady=(20, 20), sticky="nsew")

        self.main_button_1 = customtkinter.CTkButton(master=self, fg_color="transparent", border_width=2,
                                                     text_color=("gray10", "#DCE4EE"), text='发送',
                                                     command=self.request_tts)
        self.main_button_1.grid(row=2, column=2, padx=(20, 20), pady=(20, 20), sticky="nsew")

        self._init_image_canvas()

        self._audio_render = AudioRender()
        # self._human = Human()
        self._queue = Queue()
        self._human_context = HumanContext()
        self._human_context.build()
        render = self._human_context.render_handler
        render.set_image_render(self)
        render.set_audio_render(self._audio_render)
        self._render()
        # self.play_audio()

    def destroy(self):
        self.on_destroy()
        super().destroy()

    def on_destroy(self):
        logger.info('------------App destroy------------')
        # self._human.on_destroy()

    def render_image(self, image):
        self._queue.put(image)

    def _init_image_canvas(self):
        self._canvas = customtkinter.CTkCanvas(self.image_frame)
        self._canvas.pack(fill=customtkinter.BOTH, expand=customtkinter.YES)

    def _render(self):
        after_time = 29
        try:
            image = self._queue.get(block=True, timeout=0.003)
            if image is None:
                self.after(after_time, self._render)
                return
        except queue.Empty:
            self.after(after_time, self._render)
            return

        iheight, iwidth = image.shape[0], image.shape[1]
        width = self.winfo_width()
        height = self.winfo_height()
        if iheight / iwidth >= width / height:
            image = cv2.resize(image, (int(width), int(iheight * width / iwidth)))
        else:
            image = cv2.resize(image, (int(iwidth * height / iheight), int(height)), interpolation=cv2.INTER_AREA)
        img = Image.fromarray(image)

        imgtk = ImageTk.PhotoImage(image=img)

        self._canvas.delete("all")

        self._canvas.imgtk = imgtk
        width = self.winfo_width() * 0.5
        height = self.winfo_height() * 0.5
        self._canvas.create_image(width, height, anchor=customtkinter.CENTER, image=imgtk)
        self._canvas.update()
        self.after(after_time, self._render)

    def request_tts(self):
        content = self.entry.get()
        # content = ''
        print('content:', content)
        self.entry.delete(0, customtkinter.END)
        self._human.pause_talk()
        self._human.read(content)
        # payload = {
        #   'text': content,
        #   'voice': 'zh-CN-XiaoyiNeural'
        # }
        # resp = requests.get(self._tts_url + '/tts', params=urlencode(payload))
        # if resp.status_code != 200:
        #     print('tts error', resp.status_code)
        #     return
        #
        # print(resp.content)
        #
        # resJson = json.loads(resp.text)
        # url = resJson.get('url')
        # self.download_tts(url)

    def download_tts(self, url):
        file_name = url[3:]
        print(file_name)
        download_url = self._tts_url + url
        print('download tts', download_url)
        resp = requests.get(download_url)
        with open('./audio/mp3/' + file_name, 'wb') as mp3:
            mp3.write(resp.content)

        from pydub import AudioSegment
        sound = AudioSegment.from_mp3('./audio/mp3/' + file_name)
        sound.export('./audio/wav/' + file_name + '.wav', format="wav")

    def on_render(self, image):
        self._queue.put(image)
        print('on_render', self._queue.qsize())


if __name__ == "__main__":
    # logging.basicConfig(filename='./logs/info.log', level=logging.INFO)
    config_logging('./logs/info.log', logging.INFO, logging.INFO)

    logger.info('------------start------------')
    app = App()
    app.mainloop()
    # app.on_destroy()
    logger.info('------------exit------------')
首次添加数字人 2024-09-02 00:13:34 +00:00			`#encoding = utf8`
			`import json`
			`import logging`
修改tts录制文件 2024-09-26 12:28:49 +00:00			`import os`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`import queue`
添加chunk处理 2024-09-04 16:51:14 +00:00			`from logging import handlers`
首次添加数字人 2024-09-02 00:13:34 +00:00			`import tkinter`
			`import tkinter.messagebox`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`from queue import Queue`

首次添加数字人 2024-09-02 00:13:34 +00:00			`import customtkinter`
modify ui to render 2024-09-25 06:37:15 +00:00			`import cv2`
首次添加数字人 2024-09-02 00:13:34 +00:00			`import requests`
修改tts录制文件 2024-09-26 12:28:49 +00:00			`import winsound`
modify human load face 2024-09-12 00:15:09 +00:00			`from PIL import Image, ImageTk`
首次添加数字人 2024-09-02 00:13:34 +00:00
修改tts录制文件 2024-09-26 12:28:49 +00:00			`from playsound import playsound`

modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`from audio_render import AudioRender`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`# from Human import Human`
			`from human import HumanContext`
modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`from utils import config_logging`

modify path and proptry access 2024-10-17 00:25:53 +00:00			`# from tts.EdgeTTS import EdgeTTS`
首次添加数字人 2024-09-02 00:13:34 +00:00
			`logger = logging.getLogger(__name__)`

			`customtkinter.set_appearance_mode("System") # Modes: "System" (standard), "Dark", "Light"`
			`customtkinter.set_default_color_theme("green") # Themes: "blue" (standard), "green", "dark-blue"`


			`class App(customtkinter.CTk):`
			`def __init__(self):`
			`super().__init__()`

			`self._tts_url = 'http://localhost:8080'`

			`# configure window`
修改tts录制文件 2024-09-26 12:28:49 +00:00			`self.title("TTS demo")`
首次添加数字人 2024-09-02 00:13:34 +00:00			`self.geometry(f"{1100}x{580}")`

			`self.grid_columnconfigure(1, weight=1)`
			`self.grid_rowconfigure((0, 1), weight=1)`

			`self.image_frame = customtkinter.CTkFrame(self, corner_radius=10)`
			`self.image_frame.grid(row=0, column=0, rowspan=2, columnspan=3,`
			`padx=(20, 20), pady=(20, 0), sticky="nsew")`
			`self.image_frame.grid_rowconfigure(0, weight=1)`
			`self.logo_label = customtkinter.CTkLabel(self.image_frame, text="CustomTkinter",`
			`font=customtkinter.CTkFont(size=20, weight="bold"))`
			`# self.logo_label.grid(row=0, column=0, padx=20, pady=(20, 10))`

			`self.entry = customtkinter.CTkEntry(self, placeholder_text="输入内容")`
modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`self.entry.insert(0, "大家好，测试虚拟数字人。")`
首次添加数字人 2024-09-02 00:13:34 +00:00			`self.entry.grid(row=2, column=0, columnspan=2, padx=(20, 0), pady=(20, 20), sticky="nsew")`

			`self.main_button_1 = customtkinter.CTkButton(master=self, fg_color="transparent", border_width=2,`
			`text_color=("gray10", "#DCE4EE"), text='发送',`
			`command=self.request_tts)`
			`self.main_button_1.grid(row=2, column=2, padx=(20, 20), pady=(20, 20), sticky="nsew")`

			`self._init_image_canvas()`

modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`self._audio_render = AudioRender()`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`# self._human = Human()`
			`self._queue = Queue()`
			`self._human_context = HumanContext()`
			`self._human_context.build()`
			`render = self._human_context.render_handler`
			`render.set_image_render(self)`
modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`render.set_audio_render(self._audio_render)`
modify human load face 2024-09-12 00:15:09 +00:00			`self._render()`
修改tts录制文件 2024-09-26 12:28:49 +00:00			`# self.play_audio()`
首次添加数字人 2024-09-02 00:13:34 +00:00
try close infer 2024-10-04 10:10:03 +00:00			`def destroy(self):`
			`self.on_destroy()`
			`super().destroy()`

添加chunk处理 2024-09-04 16:51:14 +00:00			`def on_destroy(self):`
			`logger.info('------------App destroy------------')`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`# self._human.on_destroy()`

			`def render_image(self, image):`
			`self._queue.put(image)`
修改tts录制文件 2024-09-26 12:28:49 +00:00
首次添加数字人 2024-09-02 00:13:34 +00:00			`def _init_image_canvas(self):`
			`self._canvas = customtkinter.CTkCanvas(self.image_frame)`
			`self._canvas.pack(fill=customtkinter.BOTH, expand=customtkinter.YES)`

modify human load face 2024-09-12 00:15:09 +00:00			`def _render(self):`
modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`after_time = 29`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`try:`
modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`image = self._queue.get(block=True, timeout=0.003)`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`if image is None:`
modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`self.after(after_time, self._render)`
modify path and proptry access 2024-10-17 00:25:53 +00:00			`return`
			`except queue.Empty:`
modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`self.after(after_time, self._render)`
modify human load face 2024-09-12 00:15:09 +00:00			`return`

modify ui to render 2024-09-25 06:37:15 +00:00			`iheight, iwidth = image.shape[0], image.shape[1]`
			`width = self.winfo_width()`
			`height = self.winfo_height()`
			`if iheight / iwidth >= width / height:`
			`image = cv2.resize(image, (int(width), int(iheight * width / iwidth)))`
			`else:`
			`image = cv2.resize(image, (int(iwidth * height / iheight), int(height)), interpolation=cv2.INTER_AREA)`
modify human load face 2024-09-12 00:15:09 +00:00			`img = Image.fromarray(image)`
modify ui to render 2024-09-25 06:37:15 +00:00
modify human load face 2024-09-12 00:15:09 +00:00			`imgtk = ImageTk.PhotoImage(image=img)`

			`self._canvas.delete("all")`

			`self._canvas.imgtk = imgtk`
			`width = self.winfo_width() * 0.5`
			`height = self.winfo_height() * 0.5`
			`self._canvas.create_image(width, height, anchor=customtkinter.CENTER, image=imgtk)`
			`self._canvas.update()`
modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`self.after(after_time, self._render)`
modify human load face 2024-09-12 00:15:09 +00:00
首次添加数字人 2024-09-02 00:13:34 +00:00			`def request_tts(self):`
			`content = self.entry.get()`
add audio render 2024-09-28 18:47:04 +00:00			`# content = ''`
首次添加数字人 2024-09-02 00:13:34 +00:00			`print('content:', content)`
			`self.entry.delete(0, customtkinter.END)`
添加打断逻辑 2024-10-04 08:44:06 +00:00			`self._human.pause_talk()`
添加chunk处理 2024-09-04 16:51:14 +00:00			`self._human.read(content)`
			`# payload = {`
			`# 'text': content,`
			`# 'voice': 'zh-CN-XiaoyiNeural'`
			`# }`
			`# resp = requests.get(self._tts_url + '/tts', params=urlencode(payload))`
			`# if resp.status_code != 200:`
			`# print('tts error', resp.status_code)`
			`# return`
			`#`
			`# print(resp.content)`
			`#`
			`# resJson = json.loads(resp.text)`
			`# url = resJson.get('url')`
			`# self.download_tts(url)`
首次添加数字人 2024-09-02 00:13:34 +00:00
			`def download_tts(self, url):`
			`file_name = url[3:]`
			`print(file_name)`
			`download_url = self._tts_url + url`
			`print('download tts', download_url)`
			`resp = requests.get(download_url)`
			`with open('./audio/mp3/' + file_name, 'wb') as mp3:`
			`mp3.write(resp.content)`

			`from pydub import AudioSegment`
			`sound = AudioSegment.from_mp3('./audio/mp3/' + file_name)`
			`sound.export('./audio/wav/' + file_name + '.wav', format="wav")`

modify ui and nlp tts code 2024-10-17 15:26:21 +00:00			`def on_render(self, image):`
			`self._queue.put(image)`
			`print('on_render', self._queue.qsize())`
添加chunk处理 2024-09-04 16:51:14 +00:00

			`if __name__ == "__main__":`
			`# logging.basicConfig(filename='./logs/info.log', level=logging.INFO)`
			`config_logging('./logs/info.log', logging.INFO, logging.INFO)`
merge overide 2024-09-09 00:30:15 +00:00
添加chunk处理 2024-09-04 16:51:14 +00:00			`logger.info('------------start------------')`
首次添加数字人 2024-09-02 00:13:34 +00:00			`app = App()`
			`app.mainloop()`
try close infer 2024-10-04 10:10:03 +00:00			`# app.on_destroy()`
			`logger.info('------------exit------------')`