human/nlp/nlp_doubao.py

171 lines
6.3 KiB
Python
Raw Normal View History

#encoding = utf8
2024-11-08 07:23:44 +00:00
import json
2024-10-10 11:01:13 +00:00
import logging
import time
2024-11-08 07:23:44 +00:00
import requests
from nlp.nlp_base import NLPBase
from volcenginesdkarkruntime import AsyncArk
2024-10-10 11:01:13 +00:00
logger = logging.getLogger(__name__)
2024-11-08 07:23:44 +00:00
class DouBaoSDK:
def __init__(self, token):
self._token = token
self.__client = AsyncArk(api_key=token)
self._stream = None
2024-11-16 02:13:11 +00:00
def request(self, question, handle, callback):
2024-11-08 07:23:44 +00:00
if self.__client is None:
self.__client = AsyncArk(api_key=self._token)
t = time.time()
2024-10-17 15:26:21 +00:00
logger.info(f'-------dou_bao ask:{question}')
2024-10-14 10:20:55 +00:00
try:
2024-11-16 02:13:11 +00:00
self._stream = self.__client.chat.completions.create(
2024-10-14 10:20:55 +00:00
model="ep-20241008152048-fsgzf",
messages=[
{"role": "system", "content": "你是测试客服,是由字节跳动开发的 AI 人工智能助手"},
{"role": "user", "content": question},
],
stream=True
)
2024-11-07 12:43:46 +00:00
2024-10-14 10:20:55 +00:00
sec = ''
2024-11-16 02:13:11 +00:00
for completion in self._stream:
2024-10-14 10:20:55 +00:00
sec = sec + completion.choices[0].delta.content
2024-11-08 07:23:44 +00:00
sec, message = handle.handle(sec)
2024-10-14 10:20:55 +00:00
if len(message) > 0:
2024-11-14 17:09:47 +00:00
# logger.info(f'-------dou_bao nlp time:{time.time() - t:.4f}s')
2024-11-08 07:23:44 +00:00
callback(message)
callback(sec)
2024-11-14 17:09:47 +00:00
# logger.info(f'-------dou_bao nlp time:{time.time() - t:.4f}s')
2024-11-16 02:13:11 +00:00
self._stream.close()
2024-11-08 07:23:44 +00:00
self._stream = None
2024-10-14 10:20:55 +00:00
except Exception as e:
2024-11-14 17:09:47 +00:00
logger.error(f'-------dou_bao error:{e}')
# logger.info(f'-------dou_bao nlp time:{time.time() - t:.4f}s')
2024-11-16 02:13:11 +00:00
def close(self):
2024-11-08 07:23:44 +00:00
if self._stream is not None:
2024-11-16 02:13:11 +00:00
self._stream.close()
2024-11-08 07:23:44 +00:00
self._stream = None
2024-10-17 15:26:21 +00:00
logger.info('AsyncArk close')
2024-10-14 10:20:55 +00:00
if self.__client is not None and not self.__client.is_closed():
2024-11-16 02:13:11 +00:00
self.__client.close()
2024-11-08 07:23:44 +00:00
self.__client = None
2024-11-08 23:39:03 +00:00
def aclose(self):
if self._stream is not None:
self._stream.close()
self._stream = None
logger.info('AsyncArk close')
if self.__client is not None and not self.__client.is_closed():
self.__client.close()
self.__client = None
2024-11-08 07:23:44 +00:00
class DouBaoHttp:
def __init__(self, token):
self.__token = token
self._response = None
self._requesting = False
def __request(self, question):
url = "https://ark.cn-beijing.volces.com/api/v3/chat/completions"
headers = {
"Authorization": "Bearer " + self.__token,
"Content-Type": "application/json"
}
data = {
"model": "ep-20241008152048-fsgzf",
"messages": question,
'stream': True
}
response = requests.post(url, headers=headers, json=data, stream=True)
return response
2024-11-16 02:13:11 +00:00
def request(self, question, handle, callback):
2024-11-08 07:23:44 +00:00
t = time.time()
self._requesting = True
logger.info(f'-------dou_bao ask:{question}')
msg_list = [
{"role": "system", "content": "你是测试客服,是由字节跳动开发的 AI 人工智能助手"},
{"role": "user", "content": question}
]
self._response = self.__request(msg_list)
if not self._response.ok:
2024-11-13 04:58:56 +00:00
logger.error(f"请求失败,状态码:{self._response.status_code}")
2024-11-08 07:23:44 +00:00
return
sec = ''
for chunk in self._response.iter_lines():
content = chunk.decode("utf-8").strip()
if len(content) < 1:
continue
content = content[5:]
2024-11-13 04:58:56 +00:00
content = content.strip()
if content == '[DONE]':
break
try:
content = json.loads(content)
except Exception as e:
logger.error(f"json解析失败错误信息{e, content}")
continue
2024-11-08 07:23:44 +00:00
sec = sec + content["choices"][0]["delta"]["content"]
sec, message = handle.handle(sec)
if len(message) > 0:
logger.info(f'-------dou_bao nlp time:{time.time() - t:.4f}s')
callback(message)
2024-11-13 04:58:56 +00:00
if len(sec) > 0:
callback(sec)
2024-11-08 07:23:44 +00:00
self._requesting = False
logger.info(f'-------dou_bao nlp time:{time.time() - t:.4f}s')
2024-11-16 02:13:11 +00:00
def close(self):
2024-11-08 07:23:44 +00:00
if self._response is not None and self._requesting:
self._response.close()
2024-11-08 23:39:03 +00:00
def aclose(self):
if self._response is not None and self._requesting:
self._response.close()
logger.info('DouBaoHttp close')
2024-11-08 07:23:44 +00:00
class DouBao(NLPBase):
def __init__(self, context, split, callback=None):
super().__init__(context, split, callback)
logger.info("DouBao init")
# Access Key ID
# AKLTYTdmOTBmNWFjODkxNDE2Zjk3MjU0NjRhM2JhM2IyN2Y
# AKLTNDZjNTdhNDlkZGE3NDZjMDlkMzk5YWQ3MDA4MTY1ZDc
# Secret Access Key
# WmpRelltRXhNbVkyWWpnNU5HRmpNamc0WTJZMFpUWmpOV1E1TTJFME1tTQ==
# TkRJMk1tTTFZamt4TkRVNE5HRTNZMkUyTnpFeU5qQmxNMkUwWXpaak1HRQ==
# endpoint_id
# ep-20241008152048-fsgzf
# api_key
# c9635f9e-0f9e-4ca1-ac90-8af25a541b74
# api_ky
# eyJhbGciOiJSUzI1NiIsInR5cCI6IkpXVCJ9.eyJpc3MiOiJhcmstY29uc29sZSIsImV4cCI6MTczMDk2NTMxOSwiaWF0IjoxNzI4MzczMzE5LCJ0IjoidXNlciIsImt2IjoxLCJhaWQiOiIyMTAyMjc3NDc1IiwidWlkIjoiMCIsImlzX291dGVyX3VzZXIiOnRydWUsInJlc291cmNlX3R5cGUiOiJlbmRwb2ludCIsInJlc291cmNlX2lkcyI6WyJlcC0yMDI0MTAwODE1MjA0OC1mc2d6ZiJdfQ.BHgFj-UKeu7IGG5VL2e6iPQEMNMkQrgmM46zYmTpoNG_ySgSFJLWYzbrIABZmqVDB4Rt58j8kvoORs-RHJUz81rXUlh3BYl9-ZwbggtAU7Z1pm54_qZ00jF0jQ6r-fUSXZo2PVCLxb_clNuEh06NyaV7ullZwUCyLKx3vhCsxPAuEvQvLc_qDBx-IYNT-UApVADaqMs-OyewoxahqQ7RvaHFF14R6ihmg9H0uvl00_JiGThJveszKvy_T-Qk6iPOy-EDI2pwJxdHMZ7By0bWK5EfZoK2hOvOSRD0BNTYnvrTfI0l2JgS0nwCVEPR4KSTXxU_oVVtuUSZp1UHvvkhvA
self.__token = 'c9635f9e-0f9e-4ca1-ac90-8af25a541b74'
self._dou_bao = DouBaoHttp(self.__token)
2024-11-16 02:13:11 +00:00
def _request(self, question):
self._dou_bao.request(question, self._split_handle, self._on_callback)
2024-11-08 07:23:44 +00:00
2024-11-16 02:13:11 +00:00
def _on_close(self):
2024-11-08 07:23:44 +00:00
if self._dou_bao is not None:
2024-11-16 02:13:11 +00:00
self._dou_bao.close()
2024-11-08 07:23:44 +00:00
logger.info('AsyncArk close')
2024-11-08 23:39:03 +00:00
def on_clear_cache(self, *args, **kwargs):
super().on_clear_cache(*args, **kwargs)
if self._dou_bao is not None:
self._dou_bao.aclose()
logger.info('DouBao clear_cache')