mirror of
https://github.com/BoardWare-Genius/jarvis-models.git
synced 2025-12-13 16:53:24 +00:00
feat: audio chat
This commit is contained in:
2
main.py
2
main.py
@ -46,4 +46,4 @@ async def workflows(script: Annotated[str, Form()], request: Request=None):
|
|||||||
ast.exec(dsl_runtime)
|
ast.exec(dsl_runtime)
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
uvicorn.run("main:app", host="127.0.0.1", port=8000, log_level="info")
|
uvicorn.run("main:app", host="0.0.0.0", port=8000, log_level="info")
|
||||||
|
|||||||
36
src/blackbox/audio_chat.py
Normal file
36
src/blackbox/audio_chat.py
Normal file
@ -0,0 +1,36 @@
|
|||||||
|
from fastapi import Request, Response,status
|
||||||
|
from fastapi.responses import JSONResponse
|
||||||
|
|
||||||
|
from .blackbox import Blackbox
|
||||||
|
|
||||||
|
class AudioChat(Blackbox):
|
||||||
|
|
||||||
|
def __init__(self, asr, gpt, tts):
|
||||||
|
self.asr = asr
|
||||||
|
self.gpt = gpt
|
||||||
|
self.tts = tts
|
||||||
|
|
||||||
|
def __call__(self, *args, **kwargs):
|
||||||
|
return self.processing(*args, **kwargs)
|
||||||
|
|
||||||
|
def valid(self, *args, **kwargs) -> bool :
|
||||||
|
data = args[0]
|
||||||
|
if isinstance(data, bytes):
|
||||||
|
return True
|
||||||
|
return False
|
||||||
|
|
||||||
|
async def processing(self, *args, **kwargs):
|
||||||
|
data = args[0]
|
||||||
|
text = await self.asr(data)
|
||||||
|
# TODO: ID
|
||||||
|
text = self.gpt("123", " " + text)
|
||||||
|
audio = self.tts(text)
|
||||||
|
return audio
|
||||||
|
|
||||||
|
async def fast_api_handler(self, request: Request) -> Response:
|
||||||
|
data = (await request.form()).get("audio")
|
||||||
|
if data is None:
|
||||||
|
return JSONResponse(content={"error": "data is required"}, status_code=status.HTTP_400_BAD_REQUEST)
|
||||||
|
d = await data.read()
|
||||||
|
by = await self.processing(d)
|
||||||
|
return Response(content=by.read(), media_type="audio/wav", headers={"Content-Disposition": "attachment; filename=audio.wav"})
|
||||||
@ -1,3 +1,4 @@
|
|||||||
|
from .audio_chat import AudioChat
|
||||||
from .sum import SUM
|
from .sum import SUM
|
||||||
from .sentiment import Sentiment
|
from .sentiment import Sentiment
|
||||||
from .tts import TTS
|
from .tts import TTS
|
||||||
@ -19,6 +20,7 @@ class BlackboxFactory:
|
|||||||
self.audio_to_text = AudioToText()
|
self.audio_to_text = AudioToText()
|
||||||
self.text_to_audio = TextToAudio()
|
self.text_to_audio = TextToAudio()
|
||||||
self.tesou = Tesou()
|
self.tesou = Tesou()
|
||||||
|
self.audio_chat = AudioChat(self.asr, self.tesou, self.tts)
|
||||||
|
|
||||||
def __call__(self, *args, **kwargs):
|
def __call__(self, *args, **kwargs):
|
||||||
return self.processing(*args, **kwargs)
|
return self.processing(*args, **kwargs)
|
||||||
@ -40,4 +42,6 @@ class BlackboxFactory:
|
|||||||
return self.sum
|
return self.sum
|
||||||
if blackbox_name == "tesou":
|
if blackbox_name == "tesou":
|
||||||
return self.tesou
|
return self.tesou
|
||||||
|
if blackbox_name == "audio_chat":
|
||||||
|
return self.audio_chat
|
||||||
raise ValueError("Invalid blockbox type")
|
raise ValueError("Invalid blockbox type")
|
||||||
@ -17,8 +17,7 @@ class Tesou(Blackbox):
|
|||||||
|
|
||||||
# 用户输入的数据格式为:[{"id": "123", "prompt": "叉烧饭,帮我查询叉烧饭的介绍"}]
|
# 用户输入的数据格式为:[{"id": "123", "prompt": "叉烧饭,帮我查询叉烧饭的介绍"}]
|
||||||
def processing(self, id, prompt) -> str:
|
def processing(self, id, prompt) -> str:
|
||||||
url = 'http://120.196.116.194:48891/'
|
url = 'http://120.196.116.194:48891/chat/'
|
||||||
|
|
||||||
message = {
|
message = {
|
||||||
"user_id": id,
|
"user_id": id,
|
||||||
"prompt": prompt,
|
"prompt": prompt,
|
||||||
|
|||||||
Reference in New Issue
Block a user