mirror of
https://github.com/open-webui/open-webui
synced 2025-01-01 08:42:14 +00:00
fix: audio
Some checks are pending
Deploy to HuggingFace Spaces / check-secret (push) Waiting to run
Deploy to HuggingFace Spaces / deploy (push) Blocked by required conditions
Create and publish Docker images with specific build args / build-main-image (linux/amd64) (push) Waiting to run
Create and publish Docker images with specific build args / build-main-image (linux/arm64) (push) Waiting to run
Create and publish Docker images with specific build args / build-cuda-image (linux/amd64) (push) Waiting to run
Create and publish Docker images with specific build args / build-cuda-image (linux/arm64) (push) Waiting to run
Create and publish Docker images with specific build args / build-ollama-image (linux/amd64) (push) Waiting to run
Create and publish Docker images with specific build args / build-ollama-image (linux/arm64) (push) Waiting to run
Create and publish Docker images with specific build args / merge-main-images (push) Blocked by required conditions
Create and publish Docker images with specific build args / merge-cuda-images (push) Blocked by required conditions
Create and publish Docker images with specific build args / merge-ollama-images (push) Blocked by required conditions
Python CI / Format Backend (3.11) (push) Waiting to run
Frontend Build / Format & Build Frontend (push) Waiting to run
Frontend Build / Frontend Unit Tests (push) Waiting to run
Integration Test / Run Cypress Integration Tests (push) Waiting to run
Integration Test / Run Migration Tests (push) Waiting to run
Some checks are pending
Deploy to HuggingFace Spaces / check-secret (push) Waiting to run
Deploy to HuggingFace Spaces / deploy (push) Blocked by required conditions
Create and publish Docker images with specific build args / build-main-image (linux/amd64) (push) Waiting to run
Create and publish Docker images with specific build args / build-main-image (linux/arm64) (push) Waiting to run
Create and publish Docker images with specific build args / build-cuda-image (linux/amd64) (push) Waiting to run
Create and publish Docker images with specific build args / build-cuda-image (linux/arm64) (push) Waiting to run
Create and publish Docker images with specific build args / build-ollama-image (linux/amd64) (push) Waiting to run
Create and publish Docker images with specific build args / build-ollama-image (linux/arm64) (push) Waiting to run
Create and publish Docker images with specific build args / merge-main-images (push) Blocked by required conditions
Create and publish Docker images with specific build args / merge-cuda-images (push) Blocked by required conditions
Create and publish Docker images with specific build args / merge-ollama-images (push) Blocked by required conditions
Python CI / Format Backend (3.11) (push) Waiting to run
Frontend Build / Format & Build Frontend (push) Waiting to run
Frontend Build / Frontend Unit Tests (push) Waiting to run
Integration Test / Run Cypress Integration Tests (push) Waiting to run
Integration Test / Run Migration Tests (push) Waiting to run
This commit is contained in:
parent
455b38dcc1
commit
70de5cf7b8
@ -218,7 +218,7 @@ async def update_audio_config(
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
def load_speech_pipeline():
|
def load_speech_pipeline(request):
|
||||||
from transformers import pipeline
|
from transformers import pipeline
|
||||||
from datasets import load_dataset
|
from datasets import load_dataset
|
||||||
|
|
||||||
@ -236,7 +236,11 @@ def load_speech_pipeline():
|
|||||||
@router.post("/speech")
|
@router.post("/speech")
|
||||||
async def speech(request: Request, user=Depends(get_verified_user)):
|
async def speech(request: Request, user=Depends(get_verified_user)):
|
||||||
body = await request.body()
|
body = await request.body()
|
||||||
name = hashlib.sha256(body).hexdigest()
|
name = hashlib.sha256(
|
||||||
|
body
|
||||||
|
+ str(request.app.state.config.TTS_ENGINE).encode("utf-8")
|
||||||
|
+ str(request.app.state.config.TTS_MODEL).encode("utf-8")
|
||||||
|
).hexdigest()
|
||||||
|
|
||||||
file_path = SPEECH_CACHE_DIR.joinpath(f"{name}.mp3")
|
file_path = SPEECH_CACHE_DIR.joinpath(f"{name}.mp3")
|
||||||
file_body_path = SPEECH_CACHE_DIR.joinpath(f"{name}.json")
|
file_body_path = SPEECH_CACHE_DIR.joinpath(f"{name}.json")
|
||||||
@ -256,10 +260,11 @@ async def speech(request: Request, user=Depends(get_verified_user)):
|
|||||||
payload["model"] = request.app.state.config.TTS_MODEL
|
payload["model"] = request.app.state.config.TTS_MODEL
|
||||||
|
|
||||||
try:
|
try:
|
||||||
|
# print(payload)
|
||||||
async with aiohttp.ClientSession() as session:
|
async with aiohttp.ClientSession() as session:
|
||||||
async with session.post(
|
async with session.post(
|
||||||
url=f"{request.app.state.config.TTS_OPENAI_API_BASE_URL}/audio/speech",
|
url=f"{request.app.state.config.TTS_OPENAI_API_BASE_URL}/audio/speech",
|
||||||
data=payload,
|
json=payload,
|
||||||
headers={
|
headers={
|
||||||
"Content-Type": "application/json",
|
"Content-Type": "application/json",
|
||||||
"Authorization": f"Bearer {request.app.state.config.TTS_OPENAI_API_KEY}",
|
"Authorization": f"Bearer {request.app.state.config.TTS_OPENAI_API_KEY}",
|
||||||
@ -281,7 +286,7 @@ async def speech(request: Request, user=Depends(get_verified_user)):
|
|||||||
await f.write(await r.read())
|
await f.write(await r.read())
|
||||||
|
|
||||||
async with aiofiles.open(file_body_path, "w") as f:
|
async with aiofiles.open(file_body_path, "w") as f:
|
||||||
await f.write(json.dumps(json.loads(body.decode("utf-8"))))
|
await f.write(json.dumps(payload))
|
||||||
|
|
||||||
return FileResponse(file_path)
|
return FileResponse(file_path)
|
||||||
|
|
||||||
@ -292,6 +297,7 @@ async def speech(request: Request, user=Depends(get_verified_user)):
|
|||||||
try:
|
try:
|
||||||
if r.status != 200:
|
if r.status != 200:
|
||||||
res = await r.json()
|
res = await r.json()
|
||||||
|
|
||||||
if "error" in res:
|
if "error" in res:
|
||||||
detail = f"External: {res['error'].get('message', '')}"
|
detail = f"External: {res['error'].get('message', '')}"
|
||||||
except Exception:
|
except Exception:
|
||||||
@ -332,7 +338,7 @@ async def speech(request: Request, user=Depends(get_verified_user)):
|
|||||||
await f.write(await r.read())
|
await f.write(await r.read())
|
||||||
|
|
||||||
async with aiofiles.open(file_body_path, "w") as f:
|
async with aiofiles.open(file_body_path, "w") as f:
|
||||||
await f.write(json.dumps(json.loads(body.decode("utf-8"))))
|
await f.write(json.dumps(payload))
|
||||||
|
|
||||||
return FileResponse(file_path)
|
return FileResponse(file_path)
|
||||||
|
|
||||||
@ -384,6 +390,9 @@ async def speech(request: Request, user=Depends(get_verified_user)):
|
|||||||
async with aiofiles.open(file_path, "wb") as f:
|
async with aiofiles.open(file_path, "wb") as f:
|
||||||
await f.write(await r.read())
|
await f.write(await r.read())
|
||||||
|
|
||||||
|
async with aiofiles.open(file_body_path, "w") as f:
|
||||||
|
await f.write(json.dumps(payload))
|
||||||
|
|
||||||
return FileResponse(file_path)
|
return FileResponse(file_path)
|
||||||
|
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
@ -414,7 +423,7 @@ async def speech(request: Request, user=Depends(get_verified_user)):
|
|||||||
import torch
|
import torch
|
||||||
import soundfile as sf
|
import soundfile as sf
|
||||||
|
|
||||||
load_speech_pipeline()
|
load_speech_pipeline(request)
|
||||||
|
|
||||||
embeddings_dataset = request.app.state.speech_speaker_embeddings_dataset
|
embeddings_dataset = request.app.state.speech_speaker_embeddings_dataset
|
||||||
|
|
||||||
@ -436,8 +445,9 @@ async def speech(request: Request, user=Depends(get_verified_user)):
|
|||||||
)
|
)
|
||||||
|
|
||||||
sf.write(file_path, speech["audio"], samplerate=speech["sampling_rate"])
|
sf.write(file_path, speech["audio"], samplerate=speech["sampling_rate"])
|
||||||
with open(file_body_path, "w") as f:
|
|
||||||
json.dump(json.loads(body.decode("utf-8")), f)
|
async with aiofiles.open(file_body_path, "w") as f:
|
||||||
|
await f.write(json.dumps(payload))
|
||||||
|
|
||||||
return FileResponse(file_path)
|
return FileResponse(file_path)
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user