bcci committed on
Commit
01f0881
·
verified ·
1 Parent(s): 9a74dea

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -8
app.py CHANGED
@@ -31,7 +31,7 @@ phoneme_vocab = config['vocab']
31
  # Download the model and voice files from Hugging Face Hub
32
  # ------------------------------------------------------------------------------
33
  model_repo = "onnx-community/Kokoro-82M-v1.0-ONNX"
34
- model_name = "onnx/model_quantized.onnx"
35
  voice_file_pattern = "*.bin"
36
  local_dir = "."
37
  snapshot_download(
@@ -241,14 +241,9 @@ def tts_streaming(text: str, voice: str = "af_heart", speed: float = 1.0, format
241
  # audio_tensor = torch.from_numpy(audio_int16.astype(np.float32) / 32767)
242
 
243
  # Yield the encoded audio chunk.
244
- if format.lower() == "wav":
245
- yield audio_int16
246
- elif format.lower() == "opus":
247
- yield audio_tensor_to_opus_bytes(audio_tensor, sample_rate=sample_rate)
248
- else:
249
- raise HTTPException(status_code=400, detail=f"Unsupported audio format: {format}")
250
 
251
- media_type = "audio/wav" if format.lower() == "wav" else "audio/opus"
252
  return StreamingResponse(
253
  audio_generator(),
254
  media_type=media_type,
 
31
  # Download the model and voice files from Hugging Face Hub
32
  # ------------------------------------------------------------------------------
33
  model_repo = "onnx-community/Kokoro-82M-v1.0-ONNX"
34
+ model_name = "onnx/model_q8f16.onnx"
35
  voice_file_pattern = "*.bin"
36
  local_dir = "."
37
  snapshot_download(
 
241
  # audio_tensor = torch.from_numpy(audio_int16.astype(np.float32) / 32767)
242
 
243
  # Yield the encoded audio chunk.
244
+ yield audio_int16.tobytes()
 
 
 
 
 
245
 
246
+ media_type = "audio/wav"
247
  return StreamingResponse(
248
  audio_generator(),
249
  media_type=media_type,