alethanhson committed on
Commit
bd02d7a
·
1 Parent(s): b460716
Files changed (1) hide show
  1. app.py +6 -5
app.py CHANGED
@@ -58,7 +58,7 @@ async def startup_event():
58
  logger.warning("GPU not available. Using CPU, performance may be slow!")
59
 
60
  try:
61
- generator = load_csm_1b(device="cuda")
62
  logger.info(f"Model loaded successfully on device: {device}")
63
  except Exception as e:
64
  logger.error(f"Could not load model: {str(e)}")
@@ -102,13 +102,14 @@ async def generate_audio(request: GenerateAudioRequest):
102
 
103
  buffer = io.BytesIO()
104
  torchaudio.save(buffer, audio.unsqueeze(0).cpu(), generator.sample_rate, format="wav")
105
- torchaudio.save("audio.wav", audio.unsqueeze(0).cpu(), generator.sample_rate)
106
  buffer.seek(0)
107
- audio_base64 = base64.b64encode(buffer.read()).decode("utf-8")
108
 
109
  return AudioResponse(
110
- audio_base64=audio_base64,
111
- sample_rate=generator.sample_rate
 
112
  )
113
 
114
  except Exception as e:
 
58
  logger.warning("GPU not available. Using CPU, performance may be slow!")
59
 
60
  try:
61
+ generator = load_csm_1b(device=device)
62
  logger.info(f"Model loaded successfully on device: {device}")
63
  except Exception as e:
64
  logger.error(f"Could not load model: {str(e)}")
 
102
 
103
  buffer = io.BytesIO()
104
  torchaudio.save(buffer, audio.unsqueeze(0).cpu(), generator.sample_rate, format="wav")
105
+ # torchaudio.save("audio.wav", audio.unsqueeze(0).cpu(), generator.sample_rate)
106
  buffer.seek(0)
107
+ # audio_base64 = base64.b64encode(buffer.read()).decode("utf-8")
108
 
109
  return AudioResponse(
110
+ content=buffer.read(),
111
+ media_type="audio/wav",
112
+ headers={"Content-Disposition": "attachment; filename=audio.wav"}
113
  )
114
 
115
  except Exception as e: