Steveeeeeeen HF staff committed on
Commit
e5d26e9
·
verified ·
1 Parent(s): 46f1390

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -7,6 +7,7 @@ from zonos.conditioning import make_cond_dict
7
 
8
  # Global cache to hold the loaded model
9
  MODEL = None
 
10
 
11
  def load_model():
12
  """
@@ -50,14 +51,14 @@ def tts(text, speaker_audio):
50
  # Get speaker embedding
51
  with torch.no_grad():
52
  spk_embedding = model.make_speaker_embedding(wav_tensor, sr)
53
- spk_embedding = spk_embedding.to(model.device, dtype=torch.bfloat16)
54
 
55
  # Prepare conditioning dictionary
56
  cond_dict = make_cond_dict(
57
  text=text, # The text prompt
58
  speaker=spk_embedding, # Speaker embedding from reference audio
59
  language="en-us", # Hard-coded language or switch to another if needed
60
- device=model.device,
61
  )
62
  conditioning = model.prepare_conditioning(cond_dict)
63
 
 
7
 
8
  # Global cache to hold the loaded model
9
  MODEL = None
10
+ device = "cuda"
11
 
12
  def load_model():
13
  """
 
51
  # Get speaker embedding
52
  with torch.no_grad():
53
  spk_embedding = model.make_speaker_embedding(wav_tensor, sr)
54
+ spk_embedding = spk_embedding.to(device, dtype=torch.bfloat16)
55
 
56
  # Prepare conditioning dictionary
57
  cond_dict = make_cond_dict(
58
  text=text, # The text prompt
59
  speaker=spk_embedding, # Speaker embedding from reference audio
60
  language="en-us", # Hard-coded language or switch to another if needed
61
+ device=device,
62
  )
63
  conditioning = model.prepare_conditioning(cond_dict)
64