Spaces:

Rogerjs
/

Voicecloner

Sleeping

Rogerjs committed on Dec 5, 2024

Commit

4f9d782

verified ·

1 Parent(s): 4d6d38d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,6 +9,13 @@ from scipy.io import wavfile
 from bark import generate_audio, SAMPLE_RATE
 from bark.generation import preload_models, load_model, generate_text_semantic
 class VoiceCloningApp:
     def __init__(self):
         # Create working directory
@@ -19,8 +26,8 @@ class VoiceCloningApp:
         # Explicit model loading with error handling
         try:
             print("Attempting to load Bark models...")
-            preload_models()
-            print("Bark models loaded successfully.")
         except Exception as e:
             print(f"Error loading Bark models: {e}")
             raise RuntimeError(f"Could not load Bark models: {e}")
@@ -62,13 +69,15 @@ class VoiceCloningApp:
                 history_prompt=None,
                 temp=0.7,
                 min_eos_p=0.05,
             )
             # Generate audio from semantic tokens
             audio_array = generate_audio(
                 semantic_tokens,
                 history_prompt=None,
-                temp=0.7
             )
             # Save generated audio

 from bark import generate_audio, SAMPLE_RATE
 from bark.generation import preload_models, load_model, generate_text_semantic
+# Add device detection
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+print("CUDA available:", torch.cuda.is_available())
+print("CUDA device count:", torch.cuda.device_count())
+if torch.cuda.is_available():
+    print("CUDA device name:", torch.cuda.get_device_name(0))
 class VoiceCloningApp:
     def __init__(self):
         # Create working directory
         # Explicit model loading with error handling
         try:
             print("Attempting to load Bark models...")
+            preload_models(device=device)
+            print(f"Bark models loaded successfully on {device}")
         except Exception as e:
             print(f"Error loading Bark models: {e}")
             raise RuntimeError(f"Could not load Bark models: {e}")
                 history_prompt=None,
                 temp=0.7,
                 min_eos_p=0.05,
+                device=device
             )
             # Generate audio from semantic tokens
             audio_array = generate_audio(
                 semantic_tokens,
                 history_prompt=None,
+                temp=0.7,
+                device=device
             )
             # Save generated audio