Spaces:

Rogerjs
/

Voicecloner

Sleeping

App Files Community

Roger committed on Dec 5, 2024

Commit

3a938ac

1 Parent(s): dd83b45

updated

Browse files

Files changed (2) hide show

app.py +20 -24
requirements.txt +1 -4

app.py CHANGED Viewed

@@ -7,14 +7,7 @@ from scipy.io import wavfile
 # Explicitly import Bark components
 from bark import generate_audio, SAMPLE_RATE
-from bark.generation import preload_models, load_model, generate_text_semantic
-# Add device detection
-device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-print("CUDA available:", torch.cuda.is_available())
-print("CUDA device count:", torch.cuda.device_count())
-if torch.cuda.is_available():
-    print("CUDA device name:", torch.cuda.get_device_name(0))
 class VoiceCloningApp:
     def __init__(self):
@@ -26,11 +19,17 @@ class VoiceCloningApp:
         # Explicit model loading with error handling
         try:
             print("Attempting to load Bark models...")
-            preload_models(device=device)
-            print(f"Bark models loaded successfully on {device}")
         except Exception as e:
             print(f"Error loading Bark models: {e}")
-            raise RuntimeError(f"Could not load Bark models: {e}")
     def process_reference_audio(self, audio_data):
         """Simple audio processing"""
@@ -63,21 +62,11 @@ class VoiceCloningApp:
             # Generate audio with explicit error handling
             print(f"Generating speech for text: {text}")
-            # Use alternative generation method
-            semantic_tokens = generate_text_semantic(
-                text,
-                history_prompt=None,
-                temp=0.7,
-                min_eos_p=0.05,
-                device=device
-            )
-            # Generate audio from semantic tokens
             audio_array = generate_audio(
-                semantic_tokens,
                 history_prompt=None,
-                temp=0.7,
-                device=device
             )
             # Save generated audio
@@ -89,9 +78,16 @@ class VoiceCloningApp:
         except Exception as e:
             print(f"Speech generation error: {e}")
             return None, f"Error generating speech: {str(e)}"
 def create_interface():
     app = VoiceCloningApp()
     # Use the most basic Gradio theme to avoid font issues

 # Explicitly import Bark components
 from bark import generate_audio, SAMPLE_RATE
+from bark.generation import preload_models
 class VoiceCloningApp:
     def __init__(self):
         # Explicit model loading with error handling
         try:
             print("Attempting to load Bark models...")
+            # Remove device argument
+            preload_models()
+            print("Bark models loaded successfully.")
         except Exception as e:
             print(f"Error loading Bark models: {e}")
+            # Log the full error for debugging
+            import traceback
+            traceback.print_exc()
+            # Provide a more informative error message
+            raise RuntimeError(f"Could not load Bark models. Error: {e}")
     def process_reference_audio(self, audio_data):
         """Simple audio processing"""
             # Generate audio with explicit error handling
             print(f"Generating speech for text: {text}")
+            # Simplified audio generation
             audio_array = generate_audio(
+                text,
                 history_prompt=None,
+                temp=0.7
             )
             # Save generated audio
         except Exception as e:
             print(f"Speech generation error: {e}")
+            # Log the full error for debugging
+            import traceback
+            traceback.print_exc()
             return None, f"Error generating speech: {str(e)}"
 def create_interface():
+    # Create working directory if it doesn't exist
+    working_dir = os.path.join(os.path.dirname(os.path.abspath(__file__)), "working_files")
+    os.makedirs(working_dir, exist_ok=True)
     app = VoiceCloningApp()
     # Use the most basic Gradio theme to avoid font issues

requirements.txt CHANGED Viewed

@@ -2,9 +2,6 @@ gradio>=3.50.2
 numpy
 scipy
 soundfile
-torch>=2.0.0+cu118
-torchvision>=0.15.0+cu118
-torchaudio>=2.0.0
 transformers
 git+https://github.com/suno-ai/bark.git
---extra-index-url https://download.pytorch.org/whl/cu118

 numpy
 scipy
 soundfile
+torch
 transformers
 git+https://github.com/suno-ai/bark.git