Spaces:

johann22
/

ss

Runtime error

App Files Community

johann22 committed on Nov 26, 2024

Commit

c7cebb0

•

1 Parent(s): 7c5664b

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -39

app.py CHANGED Viewed

@@ -1,43 +1,18 @@
-import outetts
-# Configure the model
-model_config = outetts.HFModelConfig_v1(
-    model_path="OuteAI/OuteTTS-0.2-500M",
-    language="en",  # Supported languages in v0.2: en, zh, ja, ko
-)
-# Initialize the interface
-interface = outetts.InterfaceHF(model_version="0.2", cfg=model_config)
-# Optional: Create a speaker profile (use a 10-15 second audio clip)
-# speaker = interface.create_speaker(
-#     audio_path="path/to/audio/file",
-#     transcript="Transcription of the audio file."
-# )
-# Optional: Save and load speaker profiles
-# interface.save_speaker(speaker, "speaker.json")
-# speaker = interface.load_speaker("speaker.json")
-# Optional: Load speaker from default presets
-interface.print_default_speakers()
-speaker = interface.load_default_speaker(name="male_1")
-output = interface.generate(
-    text="Speech synthesis is the artificial production of human speech. A computer system used for this purpose is called a speech synthesizer, and it can be implemented in software or hardware products.",
-    # Lower temperature values may result in a more stable tone,
-    # while higher values can introduce varied and expressive speech
-    temperature=0.1,
-    repetition_penalty=1.1,
-    max_length=4096,
-    # Optional: Use a speaker profile for consistent voice characteristics
-    # Without a speaker profile, the model will generate a voice with random characteristics
-    speaker=speaker,
-)
-# Save the synthesized speech to a file
-output.save("output.wav")
-# Optional: Play the synthesized speech
-output.play()

+import torch
+from diffusers import MochiPipeline
+from diffusers.utils import export_to_video
+import gradio as gr
+pipe = MochiPipeline.from_pretrained("genmo/mochi-1-preview", variant="bf16", torch_dtype=torch.bfloat16)
+# Enable memory savings
+pipe.enable_model_cpu_offload()
+pipe.enable_vae_tiling()
+prompt = "Close-up of a chameleon's eye, with its scaly skin changing color. Ultra high resolution 4k."
+frames = pipe(prompt, num_frames=84).frames[0]
+export_to_video(frames, "mochi.mp4", fps=30)
+with gr.Blocks() as b:
+    vid=gr.Video("mochi.mp4")
+b.launch()