ZeyuXie committed on
Commit
c2201d6
1 Parent(s): ccb7c0b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -32,9 +32,9 @@ class InferRunner:
32
  ).eval().to(device)
33
  self.scheduler = DDPMScheduler.from_pretrained(train_args.scheduler_name, subfolder="scheduler")
34
 
35
- def infer(caption, runner):
36
  with torch.no_grad():
37
- latents = runner.picomodel.demo_inference(caption, runner.scheduler, num_steps=200, guidance=3.0, num_samples=1, audio_len=16000*10, disable_progress=True)
38
  mel = runner.vae.decode_first_stage(latents)
39
  wave = runner.vae.decode_to_waveform(mel)[0][:audio_len]
40
  sf.write(f"synthesized/{caption}.wav", wave, samplerate=16000, subtype='PCM_16')
@@ -50,7 +50,7 @@ with gr.Blocks() as demo:
50
  with gr.Row():
51
  with gr.Column():
52
  prompt = gr.Textbox(label="Prompt: Input your caption formatted as 'event1 at onset1-offset1_onset2-offset2 and event2 at onset1-offset1.",
53
- value="spraying at 0.38-1.176_3.06-3.856 and gunshot at 1.729-3.729_4.367-6.367_7.031-9.031.")
54
  run_button = gr.Button()
55
 
56
  with gr.Accordion("Advanced options", open=False):
@@ -64,7 +64,7 @@ with gr.Blocks() as demo:
64
  outaudio = gr.Audio()
65
 
66
  run_button.click(fn=infer, inputs=[
67
- prompt, num_steps, guidance], outputs=[outaudio])
68
  # with gr.Row():
69
  # with gr.Column():
70
  # gr.Examples(
 
32
  ).eval().to(device)
33
  self.scheduler = DDPMScheduler.from_pretrained(train_args.scheduler_name, subfolder="scheduler")
34
 
35
+ def infer(caption, runner, num_steps=200, guidance=3.0):
36
  with torch.no_grad():
37
+ latents = runner.picomodel.demo_inference(caption, runner.scheduler, num_steps=num_steps, guidance=guidance, num_samples=1, audio_len=16000*10, disable_progress=True)
38
  mel = runner.vae.decode_first_stage(latents)
39
  wave = runner.vae.decode_to_waveform(mel)[0][:audio_len]
40
  sf.write(f"synthesized/{caption}.wav", wave, samplerate=16000, subtype='PCM_16')
 
50
  with gr.Row():
51
  with gr.Column():
52
  prompt = gr.Textbox(label="Prompt: Input your caption formatted as 'event1 at onset1-offset1_onset2-offset2 and event2 at onset1-offset1.",
53
+ value="spraying at 0.38-1.176_3.06-3.856 and gunshot at 1.729-3.729_4.367-6.367_7.031-9.031.",)
54
  run_button = gr.Button()
55
 
56
  with gr.Accordion("Advanced options", open=False):
 
64
  outaudio = gr.Audio()
65
 
66
  run_button.click(fn=infer, inputs=[
67
+ prompt, infer_runner, num_steps, guidance], outputs=[outaudio])
68
  # with gr.Row():
69
  # with gr.Column():
70
  # gr.Examples(