Spaces:
Running
on
Zero
Running
on
Zero
File size: 1,954 Bytes
a66ecf5 3efa2af 8dacb10 c989815 d45a9bf 46f15cd 3efa2af 46f15cd 3efa2af 016958e 3efa2af 7670c1c c1aae9d a66ecf5 0062591 a66ecf5 e4a10b7 a66ecf5 d4beeea 7095c54 016958e c989815 562962c d45a9bf ac3db70 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 |
import gradio as gr
from musiclib import musicgen
from io import BytesIO
import midi_util
from midi_util import VocabConfig
import tempfile
from glob import glob
import soundfile as sf
def gen(piano_only, length):
midi = ''
for item in musicgen(piano_only=piano_only, length=length):
midi = item
yield item, None
bio = BytesIO()
cfg = VocabConfig.from_json('./vocab_config.json')
text = midi.strip()
mid = midi_util.convert_str_to_midi(cfg, text)
with tempfile.NamedTemporaryFile(suffix='.midi', delete=False) as tmp:
mid.save(tmp.name)
yield midi, tmp.name
with gr.Blocks() as demo:
gr.Markdown("# RWKV 4 Music (MIDI)\n\nThis demo uses the RWKV 4 MIDI model available [here](https://huggingface.co/BlinkDL/rwkv-4-music/blob/main/RWKV-4-MIDI-560M-v1-20230717-ctx4096.pth). Details may be found [here](https://huggingface.co/BlinkDL/rwkv-4-music). The music generation code may be found [here](https://github.com/BlinkDL/ChatRWKV/tree/main/music). The MIDI Tokenizer may be found [here](https://github.com/briansemrau/MIDI-LLM-tokenizer).\n\nNot sure how to play MIDI files? I recommend using the open source [VLC Media Player](https://www.videolan.org/vlc/) with can play MIDI files using FluidSynth.")
piano_only = gr.Checkbox(label="Piano Only")
length = gr.Slider(label="Max Length (in tokens)", minimum=4, maximum=4096, step=1, value=4096, info="The audio may still be shorter than this")
synth = gr.Button("Synthesize")
txtout = gr.Textbox(interactive=False, label="MIDI Tokens")
fileout = gr.File(interactive=False, label="MIDI File", type="binary")
synth.click(gen, inputs=[piano_only, length], outputs=[txtout, fileout])
with gr.Accordion("Samples", open=False):
for i, audpath in enumerate(glob("*.wav")):
gr.Audio(interactive=False, value=sf.read(audpath), label=f'Sample {i + 1}')
demo.queue(api_open=False).launch(show_api=False) |