juancopi81 committed on
Commit
d13787f
1 Parent(s): 197a713

Initial commit

Files changed (4)
  1. README.md +1 -1
  2. app.py +104 -0
  3. requirements.txt +6 -0
  4. utils.py +182 -0
README.md CHANGED
@@ -1,6 +1,6 @@
 ---
 title: Mutopia Guitar Composer
-emoji: 🏃
+emoji: 🎸
 colorFrom: blue
 colorTo: green
 sdk: gradio
app.py ADDED
@@ -0,0 +1,104 @@
+import gradio as gr
+from transformers import AutoTokenizer, TFGPT2LMHeadModel
+from transformers import pipeline
+import note_seq
+
+from utils import token_sequence_to_note_sequence, create_image_from_note_sequence
+
+SAMPLE_RATE = 44100
+
+# Feel free to change this; I am using only three notes here because the model
+# works better this way.
+notes = ["D3", "G3", "E4"]
+notes_to_midi = {"D3": 50, "G3": 55, "E4": 64}
+time_signatures = ["4/4", "3/4", "2/4", "6/8"]
+time_signature_to_tokens = {"4/4": "4_4", "3/4": "3_4", "2/4": "2_4", "6/8": "6_8"}
+
+# Mutopia model for music generation
+mutopia_model = TFGPT2LMHeadModel.from_pretrained("juancopi81/mutopia_guitar_mmm")
+mutopia_tokenizer = AutoTokenizer.from_pretrained("juancopi81/mutopia_guitar_mmm")
+pipe = pipeline(
+    "text-generation", model=mutopia_model, tokenizer=mutopia_tokenizer, device=0
+)
+
+# Content for your demo:
+title = "Mutopia Guitar Composer"
+# I am adding an image here that I generated using DALL-E
+description = """
+The bot was trained to compose guitar music using the
+[Mutopia Guitar Dataset](https://huggingface.co/datasets/juancopi81/mutopia_guitar_dataset).
+Change the controls and receive a new guitar piece!
+<figure>
+<center>
+<img src="https://drive.google.com/uc?export=view&id=1F22ofTCeJAHqVag4lJvBZugAE1OyabVA"
+width=200px alt="Robot playing the guitar">
+<figcaption>Image generated using DALL-E</figcaption>
+</center>
+</figure>
+"""
+article = """
+For a complete tutorial on how to create this demo from scratch, check out this
+[GitHub Repo](https://github.com/juancopi81/MMM_Mutopia_Guitar).
+"""
+
+# Helper function to create the string seed
+def create_seed(time_signature: str,
+                note: str,
+                bpm: int,
+                density: int) -> str:
+
+    seed = (f"PIECE_START TIME_SIGNATURE={time_signature_to_tokens[time_signature]} "
+            f"BPM={bpm} TRACK_START INST=0 DENSITY={density} "
+            f"BAR_START NOTE_ON={notes_to_midi[note]} ")
+    return seed
+
+def generate_guitar_piece(time_signature: str,
+                          note: str,
+                          bpm: int,
+                          density: int):
+    seed = create_seed(time_signature, note, bpm, density)
+    piece = pipe(seed, max_length=250)[0]["generated_text"]
+
+    # Convert the generated token text to audio
+    note_sequence = token_sequence_to_note_sequence(piece)
+    synth = note_seq.midi_synth.fluidsynth
+    array_of_floats = synth(note_sequence, sample_rate=SAMPLE_RATE)
+    int16_data = note_seq.audio_io.float_samples_to_int16(array_of_floats)
+    piano_roll = create_image_from_note_sequence(note_sequence)
+    return (SAMPLE_RATE, int16_data), piano_roll
+
+# Create a Blocks object
+demo = gr.Blocks()
+
+# Use your Blocks object as a context manager
+with demo:
+    gr.Markdown("<h1 style='text-align: center; margin-bottom: 1rem'>"
+                + title
+                + "</h1>")
+    gr.Markdown(description)
+
+    # UI for the inputs of the model
+    gr.Markdown("Select the generation parameters.")
+    with gr.Row():
+        time_signature = gr.Dropdown(time_signatures, value="4/4", label="Time signature")
+        note = gr.Dropdown(notes, value="G3", label="First note")
+        bpm = gr.Slider(minimum=60, maximum=140, step=10, value=90, label="Tempo")
+        density = gr.Slider(minimum=0, maximum=4, step=1, value=2, label="Density")
+    with gr.Row():
+        btn = gr.Button("Compose")
+    with gr.Row():
+        audio_output = gr.Audio()
+        image_output = gr.Image()
+    btn.click(generate_guitar_piece,
+              inputs=[
+                  time_signature,
+                  note,
+                  bpm,
+                  density
+              ],
+              outputs=[audio_output, image_output])
+
+    gr.Markdown(article)
+
+# Launch your demo
+demo.launch(debug=False)
requirements.txt ADDED
@@ -0,0 +1,6 @@
+transformers
+note-seq
+protobuf==3.20.1
+pyfluidsynth==1.3.0
+pandas
+matplotlib
utils.py ADDED
@@ -0,0 +1,182 @@
+import collections
+import io
+
+import pandas as pd
+import matplotlib.pyplot as plt
+from matplotlib.patches import Rectangle
+from PIL import Image
+
+import note_seq
+import copy
+
+# Seconds per minute; used to convert BPM into seconds per beat
+BPM_1_SECOND = 60
+
+# Variables to change based on the time signature
+numerator = ""
+denominator = ""
+
+def token_sequence_to_note_sequence(token_sequence,
+                                    use_program=True,
+                                    use_drums=False,
+                                    instrument_mapper=None,
+                                    only_guitar=True):
+
+    if isinstance(token_sequence, str):
+        token_sequence = token_sequence.split()
+
+    note_sequence = empty_note_sequence()
+
+    # Render all notes.
+    current_program = 1
+    current_is_drum = False
+    current_instrument = 0
+    track_count = 0
+    for token_index, token in enumerate(token_sequence):
+
+        if token == "PIECE_START":
+            pass
+        elif token == "PIECE_END":
+            print("The end.")
+            break
+        elif token.startswith("TIME_SIGNATURE="):
+            time_signature_str = token.split("=")[-1]
+            numerator = int(time_signature_str.split("_")[0])
+            denominator = int(time_signature_str.split("_")[-1])
+            time_signature = note_sequence.time_signatures.add()
+            time_signature.numerator = numerator
+            time_signature.denominator = denominator
+        elif token.startswith("BPM="):
+            bpm_str = token.split("=")[-1]
+            bpm = int(bpm_str)
+            note_sequence.tempos[0].qpm = bpm
+            pulse_duration, bar_duration = duration_in_sec(
+                bpm, numerator, denominator
+            )
+        elif token == "TRACK_START":
+            current_bar_index = 0
+            track_count += 1
+            pass
+        elif token == "TRACK_END":
+            pass
+        elif token == "KEYS_START":
+            pass
+        elif token == "KEYS_END":
+            pass
+        elif token.startswith("KEY="):
+            pass
+        elif token.startswith("INST"):
+            instrument = token.split("=")[-1]
+            if instrument != "DRUMS" and use_program:
+                if instrument_mapper is not None:
+                    if instrument in instrument_mapper:
+                        instrument = instrument_mapper[instrument]
+                current_program = int(instrument)
+                current_instrument = track_count
+                current_is_drum = False
+            if instrument == "DRUMS" and use_drums:
+                current_instrument = 0
+                current_program = 0
+                current_is_drum = True
+        elif token == "BAR_START":
+            current_time = (current_bar_index * bar_duration)
+            current_notes = {}
+        elif token == "BAR_END":
+            current_bar_index += 1
+            pass
+        elif token.startswith("NOTE_ON"):
+            pitch = int(token.split("=")[-1])
+            note = note_sequence.notes.add()
+            note.start_time = current_time
+            note.end_time = current_time + denominator * pulse_duration
+            note.pitch = pitch
+            note.instrument = current_instrument
+            note.program = current_program
+            note.velocity = 80
+            note.is_drum = current_is_drum
+            current_notes[pitch] = note
+        elif token.startswith("NOTE_OFF"):
+            pitch = int(token.split("=")[-1])
+            if pitch in current_notes:
+                note = current_notes[pitch]
+                note.end_time = current_time
+        elif token.startswith("TIME_DELTA"):
+            delta = float(token.split("=")[-1]) * (0.25) * pulse_duration
+            current_time += delta
+        elif token.startswith("DENSITY="):
+            pass
+        elif token == "[PAD]":
+            pass
+        else:
+            #print(f"Ignored token {token}.")
+            pass
+
+    # Give each (program, is_drum) pair its own instrument index.
+    instruments_drums = []
+    for note in note_sequence.notes:
+        pair = [note.program, note.is_drum]
+        if pair not in instruments_drums:
+            instruments_drums += [pair]
+        note.instrument = instruments_drums.index(pair)
+
+    if only_guitar:
+        for note in note_sequence.notes:
+            if not note.is_drum:
+                # MIDI program 24 is acoustic guitar (nylon)
+                note.instrument = 24
+                note.program = 24
+
+    return note_sequence
+
+# Calculate the duration in seconds of a pulse (beat) and a bar
+def duration_in_sec(bpm, numerator, denominator):
+    pulse_duration = BPM_1_SECOND / bpm
+    number_of_quarters_per_bar = (4 / denominator) * numerator
+    bar_duration = pulse_duration * number_of_quarters_per_bar
+    return pulse_duration, bar_duration
+
+def empty_note_sequence(qpm=120, total_time=0.0):
+    note_sequence = note_seq.protobuf.music_pb2.NoteSequence()
+    note_sequence.tempos.add().qpm = qpm
+    #note_sequence.ticks_per_quarter = note_seq.constants.STANDARD_PPQ
+    note_sequence.total_time = total_time
+    return note_sequence
+
+# Helpers to generate the piano-roll image
+def sequence_to_pandas_dataframe(sequence):
+    pd_dict = collections.defaultdict(list)
+    for note in sequence.notes:
+        pd_dict["start_time"].append(note.start_time)
+        pd_dict["end_time"].append(note.end_time)
+        pd_dict["duration"].append(note.end_time - note.start_time)
+        pd_dict["pitch"].append(note.pitch)
+
+    return pd.DataFrame(pd_dict)
+
+def dataframe_to_pianoroll_img(df):
+    fig = plt.figure(figsize=(8, 5))
+    ax = fig.add_subplot(111)
+    ax.scatter(df.start_time, df.pitch, c="white")
+    for _, row in df.iterrows():
+        ax.add_patch(Rectangle(
+            (row["start_time"], row["pitch"]-0.4),
+            row["duration"], 0.4, color="black"
+        ))
+    plt.xlabel('Seconds', fontsize=18)
+    plt.ylabel('MIDI pitch', fontsize=16)
+    return fig
+
+def fig2img(fig):
+    """Convert a Matplotlib figure to a PIL Image and return it."""
+    import io
+    buf = io.BytesIO()
+    fig.savefig(buf, format="png")
+    buf.seek(0)
+    img = Image.open(buf)
+    return img
+
+def create_image_from_note_sequence(sequence):
+    df_sequence = sequence_to_pandas_dataframe(sequence)
+    fig = dataframe_to_pianoroll_img(df_sequence)
+    img = fig2img(fig)
+    return img