Spaces:

JammyMachina
/

the-jam-machine-app

Running

App Files Files Community

m41w4r3.exe committed on Dec 19, 2022

Commit

7edf1ce

•

1 Parent(s): 2ec0615

minor initial fixes

Browse files

Files changed (5) hide show

app.py +0 -1
familizer.py +137 -0
generate.py +1 -4
generation_utils.py +141 -0
requirements.txt +16 -1

app.py CHANGED Viewed

@@ -2,7 +2,6 @@ import gradio as gr
 from load import LoadModel
 from generate import GenerateMidiText
 from constants import INSTRUMENT_CLASSES
-from encoder import MIDIEncoder
 from decoder import TextDecoder
 from utils import get_miditok, index_has_substring
 from playback import get_music

 from load import LoadModel
 from generate import GenerateMidiText
 from constants import INSTRUMENT_CLASSES
 from decoder import TextDecoder
 from utils import get_miditok, index_has_substring
 from playback import get_music

familizer.py ADDED Viewed

	@@ -0,0 +1,137 @@

+import random
+from joblib import Parallel, delayed
+from pathlib import Path
+from constants import INSTRUMENT_CLASSES, INSTRUMENT_TRANSFER_CLASSES
+from utils import get_files, timeit, FileCompressor
class Familizer:
    """Rewrite ``INST=<n>`` tokens between MIDI program numbers and family numbers.

    Two directions are supported:

    * ``"family"``: program number -> family number, looked up in
      ``INSTRUMENT_CLASSES``.
    * ``"program"``: family number -> one program number per family, drawn at
      random once when the instance is created (see ``reverse_family``).
    """

    def __init__(self, n_jobs=-1, arbitrary=False):
        """
        n_jobs is forwarded to joblib's Parallel when files are processed.
        arbitrary selects INSTRUMENT_TRANSFER_CLASSES instead of INSTRUMENT_CLASSES
        as the table used to map family numbers back to program numbers.
        """
        self.n_jobs = n_jobs
        # Set by replace_tokens(); defined here so that calling
        # replace_instrument_token() too early yields a clear ValueError.
        self.operation = None
        self.reverse_family(arbitrary)

    def get_family_number(self, program_number):
        """
        Given a MIDI instrument number, return its associated instrument family number.
        Returns None when no entry of INSTRUMENT_CLASSES contains the program number.
        """
        for instrument_class in INSTRUMENT_CLASSES:
            if program_number in instrument_class["program_range"]:
                return instrument_class["family_number"]
        return None

    def reverse_family(self, arbitrary):
        """
        Create a dictionary of family numbers to randomly assigned program numbers.
        This is used to reverse the family number tokens back to program number tokens.
        The draw happens once per call, so every token of a given family maps to
        the same program number for the lifetime of the mapping.
        """
        int_class = INSTRUMENT_TRANSFER_CLASSES if arbitrary else INSTRUMENT_CLASSES
        self.reference_programs = {
            family["family_number"]: random.choice(family["program_range"])
            for family in int_class
        }

    def get_program_number(self, family_number):
        """
        Given a family number, return the program number assigned to that family.
        This is the reverse operation of get_family_number.
        Raises ValueError if the family number is unknown.
        """
        # Explicit check instead of `assert`, which is stripped under `python -O`.
        if family_number not in self.reference_programs:
            raise ValueError(f"Unknown instrument family number: {family_number}")
        return self.reference_programs[family_number]

    # Replace instruments in text files
    def replace_instrument_token(self, token):
        """
        Given a MIDI program number in a word token, replace it with the family or program
        number token depending on the operation.
        e.g. INST=86 -> INST=10
        Raises ValueError when the number cannot be mapped or when self.operation
        is neither 'family' nor 'program'.
        """
        inst_number = int(token.split("=")[1])
        if self.operation == "family":
            new_number = self.get_family_number(inst_number)
            if new_number is None:
                # Fail loudly rather than writing "INST=None" into the data.
                raise ValueError(
                    f"No instrument family contains program number {inst_number} "
                    f"(token {token!r})"
                )
        elif self.operation == "program":
            new_number = self.get_program_number(inst_number)
        else:
            raise ValueError(
                f"Unknown operation {self.operation!r}: expected 'family' or 'program'"
            )
        return f"INST={new_number}"

    def replace_instrument_in_text(self, text):
        """
        Given a text piece, replace every numeric instrument token according to
        the current operation. INST=DRUMS and all other tokens are left untouched.
        """
        return " ".join(
            self.replace_instrument_token(token)
            if token.startswith("INST=") and token != "INST=DRUMS"
            else token
            for token in text.split(" ")
        )

    def replace_instruments_in_file(self, file):
        """Given a text file, rewrite it in place with its instrument tokens replaced."""
        text = file.read_text()
        file.write_text(self.replace_instrument_in_text(text))

    @timeit
    def replace_instruments(self):
        """
        Replace the instrument tokens of every "txt" file that get_files finds
        in self.output_directory, processing the files in parallel.
        """
        files = get_files(self.output_directory, extension="txt")
        Parallel(n_jobs=self.n_jobs)(
            delayed(self.replace_instruments_in_file)(file) for file in files
        )

    def replace_tokens(self, input_directory, output_directory, operation):
        """
        Given a directory and an operation, perform the operation on all text files in the directory.
        operation can be either 'family' or 'program'.
        """
        self.input_directory = input_directory
        self.output_directory = output_directory
        self.operation = operation
        # Uncompress files, replace tokens, compress files
        fc = FileCompressor(self.input_directory, self.output_directory, self.n_jobs)
        fc.unzip()
        self.replace_instruments()
        fc.zip()
        print(self.operation + " complete.")

    def to_family(self, input_directory, output_directory):
        """
        Given a directory containing zip files, replace all instrument tokens with
        family number tokens. The output is a directory of zip files.
        """
        self.replace_tokens(input_directory, output_directory, "family")

    def to_program(self, input_directory, output_directory):
        """
        Given a directory containing zip files, replace all instrument tokens with
        program number tokens. The output is a directory of zip files.
        """
        self.replace_tokens(input_directory, output_directory, "program")
if __name__ == "__main__":
    # Directory holding the encoded pieces to convert from program to family tokens
    input_directory = Path("midi/dataset/first_selection/validate").resolve()  # fmt: skip
    output_directory = input_directory / "family"

    # n_jobs is handed to the Familizer, which forwards it to joblib
    n_jobs = -1
    familizer = Familizer(n_jobs)

    # program numbers -> family numbers
    familizer.to_family(input_directory, output_directory)

    # Reverse direction (family numbers -> program numbers), currently disabled:
    # input_directory = Path("../data/music_picks/encoded_samples/validate/family").resolve()  # fmt: skip
    # output_directory = input_directory.parent / "program"
    # familizer.to_program(input_directory, output_directory)

generate.py CHANGED Viewed

@@ -1,11 +1,8 @@
 from generation_utils import *
 from utils import WriteTextMidiToFile, get_miditok
 from load import LoadModel
-from constants import INSTRUMENT_CLASSES
-## import for execution
 from decoder import TextDecoder
-from playback import get_music, show_piano_roll
 class GenerateMidiText:

 from generation_utils import *
 from utils import WriteTextMidiToFile, get_miditok
 from load import LoadModel
 from decoder import TextDecoder
+from playback import get_music
 class GenerateMidiText:

generation_utils.py ADDED Viewed

	@@ -0,0 +1,141 @@

+import os
+import numpy as np
+import matplotlib.pyplot as plt
+import matplotlib
+from constants import INSTRUMENT_CLASSES
# matplotlib settings
matplotlib.use("Agg")  # for server
# Global plot styling: no tick marks, grey axes background, no axes border.
matplotlib.rcParams.update(
    {
        "xtick.major.size": 0,
        "ytick.major.size": 0,
        "axes.facecolor": "grey",
        "axes.edgecolor": "none",
    }
)
def define_generation_dir(model_repo_path):
    """Return the output directory for a model's generated sequences, creating it if needed.

    The directory is ``midi/generated/<model_repo_path>``, relative to the
    current working directory.
    """
    #### to remove later ####
    # Temporary alias: this local model path is redirected to "misnaej/the-jam-machine".
    if model_repo_path == "models/model_2048_fake_wholedataset":
        model_repo_path = "misnaej/the-jam-machine"
    #### to remove later ####
    generated_sequence_files_path = f"midi/generated/{model_repo_path}"
    # exist_ok=True removes the check-then-create race of a separate
    # os.path.exists() test when several processes start at the same time.
    os.makedirs(generated_sequence_files_path, exist_ok=True)
    return generated_sequence_files_path
def bar_count_check(sequence, n_bars):
    """Check whether the sequence contains the expected number of bars.

    Bars are counted as space-separated "BAR_END" tokens. "BAR_START" is not
    used because it is not always part of ``sequence``: when one more bar is
    generated, BAR_START belongs to the prompt instead.

    Returns a tuple ``(bar_count_matches, bar_count)``; a message is printed
    when the count differs from ``n_bars``.
    """
    bar_count = sequence.split(" ").count("BAR_END")
    bar_count_matches = bar_count == n_bars
    if not bar_count_matches:
        print(f"Bar count is {bar_count} - but should be {n_bars}")
    return bar_count_matches, bar_count
def print_inst_classes(INSTRUMENT_CLASSES):
    """Write each entry of the given instrument classes to stdout, one per line."""
    for entry in INSTRUMENT_CLASSES:
        print(format(entry))
def check_if_prompt_inst_in_tokenizer_vocab(tokenizer, inst_prompt_list):
    """Verify that every prompted instrument has an ``INST=<inst>`` token in the vocab.

    On the first missing instrument, the instrument classes are printed and a
    ValueError listing the instruments found in the vocabulary is raised.
    """
    for inst in inst_prompt_list:
        if f"INST={inst}" in tokenizer.vocab:
            continue
        # Collect what follows the last "=" of every vocab entry mentioning INST
        known = []
        for tok in tokenizer.vocab:
            if "INST" in tok:
                known.append(tok.split("=")[-1])
        instruments_in_dataset = np.sort(known)
        print_inst_classes(INSTRUMENT_CLASSES)
        raise ValueError(
            f"""The instrument {inst} is not in the tokenizer vocabulary.
                Available Instruments: {instruments_in_dataset}"""
        )
def forcing_bar_count(input_prompt, generated, bar_count, expected_length):
    """Force the generated sequence to have the expected number of bars.

    expected_length and bar_count refer to the newly generated part only
    (without the input prompt).

    Returns a tuple ``(full_piece, bar_count_checks)``:
    - too long: the generated text is cut after ``expected_length`` bars,
      closed with "TRACK_END " and the flag is True;
    - too short: prompt + generated is returned unchanged and the flag is
      False, so that the caller can regenerate;
    - exact length: prompt + generated is returned unchanged and the flag is True.
    """
    if bar_count > expected_length:  # Cut the sequence if too long
        bars = generated.split("BAR_END ")
        kept_bars = bars[: max(expected_length, 0)]
        truncated = "".join(bar + "BAR_END " for bar in kept_bars)
        full_piece = input_prompt + truncated + "TRACK_END "
        print(f"Generated sequence trunkated at {expected_length} bars")
        bar_count_checks = True
    elif bar_count < expected_length:  # Do nothing if the sequence is too short
        full_piece = input_prompt + generated
        bar_count_checks = False
        print("--- Generated sequence is too short - Force Regeration ---")
    else:
        # Already the right length. Without this branch the return values were
        # never assigned and the function raised UnboundLocalError.
        full_piece = input_prompt + generated
        bar_count_checks = True
    return full_piece, bar_count_checks
def get_max_time(inst_midi):
    """Return the largest ``get_end_time()`` over ``inst_midi.instruments``, never below 0."""
    end_times = [track.get_end_time() for track in inst_midi.instruments]
    # The leading 0 is the floor used when there are no instruments.
    return max([0] + end_times)
def plot_piano_roll(inst_midi):
    """Draw one piano-roll subplot per instrument and return the figure.

    inst_midi must provide ``instruments`` (each with ``notes`` and ``name``)
    and ``get_beats()`` -- presumably a pretty_midi.PrettyMIDI object; confirm
    against the caller.

    Each note is drawn as a horizontal segment from note.start to note.end at
    its pitch. Vertical lines mark every 4th beat (4 beats per bar is assumed)
    and horizontal lines mark every 12 semitones.
    """
    n_tracks = len(inst_midi.instruments)
    piano_roll_fig = plt.figure(figsize=(25, 3 * n_tracks))
    piano_roll_fig.tight_layout()
    piano_roll_fig.patch.set_alpha(0.1)
    beats_per_bar = 4
    sec_per_beat = 0.5

    # Query the beat grid once instead of three times.
    beats = inst_midi.get_beats()
    # With fewer than two beats there is no spacing to measure; fall back to
    # the nominal beat duration instead of raising IndexError.
    beat_step = np.diff(beats)[0] if len(beats) > 1 else sec_per_beat
    last_beat = max(beats) if len(beats) > 0 else 0
    next_beat = last_beat + beat_step
    # Every beats_per_bar-th beat, truncated to integers, plus one closing bar line
    bars_time = np.append(beats, next_beat)[::beats_per_bar].astype(int)
    octaves = np.arange(0, 128, 12)

    for inst_count, inst in enumerate(inst_midi.instruments, start=1):
        plt.subplot(n_tracks, 1, inst_count)
        for bar in bars_time:
            plt.axvline(bar, color="grey", linewidth=0.5)
        for octave in octaves:
            plt.axhline(octave, color="grey", linewidth=0.5)
        plt.yticks(octaves, visible=False)

        # One [start, end] / [pitch, pitch] pair per note; transposed below so
        # that every note becomes its own line segment.
        note_time = [[note.start, note.end] for note in inst.notes]
        note_pitch = [[note.pitch, note.pitch] for note in inst.notes]
        plt.plot(
            np.array(note_time).T,
            np.array(note_pitch).T,
            color="purple",
            linewidth=3,
            solid_capstyle="butt",
        )
        plt.ylim(0, 128)
        xticks = np.array(bars_time)[:-1]
        plt.tight_layout()
        plt.xlim(min(bars_time), max(bars_time))
        # plt.xlabel("bars")
        plt.xticks(
            xticks + 0.5 * beats_per_bar * sec_per_beat,
            labels=xticks.argsort() + 1,
            visible=False,
        )
        plt.title(inst.name, fontsize=10, color="white")
    return piano_roll_fig

requirements.txt CHANGED Viewed

@@ -2,4 +2,19 @@ gradio
 matplotlib
 sys
 matplotlib
-numpy

 matplotlib
 sys
 matplotlib
+numpy
+joblib
+pathlib
+random
+transformers
+os
+miditok
+librosa
+pretty_midi
+pydub
+shutil
+scipy
+zipfile
+time
+json
+datetime