Popular-Hook-Transformer

Sleeping

App Files Files Community

asigalov61 committed on Oct 31, 2024

Commit

30ed745

verified ·

1 Parent(s): 07c6c95

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -91

app.py CHANGED Viewed

@@ -48,7 +48,7 @@ def mode_dur(seq):
 def mode_pitch(seq):
     """Return the most common pitch residue among the pitch tokens of *seq*.

     Only tokens strictly between 256 and 512 are considered; each is
     reduced modulo 128 before the mode is taken. ``statistics.mode``
     raises ``statistics.StatisticsError`` when no token qualifies.
     """
     pitch_residues = []
     for token in seq:
         if 256 < token < 512:
             pitch_residues.append(token % 128)
     return statistics.mode(pitch_residues)
-parts_dict = sorted(set([str_strip(s[2]).rstrip('-') for s in melody_chords_f]))
 train_data = []
@@ -58,12 +58,12 @@ for m in tqdm.tqdm(melody_chords_f):
         for tv in range(-3, 3):
-            part = str_strip(m[2])
-            part_tok = parts_dict.index(part)
             score = [t+tv if 256 < t < 512 else t for t in m[5]]
-            seq = [916] + [part_tok+512, mode_time(score)+532, mode_dur(score)+660, mode_pitch(score)+tv+788]
             seq += score
@@ -144,61 +144,6 @@ def Generate_POP_Section(input_parsons_code,
     #===============================================================================
-    print('Instantiating Parsons Code Melody Transformer model...')
-    SEQ_LEN = 322
-    PAD_IDX = 392
-    model = TransformerWrapper(
-        num_tokens = PAD_IDX+1,
-        max_seq_len = SEQ_LEN,
-        attn_layers = Decoder(dim = 1024,
-                              depth = 4,
-                              heads = 8,
-                              rotary_pos_emb = True,
-                              attn_flash = True
-                             )
-        )
-    model = AutoregressiveWrapper(model, ignore_index = PAD_IDX, pad_value=PAD_IDX)
-    print('=' * 70)
-    print('Loading model checkpoint...')
-    model_path = 'Parsons_Code_Melody_Transformer_Trained_Model_13786_steps_0.3058_loss_0.8819_acc.pth'
-    model.load_state_dict(torch.load(model_path, map_location='cpu'))
-    model.cpu()
-    model.eval()
-    dtype = torch.bfloat16
-    ctx = torch.amp.autocast(device_type='cpu', dtype=dtype)
-    print('Done!')
-    print('=' * 70)
-    #===============================================================================
-    print('Prepping Parsons code string...')
-    td_str = re.sub('[^*DRU]', '', input_parsons_code)
-    print(len(td_str))
-    print('=' * 70)
-    if '*' in td_str and len(td_str) > 1:
-      code_mult = (64 // len(td_str[1:]))+1
-      mult_code = ('*' + (td_str[1:] * code_mult))[:64]
-    else:
-      mult_code = '*UUUUUUUDDDDDDDUUUUUUUDDDDDDDUUUUUUUDDDDDDDUUUUUUUDDDDDDDUUUUUUU'
-    pcode = parsons_code_to_tokens(mult_code)
-    print('Done!')
-    print('=' * 70)
     #===============================================================================
@@ -244,31 +189,42 @@ def Generate_POP_Section(input_parsons_code,
     song_f = []
     time = 0
-    dur = 4
     vel = 90
-    pitch = 60
     channel = 0
     for ss in song:
-        if 0 <= ss < 128:
-            time += ss * 32
-        if 128 <= ss < 256:
-            dur = (ss-128) * 32
-        if 256 <= ss < 384:
-            pitch = ss-256
-            song_f.append(['note', time, dur, channel, pitch, vel, 0])
-    fn1 = 'Parsons-Code-Melody-Transformer-Composition'
     detailed_stats = TMIDIX.Tegridy_ms_SONG_to_MIDI_Converter(song_f,
-                                                              output_signature = 'Parsons Code Melody Transformer',
                                                               output_file_name = fn1,
                                                               track_name='Project Los Angeles'
                                                               )
@@ -324,15 +280,14 @@ if __name__ == "__main__":
     with app:
-        gr.Markdown("<h1 style='text-align: center; margin-bottom: 1rem'>Parsons Code Melody Transformer</h1>")
-        gr.Markdown("<h1 style='text-align: center; margin-bottom: 1rem'>Generate unique melodies from Parsons codes</h1>")
         gr.Markdown(
-            "![Visitors](https://api.visitorbadge.io/api/visitors?path=asigalov61.Parsons-Code-Melody-Transformer&style=flat)\n\n"
-            "This is a demo for Clean Melodies subset of Tegridy MIDI Dataset\n\n"
-            "Check out [Tegridy MIDI Dataset](https://github.com/asigalov61/Tegridy-MIDI-Dataset) on GitHub!\n\n"
         )
-        gr.Markdown("## Enter Parsons code:")
         input_parsons_code = gr.Textbox(label="Parsons code",
                                         info="Make sure your Parsons code starts with *",
@@ -340,13 +295,6 @@ if __name__ == "__main__":
                                         value="*"
                                         )
-        clr_btn = gr.ClearButton(components=input_parsons_code)
-        def reset_pcode():
-            return '*'
-        clr_btn.click(reset_pcode, outputs=input_parsons_code)
         gr.Markdown("## Select generation options:")
         input_first_note_duration = gr.Slider(1, 127, value=15, step=1, label="First note duration value")

 def mode_pitch(seq):
     """Return the most common pitch residue among the pitch tokens of *seq*.

     Only tokens strictly between 256 and 512 are considered; each is
     reduced modulo 128 before the mode is taken. ``statistics.mode``
     raises ``statistics.StatisticsError`` when no token qualifies.
     """
     pitch_residues = []
     for token in seq:
         if 256 < token < 512:
             pitch_residues.append(token % 128)
     return statistics.mode(pitch_residues)
+sections_dict = sorted(set([str_strip(s[2]).rstrip('-') for s in melody_chords_f]))
 train_data = []
         for tv in range(-3, 3):
+            section = str_strip(m[2])
+            section_tok = sections_dict.index(part)
             score = [t+tv if 256 < t < 512 else t for t in m[5]]
+            seq = [916] + [section_tok+512, mode_time(score)+532, mode_dur(score)+660, mode_pitch(score)+tv+788]
             seq += score
     #===============================================================================
     #===============================================================================
     song_f = []
     time = 0
+    dur = 0
     vel = 90
+    pitch = 0
     channel = 0
     for ss in song:
+      if 0 <= ss < 128:
+          time += ss * 32
+      if 128 <= ss < 256:
+          dur = (ss-128)* 32
+      if 256 <= ss < 512:
+          pitch = (ss-256) % 128
+          cha = (ss-256) // 128
+          if cha == 0:
+              channel = 3
+              vel = 110
+              patch = 40
+          else:
+              channel = 0
+              vel = 80
+              patch = 0
+          song_f.append(['note', time, dur, channel, pitch, vel, patch ])
+    fn1 = 'Popular-Hook-Transformer-Composition'
     detailed_stats = TMIDIX.Tegridy_ms_SONG_to_MIDI_Converter(song_f,
+                                                              output_signature = 'Popular Hook Transformer',
                                                               output_file_name = fn1,
                                                               track_name='Project Los Angeles'
                                                               )
     with app:
+        gr.Markdown("<h1 style='text-align: center; margin-bottom: 1rem'>Popular Hook Transformer</h1>")
+        gr.Markdown("<h1 style='text-align: center; margin-bottom: 1rem'>Generate unique POP music sections</h1>")
         gr.Markdown(
+            "This is a demo for popular-hook MIDI Dataset\n\n"
+            "Check out [popular-hook](https://huggingface.co/datasets/NEXTLab-ZJU/popular-hook) on Hugging Face!\n\n"
         )
+        gr.Markdown("## Select generation options:")
         input_parsons_code = gr.Textbox(label="Parsons code",
                                         info="Make sure your Parsons code starts with *",
                                         value="*"
                                         )
         gr.Markdown("## Select generation options:")
         input_first_note_duration = gr.Slider(1, 127, value=15, step=1, label="First note duration value")