Spaces:

asigalov61
/

Orpheus-Music-Transformer

Running on Zero

App Files Community

asigalov61 committed on Jun 11

Commit

419ed32

verified ·

1 Parent(s): 19ed5a0

Update app.py

Browse files

Files changed (1) hide show

app.py +7 -21

app.py CHANGED Viewed

@@ -32,9 +32,9 @@ from x_transformer_2_3_1 import TransformerWrapper, AutoregressiveWrapper, Decod
 SEP = '=' * 70
 PDT = timezone('US/Pacific')
-MODEL_CHECKPOINT = 'Orpheus_Music_Transformer_No_Velocity_Trained_Model_21113_steps_0.3454_loss_0.895_acc.pth'
 SOUDFONT_PATH = 'SGM-v2.01-YamahaGrand-Guit-Bass-v2.7.sf2'
-NUM_OUT_BATCHES = 12
 PREVIEW_LENGTH = 120  # in tokens
 # -----------------------------
@@ -77,15 +77,15 @@ dtype = 'bfloat16'
 ptdtype = {'bfloat16': torch.bfloat16, 'float16': torch.float16}[dtype]
 ctx = torch.amp.autocast(device_type=device_type, dtype=ptdtype)
-SEQ_LEN = 4096
-PAD_IDX = 384
 model = TransformerWrapper(
     num_tokens=PAD_IDX + 1,
     max_seq_len=SEQ_LEN,
     attn_layers=Decoder(
         dim=2048,
-        depth=16,
         heads=32,
         rotary_pos_emb=True,
         attn_flash=True
@@ -246,14 +246,6 @@ def generate_music_and_state(input_midi, num_prime_tokens, num_gen_tokens, num_m
         final_composition = load_midi(input_midi)[:num_prime_tokens]
         midi_fname, midi_score = save_midi(final_composition)
         # Use the last note's time as a marker.
-        TMIDIX.Tegridy_ms_SONG_to_MIDI_Converter(
-            midi_score,
-            output_signature='Orpheus Music Transformer',
-            output_file_name=midi_fname,
-            track_name='Project Los Angeles',
-            list_of_MIDI_patches=[0]*16,
-            verbose=False
-        )
         block_lines.append(midi_score[-1][1] / 1000 if final_composition else 0)
     batched_gen_tokens = generate_music(final_composition, num_gen_tokens, num_mem_tokens,
@@ -264,16 +256,10 @@ def generate_music_and_state(input_midi, num_prime_tokens, num_gen_tokens, num_m
         preview_tokens = final_composition[-PREVIEW_LENGTH:]
         midi_fname, midi_score = save_midi(preview_tokens + tokens, batch_number=i)
         plot_kwargs = {'plot_title': f'Batch # {i}', 'return_plt': True}
         if len(final_composition) > PREVIEW_LENGTH:
             plot_kwargs['preview_length_in_notes'] = len([t for t in preview_tokens if t > 256])
-        TMIDIX.Tegridy_ms_SONG_to_MIDI_Converter(
-            midi_score,
-            output_signature='Orpheus Music Transformer',
-            output_file_name=midi_fname,
-            track_name='Project Los Angeles',
-            list_of_MIDI_patches=[0]*16,
-            verbose=False
-        )
         midi_plot = TMIDIX.plot_ms_SONG(midi_score, **plot_kwargs)
         midi_audio = midi_to_colab_audio(midi_fname + '.mid',
                                          soundfont_path=SOUDFONT_PATH,

 SEP = '=' * 70
 PDT = timezone('US/Pacific')
+MODEL_CHECKPOINT = 'Orpheus_Music_Transformer_Trained_Model_26002_steps_0.4232_loss_0.877_acc.pth'
 SOUDFONT_PATH = 'SGM-v2.01-YamahaGrand-Guit-Bass-v2.7.sf2'
+NUM_OUT_BATCHES = 8
 PREVIEW_LENGTH = 120  # in tokens
 # -----------------------------
 ptdtype = {'bfloat16': torch.bfloat16, 'float16': torch.float16}[dtype]
 ctx = torch.amp.autocast(device_type=device_type, dtype=ptdtype)
+SEQ_LEN = 8192
+PAD_IDX = 18819
 model = TransformerWrapper(
     num_tokens=PAD_IDX + 1,
     max_seq_len=SEQ_LEN,
     attn_layers=Decoder(
         dim=2048,
+        depth=8,
         heads=32,
         rotary_pos_emb=True,
         attn_flash=True
         final_composition = load_midi(input_midi)[:num_prime_tokens]
         midi_fname, midi_score = save_midi(final_composition)
         # Use the last note's time as a marker.
         block_lines.append(midi_score[-1][1] / 1000 if final_composition else 0)
     batched_gen_tokens = generate_music(final_composition, num_gen_tokens, num_mem_tokens,
         preview_tokens = final_composition[-PREVIEW_LENGTH:]
         midi_fname, midi_score = save_midi(preview_tokens + tokens, batch_number=i)
         plot_kwargs = {'plot_title': f'Batch # {i}', 'return_plt': True}
         if len(final_composition) > PREVIEW_LENGTH:
             plot_kwargs['preview_length_in_notes'] = len([t for t in preview_tokens if t > 256])
         midi_plot = TMIDIX.plot_ms_SONG(midi_score, **plot_kwargs)
         midi_audio = midi_to_colab_audio(midi_fname + '.mid',
                                          soundfont_path=SOUDFONT_PATH,