Spaces:
Running
on
A100
Running
on
A100
Optimized for speed (#7)
Browse files
- A patch of transformers (98915f7a2db0b5b80c135c8ee021c7e73f0488ab)
- Increased stage 2 batch size (c9e6e07806ab611efa8e609c110db1d450a450fa)
- Flash Attention 2 only supports fp16 (e5ae04a10082bfbc1f23931af7e09b9745cc3ae1)
Co-authored-by: Nishith Jain <[email protected]>
- app.py +1 -1
- inference/infer.py +1 -1
- requirements.txt +1 -1
app.py
CHANGED
@@ -124,7 +124,7 @@ def infer(genre_txt_content, lyrics_txt_content, num_segments, max_new_tokens):
|
|
124 |
"--genre_txt", f"{genre_txt_path}",
|
125 |
"--lyrics_txt", f"{lyrics_txt_path}",
|
126 |
"--run_n_segments", str(num_segments),
|
127 |
-
"--stage2_batch_size", "…",  [value truncated in extraction — original batch size not recoverable from this page]
|
128 |
"--output_dir", f"{output_dir}",
|
129 |
"--cuda_idx", "0",
|
130 |
"--max_new_tokens", str(max_new_tokens)
|
|
|
124 |
"--genre_txt", f"{genre_txt_path}",
|
125 |
"--lyrics_txt", f"{lyrics_txt_path}",
|
126 |
"--run_n_segments", str(num_segments),
|
127 |
+
"--stage2_batch_size", "16",
|
128 |
"--output_dir", f"{output_dir}",
|
129 |
"--cuda_idx", "0",
|
130 |
"--max_new_tokens", str(max_new_tokens)
|
inference/infer.py
CHANGED
@@ -76,7 +76,7 @@ print(f"Using device: {device}")
|
|
76 |
mmtokenizer = _MMSentencePieceTokenizer("./mm_tokenizer_v0.2_hf/tokenizer.model")
|
77 |
model = AutoModelForCausalLM.from_pretrained(
|
78 |
stage1_model,
|
79 |
-
torch_dtype=torch.bfloat16,  [line truncated in extraction; per the commit note "Flash Attention 2 only supports fp16", the prior dtype was not fp16 — presumably bfloat16, to be confirmed against commit e5ae04a]
|
80 |
attn_implementation="flash_attention_2", # To enable flashattn, you have to install flash-attn
|
81 |
)
|
82 |
model.to(device)
|
|
|
76 |
mmtokenizer = _MMSentencePieceTokenizer("./mm_tokenizer_v0.2_hf/tokenizer.model")
|
77 |
model = AutoModelForCausalLM.from_pretrained(
|
78 |
stage1_model,
|
79 |
+
torch_dtype=torch.float16,
|
80 |
attn_implementation="flash_attention_2", # To enable flashattn, you have to install flash-attn
|
81 |
)
|
82 |
model.to(device)
|
requirements.txt
CHANGED
@@ -3,7 +3,7 @@ torchaudio==2.2.0 --index-url https://download.pytorch.org/whl/cu118
|
|
3 |
omegaconf
|
4 |
einops
|
5 |
numpy<2
|
6 |
-
transformers
|
7 |
sentencepiece
|
8 |
tqdm
|
9 |
tensorboard
|
|
|
3 |
omegaconf
|
4 |
einops
|
5 |
numpy<2
|
6 |
+
git+https://github.com/KingNish24/transformers.git@yue-patch
|
7 |
sentencepiece
|
8 |
tqdm
|
9 |
tensorboard
|