YuE-music-generator-demo-zero

Paused

KingNish committed on Jan 30

Commit

a75bb02

verified ·

1 Parent(s): b0328a4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -97,12 +97,7 @@ model = AutoModelForCausalLM.from_pretrained(
     attn_implementation="flash_attention_2",  # To enable flashattn, you have to install flash-attn
 ).to(device)
 model.eval()
-# Apply dynamic quantization
-model = torch.quantization.quantize_dynamic(
-    model, {torch.nn.Linear}, dtype=torch.qint8
-).to(device)
-model.eval()
 basic_model_config = './xcodec_mini_infer/final_ckpt/config.yaml'
 resume_path = './xcodec_mini_infer/final_ckpt/ckpt_00360000.pth'

     attn_implementation="flash_attention_2",  # To enable flashattn, you have to install flash-attn
 ).to(device)
 model.eval()
+# gonna use either gguf or vllm later
 basic_model_config = './xcodec_mini_infer/final_ckpt/config.yaml'
 resume_path = './xcodec_mini_infer/final_ckpt/ckpt_00360000.pth'