debisoft committed on
Commit
8673db4
·
1 Parent(s): 030c37e
Files changed (1) hide show
  1. app.py +31 -5
app.py CHANGED
@@ -4,13 +4,39 @@ import os
4
  import spaces
5
  import torch
6
 
7
- from transformers import AutoTokenizer, AutoModelForCausalLM
 
 
8
 
9
  huggingface_hub.login(os.getenv('HF_TOKEN'))
10
- tokenizer = AutoTokenizer.from_pretrained("deepseek-ai/DeepSeek-R1-Distill-Qwen-7B")
11
- model = AutoModelForCausalLM.from_pretrained("deepseek-ai/DeepSeek-R1-Distill-Qwen-7B")
12
- cuda_device = torch.device("cuda")
13
- cpu_device = torch.device("cpu")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14
 
15
  @spaces.GPU
16
  def sentience_check():
 
4
  import spaces
5
  import torch
6
 
7
+ from peft import PeftModel, PeftConfig
8
+ from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, Qwen2_5_VLForConditionalGeneration
9
+ from datasets import load_dataset
10
 
11
  huggingface_hub.login(os.getenv('HF_TOKEN'))
12
+ peft_model_id = "debisoft/Qwen2.5-VL-3B-Instruct-thinking-function_calling-V0"
13
+
14
+ bnb_config = BitsAndBytesConfig(
15
+ load_in_4bit=True,
16
+ bnb_4bit_quant_type="nf4",
17
+ bnb_4bit_compute_dtype=torch.bfloat16,
18
+ bnb_4bit_use_double_quant=True,
19
+ )
20
+
21
+ device = "auto"
22
+ config = PeftConfig.from_pretrained(peft_model_id)
23
+ model = Qwen2_5_VLForConditionalGeneration.from_pretrained(config.base_model_name_or_path,
24
+ #AutoModelForCausalLM.from_pretrained(config.base_model_name_or_path,
25
+ quantization_config=bnb_config,
26
+ device_map="auto",
27
+ )
28
+ tokenizer = AutoTokenizer.from_pretrained(peft_model_id)
29
+ model.resize_token_embeddings(len(tokenizer))
30
+ model = PeftModel.from_pretrained(model, peft_model_id,
31
+ #offload_folder = "offload/"
32
+ )
33
+
34
+ model.to(torch.bfloat16)
35
+ model.eval()
36
+
37
+ #tokenizer = AutoTokenizer.from_pretrained("deepseek-ai/DeepSeek-R1-Distill-Qwen-7B")
38
+ #model = AutoModelForCausalLM.from_pretrained("deepseek-ai/DeepSeek-R1-Distill-Qwen-7B")
39
+
40
 
41
  @spaces.GPU
42
  def sentience_check():