Model save

Files changed (4)

README.md CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 library_name: peft
 license: llama3.2
-base_model: meta-llama/Llama-3.2-11B-Vision-Instruct
 tags:
 - generated_from_trainer
 model-index:
@@ -14,7 +14,7 @@ should probably proofread and complete it, then remove this comment. -->
 # vision
-This model is a fine-tuned version of [meta-llama/Llama-3.2-11B-Vision-Instruct](https://huggingface.co/meta-llama/Llama-3.2-11B-Vision-Instruct) on an unspecified dataset.
 ## Model description
@@ -50,8 +50,8 @@ The following hyperparameters were used during training:
 ### Framework versions
-- PEFT 0.13.2
-- Transformers 4.46.3
 - Pytorch 2.5.1+cu124
-- Datasets 3.1.0
-- Tokenizers 0.20.3

 ---
 library_name: peft
 license: llama3.2
+base_model: meta-llama/Llama-3.2-90B-Vision-Instruct
 tags:
 - generated_from_trainer
 model-index:
 # vision
+This model is a fine-tuned version of [meta-llama/Llama-3.2-90B-Vision-Instruct](https://huggingface.co/meta-llama/Llama-3.2-90B-Vision-Instruct) on an unspecified dataset.
 ## Model description
 ### Framework versions
+- PEFT 0.14.0
+- Transformers 4.48.1
 - Pytorch 2.5.1+cu124
+- Datasets 3.2.0
+- Tokenizers 0.21.0

adapter_config.json CHANGED Viewed

@@ -4,8 +4,10 @@
     "base_model_class": "MllamaForConditionalGeneration",
     "parent_library": "transformers.models.mllama.modeling_mllama"
   },
-  "base_model_name_or_path": "meta-llama/Llama-3.2-11B-Vision-Instruct",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": "gaussian",
@@ -14,6 +16,7 @@
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 8,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
@@ -25,11 +28,11 @@
   "target_modules": [
     "gate_proj",
     "down_proj",
     "v_proj",
     "o_proj",
-    "k_proj",
-    "q_proj",
-    "up_proj"
   ],
   "task_type": null,
   "use_dora": true,

     "base_model_class": "MllamaForConditionalGeneration",
     "parent_library": "transformers.models.mllama.modeling_mllama"
   },
+  "base_model_name_or_path": "meta-llama/Llama-3.2-90B-Vision-Instruct",
   "bias": "none",
+  "eva_config": null,
+  "exclude_modules": null,
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": "gaussian",
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 8,
+  "lora_bias": false,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "target_modules": [
     "gate_proj",
     "down_proj",
+    "k_proj",
+    "up_proj",
     "v_proj",
     "o_proj",
+    "q_proj"
   ],
   "task_type": null,
   "use_dora": true,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:456b96c09ecb0399c2a082195f76b5d6571b96979abad28f29e0a85738a54213
-size 125866776

 version https://git-lfs.github.com/spec/v1
+oid sha256:a7c95bb53697da334a04606a8f35e42c92a0f4a1039f02a4e2c3dbac447ee8bc
+size 565641552

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:544822af527651abd2d3d28d1a662a73e1a67159daa8cd8c0f185664b07ecf86
-size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:0213928de50cc0998c65510c77ba2657b22ec0962a3b330744528cc45d23bd46
+size 5304