Model save

Files changed (4) hide show

README.md CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 library_name: peft
 license: llama3.2
-base_model: meta-llama/Llama-3.2-90B-Vision-Instruct
 tags:
 - generated_from_trainer
 model-index:
@@ -14,7 +14,7 @@ should probably proofread and complete it, then remove this comment. -->
 # vision
-This model is a fine-tuned version of [meta-llama/Llama-3.2-90B-Vision-Instruct](https://huggingface.co/meta-llama/Llama-3.2-90B-Vision-Instruct) on the None dataset.
 ## Model description
@@ -50,8 +50,8 @@ The following hyperparameters were used during training:
 ### Framework versions
-- PEFT 0.14.0
-- Transformers 4.48.1
 - Pytorch 2.5.1+cu124
-- Datasets 3.2.0
-- Tokenizers 0.21.0

 ---
 library_name: peft
 license: llama3.2
+base_model: meta-llama/Llama-3.2-11B-Vision-Instruct
 tags:
 - generated_from_trainer
 model-index:
 # vision
+This model is a fine-tuned version of [meta-llama/Llama-3.2-11B-Vision-Instruct](https://huggingface.co/meta-llama/Llama-3.2-11B-Vision-Instruct) on the None dataset.
 ## Model description
 ### Framework versions
+- PEFT 0.13.2
+- Transformers 4.46.3
 - Pytorch 2.5.1+cu124
+- Datasets 3.1.0
+- Tokenizers 0.20.3

adapter_config.json CHANGED Viewed

@@ -4,10 +4,8 @@
     "base_model_class": "MllamaForConditionalGeneration",
     "parent_library": "transformers.models.mllama.modeling_mllama"
   },
-  "base_model_name_or_path": "meta-llama/Llama-3.2-90B-Vision-Instruct",
   "bias": "none",
-  "eva_config": null,
-  "exclude_modules": null,
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": "gaussian",
@@ -16,7 +14,6 @@
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 8,
-  "lora_bias": false,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
@@ -28,11 +25,11 @@
   "target_modules": [
     "gate_proj",
     "up_proj",
-    "k_proj",
-    "down_proj",
     "q_proj",
     "v_proj",
-    "o_proj"
   ],
   "task_type": null,
   "use_dora": true,

     "base_model_class": "MllamaForConditionalGeneration",
     "parent_library": "transformers.models.mllama.modeling_mllama"
   },
+  "base_model_name_or_path": "meta-llama/Llama-3.2-11B-Vision-Instruct",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": "gaussian",
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 8,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "target_modules": [
     "gate_proj",
     "up_proj",
     "q_proj",
     "v_proj",
+    "o_proj",
+    "k_proj",
+    "down_proj"
   ],
   "task_type": null,
   "use_dora": true,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77b2d889f8671542c22f7522191e50ab8989cfcc48f24095bb92bdc0ec0f1ffe
-size 565641552

 version https://git-lfs.github.com/spec/v1
+oid sha256:af7e0261e0f7942215af169e23eb2291a4ffce338e146a0e2427a1a2acb12bdb
+size 125866776

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7be3a410baf9a3d96121d993ef6297c0d25f808a13b4c6b6bfd17be030bad9ee
 size 5304

 version https://git-lfs.github.com/spec/v1
+oid sha256:a469ffaf805a2747162fca45504aee937e08babf4949c6179b44ad1608a95574
 size 5304