Training in progress, step 500

Files changed (5) hide show

config.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
-  "_name_or_path": "/home/edgeai/DeepSpeedExamples/training/autotuning/hf/gpt2-large/saved_based_exaone_block1024_Batch1_Rank28_last_layer_save/",
   "activation_function": "silu",
   "architectures": [
     "ExaoneTDForCausalLM"
   ],
   "attention_dropout": 0.0,
   "auto_map": {
-    "AutoConfig": "configuration_exaone.ExaoneConfig",
     "AutoModelForCausalLM": "LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct--modeling_exaone.ExaoneForCausalLM",
     "AutoModelForSequenceClassification": "LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct--modeling_exaone.ExaoneForSequenceClassification"
   },
@@ -32,7 +32,7 @@
     "rope_type": "llama3"
   },
   "rope_theta": 1000000,
-  "torch_dtype": "bfloat16",
   "transformers_version": "4.48.2",
   "use_cache": true,
   "vocab_size": 102400

 {
+  "_name_or_path": "/home/edgeai/rlhf/EXAONE_Decomposition/saved_based_exaone_block1024_Batch1_Rank28_last_layer_save",
   "activation_function": "silu",
   "architectures": [
     "ExaoneTDForCausalLM"
   ],
   "attention_dropout": 0.0,
   "auto_map": {
+    "AutoConfig": "LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct--configuration_exaone.ExaoneConfig",
     "AutoModelForCausalLM": "LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct--modeling_exaone.ExaoneForCausalLM",
     "AutoModelForSequenceClassification": "LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct--modeling_exaone.ExaoneForSequenceClassification"
   },
     "rope_type": "llama3"
   },
   "rope_theta": 1000000,
+  "torch_dtype": "float16",
   "transformers_version": "4.48.2",
   "use_cache": true,
   "vocab_size": 102400

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:25648d41b9c4841adda4184fcc5469ff03a925525b5b09785894013cab8629ae
-size 634692008

 version https://git-lfs.github.com/spec/v1
+oid sha256:2923be8ed2dbeefaa47b41012388622f63d58024e3e609fbe71e5563ebfb763b
+size 634690960

runs/Mar06_16-46-00_bizon3/events.out.tfevents.1741308444.bizon3.2149916.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a9ee2cf25e5d42545e722811d698e93c27239ed09c2e82c026fd8bdd7132d1f
+size 534292

tokenizer.json CHANGED Viewed

@@ -1,6 +1,11 @@
 {
   "version": "1.0",
-  "truncation": null,
   "padding": null,
   "added_tokens": [
     {

 {
   "version": "1.0",
+  "truncation": {
+    "direction": "Right",
+    "max_length": 256,
+    "strategy": "LongestFirst",
+    "stride": 0
+  },
   "padding": null,
   "added_tokens": [
     {

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:356ad0a2f4757b2366d7565d0d097a2fbe122abbb7914bbd6acf189a1bd315b1
 size 7480

 version https://git-lfs.github.com/spec/v1
+oid sha256:00aec0357b99ec54ee52e47674ca67ee2873f77aa26885becdd6728a1c140625
 size 7480