Training in progress, step 14
This view is limited to 50 files because it contains too many changes.
- config.json +62 -0
- model.safetensors +3 -0
- run-0/checkpoint-14/config.json +62 -0
- run-0/checkpoint-14/model.safetensors +3 -0
- run-0/checkpoint-14/optimizer.pt +3 -0
- run-0/checkpoint-14/rng_state.pth +3 -0
- run-0/checkpoint-14/scheduler.pt +3 -0
- run-0/checkpoint-14/special_tokens_map.json +7 -0
- run-0/checkpoint-14/tokenizer.json +0 -0
- run-0/checkpoint-14/tokenizer_config.json +56 -0
- run-0/checkpoint-14/trainer_state.json +47 -0
- run-0/checkpoint-14/training_args.bin +3 -0
- run-0/checkpoint-14/vocab.txt +0 -0
- run-0/checkpoint-20/config.json +63 -0
- run-0/checkpoint-20/model.safetensors +3 -0
- run-0/checkpoint-20/optimizer.pt +3 -0
- run-0/checkpoint-20/rng_state.pth +3 -0
- run-0/checkpoint-20/scheduler.pt +3 -0
- run-0/checkpoint-20/special_tokens_map.json +7 -0
- run-0/checkpoint-20/tokenizer.json +0 -0
- run-0/checkpoint-20/tokenizer_config.json +56 -0
- run-0/checkpoint-20/trainer_state.json +74 -0
- run-0/checkpoint-20/training_args.bin +3 -0
- run-0/checkpoint-20/vocab.txt +0 -0
- run-1/checkpoint-12/config.json +63 -0
- run-1/checkpoint-12/model.safetensors +3 -0
- run-1/checkpoint-12/optimizer.pt +3 -0
- run-1/checkpoint-12/rng_state.pth +3 -0
- run-1/checkpoint-12/scheduler.pt +3 -0
- run-1/checkpoint-12/special_tokens_map.json +7 -0
- run-1/checkpoint-12/tokenizer.json +0 -0
- run-1/checkpoint-12/tokenizer_config.json +56 -0
- run-1/checkpoint-12/trainer_state.json +56 -0
- run-1/checkpoint-12/training_args.bin +3 -0
- run-1/checkpoint-12/vocab.txt +0 -0
- run-2/checkpoint-8/config.json +63 -0
- run-2/checkpoint-8/model.safetensors +3 -0
- run-2/checkpoint-8/optimizer.pt +3 -0
- run-2/checkpoint-8/rng_state.pth +3 -0
- run-2/checkpoint-8/scheduler.pt +3 -0
- run-2/checkpoint-8/special_tokens_map.json +7 -0
- run-2/checkpoint-8/tokenizer.json +0 -0
- run-2/checkpoint-8/tokenizer_config.json +56 -0
- run-2/checkpoint-8/trainer_state.json +47 -0
- run-2/checkpoint-8/training_args.bin +3 -0
- run-2/checkpoint-8/vocab.txt +0 -0
- special_tokens_map.json +7 -0
- tokenizer.json +0 -0
- tokenizer_config.json +56 -0
- training_args.bin +3 -0
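
The run-{trial}/checkpoint-{step} layout above is what the transformers Trainer writes during a hyperparameter search. A minimal sketch of the kind of call that produces it, assuming a tokenized train_ds/eval_ds and an accuracy metric (none of which are recorded in this commit):

import numpy as np
from transformers import (AutoModelForSequenceClassification, Trainer,
                          TrainingArguments)

def model_init():
    # 16 legal-topic labels, matching id2label in config.json below
    return AutoModelForSequenceClassification.from_pretrained(
        "distilbert-base-cased", num_labels=16)

def compute_metrics(pred):
    # produces the eval_accuracy values seen in trainer_state.json
    preds = np.argmax(pred.predictions, axis=1)
    return {"accuracy": float((preds == pred.label_ids).mean())}

trainer = Trainer(
    model_init=model_init,
    args=TrainingArguments(output_dir=".", eval_strategy="epoch"),
    train_dataset=train_ds,   # hypothetical tokenized datasets
    eval_dataset=eval_ds,
    compute_metrics=compute_metrics,
)
best = trainer.hyperparameter_search(direction="maximize", n_trials=3)
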
config.json
ADDED
@@ -0,0 +1,62 @@
+{
+  "_name_or_path": "distilbert-base-cased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "id2label": {
+    "0": "business",
+    "1": "civil-law",
+    "2": "constitutional-law",
+    "3": "contract",
+    "4": "contract-law",
+    "5": "copyright",
+    "6": "criminal-law",
+    "7": "employment",
+    "8": "intellectual-property",
+    "9": "internet",
+    "10": "liability",
+    "11": "licensing",
+    "12": "privacy",
+    "13": "software",
+    "14": "tax-law",
+    "15": "trademark"
+  },
+  "initializer_range": 0.02,
+  "label2id": {
+    "business": 0,
+    "civil-law": 1,
+    "constitutional-law": 2,
+    "contract": 3,
+    "contract-law": 4,
+    "copyright": 5,
+    "criminal-law": 6,
+    "employment": 7,
+    "intellectual-property": 8,
+    "internet": 9,
+    "liability": 10,
+    "licensing": 11,
+    "privacy": 12,
+    "software": 13,
+    "tax-law": 14,
+    "trademark": 15
+  },
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "output_past": true,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.47.1",
+  "vocab_size": 28996
+}
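
The config above describes a DistilBERT sequence classifier over 16 legal-topic labels. As a sketch (assuming the LFS weights have been pulled), the exported model can be exercised from the repo root:

from transformers import pipeline

clf = pipeline("text-classification", model=".")  # "." = this repo checkout
# prints one of the 16 labels from id2label with its score
print(clf("The employer terminated the agreement without notice."))
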
model.safetensors
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a70896cda70c39157466e77a386e43d614d7340d26d1719e4aa7130a3a66c35
+size 263187752
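
The three lines above are a Git LFS pointer, not the tensors themselves; git lfs pull fetches the real 263 MB file. Once it is materialized, a sketch for inspecting the weights:

from safetensors import safe_open

with safe_open("model.safetensors", framework="pt") as f:
    for name in f.keys():
        # print each tensor name and its shape without loading full weights
        print(name, f.get_slice(name).get_shape())
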
run-0/checkpoint-14/config.json
ADDED
@@ -0,0 +1,62 @@
+{
+  "_name_or_path": "distilbert-base-cased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "id2label": {
+    "0": "business",
+    "1": "civil-law",
+    "2": "constitutional-law",
+    "3": "contract",
+    "4": "contract-law",
+    "5": "copyright",
+    "6": "criminal-law",
+    "7": "employment",
+    "8": "intellectual-property",
+    "9": "internet",
+    "10": "liability",
+    "11": "licensing",
+    "12": "privacy",
+    "13": "software",
+    "14": "tax-law",
+    "15": "trademark"
+  },
+  "initializer_range": 0.02,
+  "label2id": {
+    "business": 0,
+    "civil-law": 1,
+    "constitutional-law": 2,
+    "contract": 3,
+    "contract-law": 4,
+    "copyright": 5,
+    "criminal-law": 6,
+    "employment": 7,
+    "intellectual-property": 8,
+    "internet": 9,
+    "liability": 10,
+    "licensing": 11,
+    "privacy": 12,
+    "software": 13,
+    "tax-law": 14,
+    "trademark": 15
+  },
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "output_past": true,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.47.1",
+  "vocab_size": 28996
+}
run-0/checkpoint-14/model.safetensors
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1a70896cda70c39157466e77a386e43d614d7340d26d1719e4aa7130a3a66c35
+size 263187752
run-0/checkpoint-14/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:25b2494ab1b9dac2e6484e9d3478241e16951cdd84a8149adac7ac0685da688f
+size 526434810
run-0/checkpoint-14/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1c0060471a9340f7cc602c9a86d1d9d308db5b4a83df50147b0235d18be03463
+size 13990
run-0/checkpoint-14/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:27c53eed2722d60729f122e697a32e584798b0e53daf02ec90e6986cd0796210
+size 1064
run-0/checkpoint-14/special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}
run-0/checkpoint-14/tokenizer.json
ADDED
The diff for this file is too large to render.
run-0/checkpoint-14/tokenizer_config.json
ADDED
@@ -0,0 +1,56 @@
+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}
run-0/checkpoint-14/trainer_state.json
ADDED
@@ -0,0 +1,47 @@
+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 14,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.32,
+      "eval_loss": 2.4279966354370117,
+      "eval_runtime": 17.893,
+      "eval_samples_per_second": 2.794,
+      "eval_steps_per_second": 0.391,
+      "step": 7
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 14,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 0.0003461152202579902,
+    "num_train_epochs": 2,
+    "per_device_train_batch_size": 8,
+    "weight_decay": 0.014902312802435893
+  }
+}
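
The trial_params above (and those in run-1 and run-2) are consistent with an Optuna-style search space along these lines; the exact ranges are an assumption, since the search definition is not part of this commit:

def hp_space(trial):
    # passed as trainer.hyperparameter_search(hp_space=hp_space, ...)
    return {
        "learning_rate": trial.suggest_float("learning_rate", 1e-6, 1e-3, log=True),
        "num_train_epochs": trial.suggest_int("num_train_epochs", 2, 5),
        "per_device_train_batch_size": trial.suggest_categorical(
            "per_device_train_batch_size", [8, 16]),
        "weight_decay": trial.suggest_float("weight_decay", 0.01, 0.1),
    }
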
run-0/checkpoint-14/training_args.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c1ed3819cb2fe27bc2256360d46825e1851f5dc0f656a064e111a2321bc7183d
+size 5240
run-0/checkpoint-14/vocab.txt
ADDED
The diff for this file is too large to render.
run-0/checkpoint-20/config.json
ADDED
@@ -0,0 +1,63 @@
+{
+  "_name_or_path": "bert-base-cased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7",
+    "8": "LABEL_8",
+    "9": "LABEL_9",
+    "10": "LABEL_10",
+    "11": "LABEL_11",
+    "12": "LABEL_12",
+    "13": "LABEL_13",
+    "14": "LABEL_14",
+    "15": "LABEL_15"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_10": 10,
+    "LABEL_11": 11,
+    "LABEL_12": 12,
+    "LABEL_13": 13,
+    "LABEL_14": 14,
+    "LABEL_15": 15,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7,
+    "LABEL_8": 8,
+    "LABEL_9": 9
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.47.1",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 28996
+}
run-0/checkpoint-20/model.safetensors
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0b5c78f06d53acb708acbededcab71be33db1f82befa21988d544cf84e01a340
+size 433313832
run-0/checkpoint-20/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ebdba344973f22ac06783a08cb9d50a765090a0451d50ceee301dfe9109d9a6c
+size 866743162
run-0/checkpoint-20/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9a5e70f9a75e0aac0493ef5d71898140525e32ebc99cfd539bb3be380e6c5d74
+size 13990
run-0/checkpoint-20/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f443f63848e306442cd3d7354d278af7ad02b517bd970aab51ae156d07ab0146
+size 1064
run-0/checkpoint-20/special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}
run-0/checkpoint-20/tokenizer.json
ADDED
The diff for this file is too large to render.
run-0/checkpoint-20/tokenizer_config.json
ADDED
@@ -0,0 +1,56 @@
+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}
run-0/checkpoint-20/trainer_state.json
ADDED
@@ -0,0 +1,74 @@
+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 20,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.32,
+      "eval_loss": 2.5643558502197266,
+      "eval_runtime": 390.6347,
+      "eval_samples_per_second": 0.128,
+      "eval_steps_per_second": 0.018,
+      "step": 4
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.04,
+      "eval_loss": 2.9646835327148438,
+      "eval_runtime": 34.0619,
+      "eval_samples_per_second": 1.468,
+      "eval_steps_per_second": 0.206,
+      "step": 8
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.32,
+      "eval_loss": 2.424799680709839,
+      "eval_runtime": 36.2929,
+      "eval_samples_per_second": 1.378,
+      "eval_steps_per_second": 0.193,
+      "step": 12
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.32,
+      "eval_loss": 2.441561460494995,
+      "eval_runtime": 37.5071,
+      "eval_samples_per_second": 1.333,
+      "eval_steps_per_second": 0.187,
+      "step": 16
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 20,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 0.0003155201980058913,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 16,
+    "weight_decay": 0.08349846837378451
+  }
+}
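
This trial ran five epochs with an eval pass per epoch; the per-epoch metrics live in log_history and can be tabulated with a few lines (a sketch, run from the repo root):

import json

with open("run-0/checkpoint-20/trainer_state.json") as f:
    state = json.load(f)
for rec in state["log_history"]:
    # one row per recorded eval pass
    print(rec["epoch"], rec.get("eval_accuracy"), rec.get("eval_loss"))
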
run-0/checkpoint-20/training_args.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:416fa693723afbe856dcf1cebbf9340c6ae11df99f25c7e0b635d211fd4eee07
+size 5240
run-0/checkpoint-20/vocab.txt
ADDED
The diff for this file is too large to render.
run-1/checkpoint-12/config.json
ADDED
@@ -0,0 +1,63 @@
+{
+  "_name_or_path": "bert-base-cased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7",
+    "8": "LABEL_8",
+    "9": "LABEL_9",
+    "10": "LABEL_10",
+    "11": "LABEL_11",
+    "12": "LABEL_12",
+    "13": "LABEL_13",
+    "14": "LABEL_14",
+    "15": "LABEL_15"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_10": 10,
+    "LABEL_11": 11,
+    "LABEL_12": 12,
+    "LABEL_13": 13,
+    "LABEL_14": 14,
+    "LABEL_15": 15,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7,
+    "LABEL_8": 8,
+    "LABEL_9": 9
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.47.1",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 28996
+}
run-1/checkpoint-12/model.safetensors
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:30520ddf055b0086a5163e36b5ada08bd1c3e9a6f51e2571fa49704ca27339ea
+size 433313832
run-1/checkpoint-12/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ac0234d7747b84c444f6eeb87ec5b8551c1e637989c561c85a404a7e66dad78a
+size 866743162
run-1/checkpoint-12/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:59cc0ca17123db86667fe2b999dc4d45bc2292f0becb83d9a367470fdcfcb14d
+size 13990
run-1/checkpoint-12/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7e3d6714bfd9178c1fcd6acd23754c8b42175fb1c04f634c3dec9fe783e15bda
+size 1064
run-1/checkpoint-12/special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}
run-1/checkpoint-12/tokenizer.json
ADDED
The diff for this file is too large to render.
run-1/checkpoint-12/tokenizer_config.json
ADDED
@@ -0,0 +1,56 @@
+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}
run-1/checkpoint-12/trainer_state.json
ADDED
@@ -0,0 +1,56 @@
+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 12,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.06,
+      "eval_loss": 2.7594950199127197,
+      "eval_runtime": 33.7649,
+      "eval_samples_per_second": 1.481,
+      "eval_steps_per_second": 0.207,
+      "step": 4
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.08,
+      "eval_loss": 2.6855175495147705,
+      "eval_runtime": 36.3771,
+      "eval_samples_per_second": 1.374,
+      "eval_steps_per_second": 0.192,
+      "step": 8
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 12,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 3.057465826568694e-05,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 16,
+    "weight_decay": 0.03723974867102458
+  }
+}
run-1/checkpoint-12/training_args.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a57174aa6cf65fa9f420f1adf1f57db12599f6d01b36cbb0bd8ebf327a14f28e
+size 5240
run-1/checkpoint-12/vocab.txt
ADDED
The diff for this file is too large to render.
run-2/checkpoint-8/config.json
ADDED
@@ -0,0 +1,63 @@
+{
+  "_name_or_path": "bert-base-cased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6",
+    "7": "LABEL_7",
+    "8": "LABEL_8",
+    "9": "LABEL_9",
+    "10": "LABEL_10",
+    "11": "LABEL_11",
+    "12": "LABEL_12",
+    "13": "LABEL_13",
+    "14": "LABEL_14",
+    "15": "LABEL_15"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_10": 10,
+    "LABEL_11": 11,
+    "LABEL_12": 12,
+    "LABEL_13": 13,
+    "LABEL_14": 14,
+    "LABEL_15": 15,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5,
+    "LABEL_6": 6,
+    "LABEL_7": 7,
+    "LABEL_8": 8,
+    "LABEL_9": 9
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.47.1",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 28996
+}
|
run-2/checkpoint-8/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d0ff9d7553e5f401f66acc306718599e93884dd508d791993f33833deb328ca
|
3 |
+
size 433313832
|
run-2/checkpoint-8/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:454214c0144d04c453ea1d2ec2b5a7df1c3423f6818f9756a14284705fa8283a
+size 866743162
run-2/checkpoint-8/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:feb9296950c146245afd5a3147821b22e6313de8735f850c30a3188a431ebf85
+size 13990
run-2/checkpoint-8/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af27b588f87c0fb3db5b0d16c4f98bbfbf7bb779576355ce3f3345eaaa70abdc
+size 1064
run-2/checkpoint-8/special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}
run-2/checkpoint-8/tokenizer.json
ADDED
The diff for this file is too large to render.
run-2/checkpoint-8/tokenizer_config.json
ADDED
@@ -0,0 +1,56 @@
+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}
run-2/checkpoint-8/trainer_state.json
ADDED
@@ -0,0 +1,47 @@
+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 8,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.08,
+      "eval_loss": 2.832538366317749,
+      "eval_runtime": 34.3925,
+      "eval_samples_per_second": 1.454,
+      "eval_steps_per_second": 0.204,
+      "step": 4
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 8,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.2303999115294106e-05,
+    "num_train_epochs": 2,
+    "per_device_train_batch_size": 16,
+    "weight_decay": 0.08430555410163074
+  }
+}
run-2/checkpoint-8/training_args.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6e6eda4fffe5514c3c46c347e7e1ea3b00ffee475601396824284afe9850a3a9
+size 5240
run-2/checkpoint-8/vocab.txt
ADDED
The diff for this file is too large to render.
special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}
tokenizer.json
ADDED
The diff for this file is too large to render.
tokenizer_config.json
ADDED
@@ -0,0 +1,56 @@
+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}
training_args.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c1ed3819cb2fe27bc2256360d46825e1851f5dc0f656a064e111a2321bc7183d
+size 5240
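
training_args.bin holds the pickled TrainingArguments for the final run; a sketch for inspecting it (weights_only=False is needed on newer torch releases because this is an arbitrary pickled object, not a tensor file):

import torch

args = torch.load("training_args.bin", weights_only=False)
print(args.learning_rate, args.num_train_epochs, args.per_device_train_batch_size)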