dafqi committed on
Commit
1944a3f
·
verified ·
1 Parent(s): b067766

Training in progress, step 1386

Browse files
config.json CHANGED
@@ -1,15 +1,16 @@
1
  {
2
- "_name_or_path": "indobenchmark/indobert-large-p2",
3
- "_num_labels": 5,
4
  "architectures": [
5
  "BertForSequenceClassification"
6
  ],
7
  "attention_probs_dropout_prob": 0.1,
 
8
  "classifier_dropout": null,
9
- "directionality": "bidi",
 
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
- "hidden_size": 1024,
13
  "id2label": {
14
  "0": "LABEL_0",
15
  "1": "LABEL_1",
@@ -21,7 +22,7 @@
21
  "7": "LABEL_7"
22
  },
23
  "initializer_range": 0.02,
24
- "intermediate_size": 4096,
25
  "label2id": {
26
  "LABEL_0": 0,
27
  "LABEL_1": 1,
@@ -35,20 +36,15 @@
35
  "layer_norm_eps": 1e-12,
36
  "max_position_embeddings": 512,
37
  "model_type": "bert",
38
- "num_attention_heads": 16,
39
- "num_hidden_layers": 24,
40
  "output_past": true,
41
  "pad_token_id": 0,
42
- "pooler_fc_size": 768,
43
- "pooler_num_attention_heads": 12,
44
- "pooler_num_fc_layers": 3,
45
- "pooler_size_per_head": 128,
46
- "pooler_type": "first_token_transform",
47
  "position_embedding_type": "absolute",
48
  "problem_type": "single_label_classification",
49
  "torch_dtype": "float32",
50
  "transformers_version": "4.41.2",
51
  "type_vocab_size": 2,
52
  "use_cache": true,
53
- "vocab_size": 30522
54
  }
 
1
  {
2
+ "_name_or_path": "indolem/indobertweet-base-uncased",
 
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
  "classifier_dropout": null,
9
+ "eos_token_ids": 0,
10
+ "gradient_checkpointing": false,
11
  "hidden_act": "gelu",
12
  "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
  "id2label": {
15
  "0": "LABEL_0",
16
  "1": "LABEL_1",
 
22
  "7": "LABEL_7"
23
  },
24
  "initializer_range": 0.02,
25
+ "intermediate_size": 3072,
26
  "label2id": {
27
  "LABEL_0": 0,
28
  "LABEL_1": 1,
 
36
  "layer_norm_eps": 1e-12,
37
  "max_position_embeddings": 512,
38
  "model_type": "bert",
39
+ "num_attention_heads": 12,
40
+ "num_hidden_layers": 12,
41
  "output_past": true,
42
  "pad_token_id": 0,
 
 
 
 
 
43
  "position_embedding_type": "absolute",
44
  "problem_type": "single_label_classification",
45
  "torch_dtype": "float32",
46
  "transformers_version": "4.41.2",
47
  "type_vocab_size": 2,
48
  "use_cache": true,
49
+ "vocab_size": 31923
50
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff43b81d5456ed79197955151460048ae337893715dbeca6221f0d43c3e0f02b
3
- size 1340647360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:832bf6a484f5a7413177ae637dc3d04a93df506e6e8238d2d4316cc7474819ba
3
+ size 442280976
runs/Jun17_12-01-03_34a384f90984/events.out.tfevents.1718625668.34a384f90984.35.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c1f5d4d37c2a4440e6753b55ed61d2551d10cc281e54ef9ce9e5bca6d39b962
3
+ size 5270
runs/Jun17_12-02-01_34a384f90984/events.out.tfevents.1718625725.34a384f90984.35.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b6026c3b062d1e17ce7c66e565208c49d6a385cede1198358fd315a60eafd98
3
+ size 5270
runs/Jun17_12-02-21_34a384f90984/events.out.tfevents.1718625744.34a384f90984.35.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:544d6f03bf279bc284e79879877c452688fcfae4aa4b25328598e1c562d42cdc
3
+ size 153088
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -17,7 +17,7 @@
17
  "special": true
18
  },
19
  "2": {
20
- "content": "[CLS]",
21
  "lstrip": false,
22
  "normalized": false,
23
  "rstrip": false,
@@ -25,7 +25,7 @@
25
  "special": true
26
  },
27
  "3": {
28
- "content": "[SEP]",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
@@ -33,7 +33,7 @@
33
  "special": true
34
  },
35
  "4": {
36
- "content": "[MASK]",
37
  "lstrip": false,
38
  "normalized": false,
39
  "rstrip": false,
 
17
  "special": true
18
  },
19
  "2": {
20
+ "content": "[MASK]",
21
  "lstrip": false,
22
  "normalized": false,
23
  "rstrip": false,
 
25
  "special": true
26
  },
27
  "3": {
28
+ "content": "[CLS]",
29
  "lstrip": false,
30
  "normalized": false,
31
  "rstrip": false,
 
33
  "special": true
34
  },
35
  "4": {
36
+ "content": "[SEP]",
37
  "lstrip": false,
38
  "normalized": false,
39
  "rstrip": false,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:111c8481d172ed012edca5066dc154abef9801174d271b17d00964b9c42c4793
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b9a5b3f3669d8fc64f37abee5ab1b30d10f732e707c47f1c0d8e17701872ff
3
  size 5112
vocab.txt CHANGED
The diff for this file is too large to render. See raw diff