devkyle committed on
Commit
b773623
·
verified ·
1 Parent(s): a27d987

Training in progress, step 1000

Browse files
config.json CHANGED
@@ -14,28 +14,15 @@
14
  "decoder_attention_heads": 8,
15
  "decoder_ffn_dim": 2048,
16
  "decoder_layerdrop": 0.0,
17
- "decoder_layers": 6,
18
- "decoder_start_token_id": 50258,
19
  "dropout": 0.1,
20
  "encoder_attention_heads": 8,
21
  "encoder_ffn_dim": 2048,
22
  "encoder_layerdrop": 0.0,
23
- "encoder_layers": 6,
24
  "eos_token_id": 50257,
25
- "forced_decoder_ids": [
26
- [
27
- 1,
28
- 50259
29
- ],
30
- [
31
- 2,
32
- 50359
33
- ],
34
- [
35
- 3,
36
- 50363
37
- ]
38
- ],
39
  "init_std": 0.02,
40
  "is_encoder_decoder": true,
41
  "mask_feature_length": 10,
@@ -54,7 +41,7 @@
54
  "pad_token_id": 50257,
55
  "scale_embedding": false,
56
  "torch_dtype": "float32",
57
- "transformers_version": "4.46.0",
58
  "use_cache": true,
59
  "use_weighted_layer_sum": false,
60
  "vocab_size": 51865
 
14
  "decoder_attention_heads": 8,
15
  "decoder_ffn_dim": 2048,
16
  "decoder_layerdrop": 0.0,
17
+ "decoder_layers": 4,
18
+ "decoder_start_token_id": 50257,
19
  "dropout": 0.1,
20
  "encoder_attention_heads": 8,
21
  "encoder_ffn_dim": 2048,
22
  "encoder_layerdrop": 0.0,
23
+ "encoder_layers": 4,
24
  "eos_token_id": 50257,
25
+ "forced_decoder_ids": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  "init_std": 0.02,
27
  "is_encoder_decoder": true,
28
  "mask_feature_length": 10,
 
41
  "pad_token_id": 50257,
42
  "scale_embedding": false,
43
  "torch_dtype": "float32",
44
+ "transformers_version": "4.46.2",
45
  "use_cache": true,
46
  "use_weighted_layer_sum": false,
47
  "vocab_size": 51865
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:387d8a955be00aad2cc5451a7e24d8c8feaf96628330064688d0b20444659624
3
- size 290403936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b89f88333a53fa0c438c0c48a7b65a818c742d4b1a50a8445808e3e72c44ee8
3
+ size 231555856
runs/Nov06_05-42-23_1e0891b0c80a/events.out.tfevents.1730871769.1e0891b0c80a.293.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edf59c7ffb7a9a38e3a03b0e107001d37041e1b458b69e405188ba57fcaa58d8
3
+ size 7016
runs/Nov06_06-07-08_1e0891b0c80a/events.out.tfevents.1730873238.1e0891b0c80a.293.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52bd72a47ca1f23bbeeb452c695596dde7595d4ad11631b3d07ac487440b1b5c
3
+ size 7016
runs/Nov06_10-45-00_7484ea4f2c9e/events.out.tfevents.1730889919.7484ea4f2c9e.207.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96ba6e71c8a756e24db9d296dcb209328e84b062585405e998e1176a6f3ef6e9
3
+ size 7016
runs/Nov06_10-52-45_7484ea4f2c9e/events.out.tfevents.1730890369.7484ea4f2c9e.207.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b963c68dcbbcc8967f740b63717b46161f4e3b56f5a2873985f2086b0e799a1a
3
+ size 15087
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4165a9818c2b3182da9de8a0411641d9c46ed49a724c5d69798e8f33a18de61d
3
- size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b680413bd9cdd4437d954ceff5873c4f6d3a7162064f106960074c11833e671e
3
+ size 5560