ZongqianLi committed on
Commit
d80431a
·
1 Parent(s): d15df52

Upload 130 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. config.json +32 -0
  2. global_step999/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  3. global_step999/zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  4. global_step999/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
  5. global_step999/zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  6. global_step999/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
  7. global_step999/zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  8. global_step999/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
  9. global_step999/zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  10. global_step999/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
  11. global_step999/zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  12. global_step999/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
  13. global_step999/zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  14. global_step999/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
  15. global_step999/zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  16. global_step999/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
  17. global_step999/zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  18. global_step999/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
  19. global_step999/zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  20. global_step999/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
  21. global_step999/zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  22. global_step999/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
  23. global_step999/zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  24. global_step999/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
  25. global_step999/zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  26. global_step999/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
  27. global_step999/zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  28. global_step999/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
  29. global_step999/zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  30. global_step999/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
  31. global_step999/zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  32. global_step999/zero_pp_rank_23_mp_rank_00_model_states.pt +3 -0
  33. global_step999/zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  34. global_step999/zero_pp_rank_24_mp_rank_00_model_states.pt +3 -0
  35. global_step999/zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  36. global_step999/zero_pp_rank_25_mp_rank_00_model_states.pt +3 -0
  37. global_step999/zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
  38. global_step999/zero_pp_rank_26_mp_rank_00_model_states.pt +3 -0
  39. global_step999/zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  40. global_step999/zero_pp_rank_27_mp_rank_00_model_states.pt +3 -0
  41. global_step999/zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  42. global_step999/zero_pp_rank_28_mp_rank_00_model_states.pt +3 -0
  43. global_step999/zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  44. global_step999/zero_pp_rank_29_mp_rank_00_model_states.pt +3 -0
  45. global_step999/zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  46. global_step999/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
  47. global_step999/zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  48. global_step999/zero_pp_rank_30_mp_rank_00_model_states.pt +3 -0
  49. global_step999/zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  50. global_step999/zero_pp_rank_31_mp_rank_00_model_states.pt +3 -0
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "bert-large-cased",
3
+ "architectures": [
4
+ "BertForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "directionality": "bidi",
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 1024,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 4096,
15
+ "layer_norm_eps": 1e-12,
16
+ "max_position_embeddings": 512,
17
+ "model_type": "bert",
18
+ "num_attention_heads": 16,
19
+ "num_hidden_layers": 24,
20
+ "pad_token_id": 0,
21
+ "pooler_fc_size": 768,
22
+ "pooler_num_attention_heads": 12,
23
+ "pooler_num_fc_layers": 3,
24
+ "pooler_size_per_head": 128,
25
+ "pooler_type": "first_token_transform",
26
+ "position_embedding_type": "absolute",
27
+ "torch_dtype": "float32",
28
+ "transformers_version": "4.25.1",
29
+ "type_vocab_size": 2,
30
+ "use_cache": true,
31
+ "vocab_size": 28996
32
+ }
global_step999/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4b991250803ab8af2b4080de297af8dadba48a23f8c59b202e68059faac522e
3
+ size 172267
global_step999/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1e6f2a4d0fc65ffb1623c2a8cac32a7370644ff30c3b15cdee62d6ead666130
3
+ size 100088099
global_step999/zero_pp_rank_10_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c2e4d6b9d5958118bc97eb35c8ddc50cfcb7fde29b0fc6a68fefa1e61983c01
3
+ size 172267
global_step999/zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e31cbd95a4ab2de38ea9ece66bd0cb9ed261d025ebffef1e02e47816f7135734
3
+ size 100088099
global_step999/zero_pp_rank_11_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2c20f8ffd00ebe3c83f6268afe3aa2ef9ac95605a79fca3df113da87fa18959
3
+ size 172267
global_step999/zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae95546f97fee05f1698d2df9d3f8aa4aaadf4420a6e774d92defd0fbd093bb2
3
+ size 100088099
global_step999/zero_pp_rank_12_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4b991250803ab8af2b4080de297af8dadba48a23f8c59b202e68059faac522e
3
+ size 172267
global_step999/zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc6ca75917becba110abef1a4b17c58e00ec9b6c5cea258a2d61567147b07e12
3
+ size 100088099
global_step999/zero_pp_rank_13_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef61100eb852b5a744a3526da9565787929ff0cf3bbcc87189ad9b1a770cc9e
3
+ size 172267
global_step999/zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b0fb7a564db79c4cdec25ba034876d97dcd4c2f188f6965d11f90a7856df468
3
+ size 100088099
global_step999/zero_pp_rank_14_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c2e4d6b9d5958118bc97eb35c8ddc50cfcb7fde29b0fc6a68fefa1e61983c01
3
+ size 172267
global_step999/zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e47168f5842320bea522801d8e289c57215360400982c8967d740950d3abb9a
3
+ size 100088099
global_step999/zero_pp_rank_15_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2c20f8ffd00ebe3c83f6268afe3aa2ef9ac95605a79fca3df113da87fa18959
3
+ size 172267
global_step999/zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04404b6eacc76f1423cf287786a7db0388af2d1bdceba9ce5f9d7c78ed48bfa4
3
+ size 100088099
global_step999/zero_pp_rank_16_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4b991250803ab8af2b4080de297af8dadba48a23f8c59b202e68059faac522e
3
+ size 172267
global_step999/zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be8fce9214cd7692ccc3a64874b6f5fabf81eac69bb319ecbaf88886fb162206
3
+ size 100088099
global_step999/zero_pp_rank_17_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef61100eb852b5a744a3526da9565787929ff0cf3bbcc87189ad9b1a770cc9e
3
+ size 172267
global_step999/zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69f795e9d48733f11daa008263b018cde840c8db845e48fcfbab48c4253b8d46
3
+ size 100088099
global_step999/zero_pp_rank_18_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c2e4d6b9d5958118bc97eb35c8ddc50cfcb7fde29b0fc6a68fefa1e61983c01
3
+ size 172267
global_step999/zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e529b64c22a6aa5de7e4f419c512bbec927a5381936466000186ce2b29aef8f
3
+ size 100088099
global_step999/zero_pp_rank_19_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2c20f8ffd00ebe3c83f6268afe3aa2ef9ac95605a79fca3df113da87fa18959
3
+ size 172267
global_step999/zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6f0db197406d890ff414175393b304751c0e8d4d401908d511b6b3a032d0811
3
+ size 100088099
global_step999/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef61100eb852b5a744a3526da9565787929ff0cf3bbcc87189ad9b1a770cc9e
3
+ size 172267
global_step999/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:827ab62b83b5b836b92033b71bbf0383d9e1f3b00ae4d09cb999d0fe9deffd4c
3
+ size 100088099
global_step999/zero_pp_rank_20_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4b991250803ab8af2b4080de297af8dadba48a23f8c59b202e68059faac522e
3
+ size 172267
global_step999/zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d79348a2a415f8f09ab7cffef69688a9fe8779cb805ddbe70949a2f8594132ee
3
+ size 100088099
global_step999/zero_pp_rank_21_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef61100eb852b5a744a3526da9565787929ff0cf3bbcc87189ad9b1a770cc9e
3
+ size 172267
global_step999/zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17b4cd251e6ea0478d45e0e4b3cbfcf2187314ae7c9765ca8368527045732d5b
3
+ size 100088099
global_step999/zero_pp_rank_22_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c2e4d6b9d5958118bc97eb35c8ddc50cfcb7fde29b0fc6a68fefa1e61983c01
3
+ size 172267
global_step999/zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c223bf9cb23952fe33af2685f8b018f07b4187eb20957b9a77d4ab20cf83744
3
+ size 100088099
global_step999/zero_pp_rank_23_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2c20f8ffd00ebe3c83f6268afe3aa2ef9ac95605a79fca3df113da87fa18959
3
+ size 172267
global_step999/zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9e9dd173534145f4017c925d9696ae9c016facf3359f8aab9ac084e46d29f6d
3
+ size 100088099
global_step999/zero_pp_rank_24_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4b991250803ab8af2b4080de297af8dadba48a23f8c59b202e68059faac522e
3
+ size 172267
global_step999/zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82fdaf3c7ff06fa9af1f2fba22fa8cf945a0d91e8d7c79ee8f943d427c0c456e
3
+ size 100088099
global_step999/zero_pp_rank_25_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef61100eb852b5a744a3526da9565787929ff0cf3bbcc87189ad9b1a770cc9e
3
+ size 172267
global_step999/zero_pp_rank_25_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7b0b7a914aab91053a66b12ada056bd014344a048e7f5602083acba48deec28
3
+ size 100088099
global_step999/zero_pp_rank_26_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c2e4d6b9d5958118bc97eb35c8ddc50cfcb7fde29b0fc6a68fefa1e61983c01
3
+ size 172267
global_step999/zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0964a771dfd5f93b7ae99a90cb2f7ca11fb5cf25f0e13a4ae4d29f3c6b088de0
3
+ size 100088099
global_step999/zero_pp_rank_27_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2c20f8ffd00ebe3c83f6268afe3aa2ef9ac95605a79fca3df113da87fa18959
3
+ size 172267
global_step999/zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7955bc3cf606c6042e4dc2ed9820f5ff923af964fced0a29cc6182d455993c53
3
+ size 100088099
global_step999/zero_pp_rank_28_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4b991250803ab8af2b4080de297af8dadba48a23f8c59b202e68059faac522e
3
+ size 172267
global_step999/zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf154d86b7bd542865f5934d300e7d94e2a90007a87f74bf5ab67d22f7622981
3
+ size 100088099
global_step999/zero_pp_rank_29_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef61100eb852b5a744a3526da9565787929ff0cf3bbcc87189ad9b1a770cc9e
3
+ size 172267
global_step999/zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4183ba7f8728277ed99944c6d9167f5d30671864c654c83bd168327768f609f
3
+ size 100088099
global_step999/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c2e4d6b9d5958118bc97eb35c8ddc50cfcb7fde29b0fc6a68fefa1e61983c01
3
+ size 172267
global_step999/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b46e02e69462d0a5e604968975fb1579ccc1f5a82406998a8d8c34ef40b06fc3
3
+ size 100088099
global_step999/zero_pp_rank_30_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c2e4d6b9d5958118bc97eb35c8ddc50cfcb7fde29b0fc6a68fefa1e61983c01
3
+ size 172267
global_step999/zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e389e0f88beeab3aaef689a1a693d4474c82cb7dfe1e9a429d89642939a9948f
3
+ size 100088099
global_step999/zero_pp_rank_31_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2c20f8ffd00ebe3c83f6268afe3aa2ef9ac95605a79fca3df113da87fa18959
3
+ size 172267