ZongqianLi committed on
Commit
7d40fe7
·
1 Parent(s): 5f5aa0f

Upload 130 files

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff.
Files changed (50) hide show
  1. config.json +26 -0
  2. global_step33600/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  3. global_step33600/zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  4. global_step33600/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
  5. global_step33600/zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  6. global_step33600/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
  7. global_step33600/zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  8. global_step33600/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
  9. global_step33600/zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  10. global_step33600/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
  11. global_step33600/zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  12. global_step33600/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
  13. global_step33600/zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  14. global_step33600/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
  15. global_step33600/zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  16. global_step33600/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
  17. global_step33600/zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  18. global_step33600/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
  19. global_step33600/zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  20. global_step33600/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
  21. global_step33600/zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  22. global_step33600/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
  23. global_step33600/zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  24. global_step33600/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
  25. global_step33600/zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  26. global_step33600/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
  27. global_step33600/zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  28. global_step33600/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
  29. global_step33600/zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  30. global_step33600/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
  31. global_step33600/zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  32. global_step33600/zero_pp_rank_23_mp_rank_00_model_states.pt +3 -0
  33. global_step33600/zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  34. global_step33600/zero_pp_rank_24_mp_rank_00_model_states.pt +3 -0
  35. global_step33600/zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  36. global_step33600/zero_pp_rank_25_mp_rank_00_model_states.pt +3 -0
  37. global_step33600/zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
  38. global_step33600/zero_pp_rank_26_mp_rank_00_model_states.pt +3 -0
  39. global_step33600/zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  40. global_step33600/zero_pp_rank_27_mp_rank_00_model_states.pt +3 -0
  41. global_step33600/zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  42. global_step33600/zero_pp_rank_28_mp_rank_00_model_states.pt +3 -0
  43. global_step33600/zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  44. global_step33600/zero_pp_rank_29_mp_rank_00_model_states.pt +3 -0
  45. global_step33600/zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  46. global_step33600/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
  47. global_step33600/zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  48. global_step33600/zero_pp_rank_30_mp_rank_00_model_states.pt +3 -0
  49. global_step33600/zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  50. global_step33600/zero_pp_rank_31_mp_rank_00_model_states.pt +3 -0
config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "bert-base-cased",
3
+ "architectures": [
4
+ "BertForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-12,
15
+ "max_position_embeddings": 512,
16
+ "model_type": "bert",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 0,
20
+ "position_embedding_type": "absolute",
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.25.1",
23
+ "type_vocab_size": 2,
24
+ "use_cache": true,
25
+ "vocab_size": 28996
26
+ }
global_step33600/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6571337aebdb6aba973406c7d80ae1f2480cfe156f287f70478c8087f059df6a
3
+ size 90923
global_step33600/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99c683560d95f79bd2515952c04daf7d37b19626eb757b2970d3c491be4af6c0
3
+ size 32506595
global_step33600/zero_pp_rank_10_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f02f1bc0d515c83d1d3bd02f46c7af129655e5ffae33977aaec6e68144352ea2
3
+ size 90923
global_step33600/zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23173613cbea056dda038112bbdc678621e9b3ebf0733e345542249420693f7f
3
+ size 32506595
global_step33600/zero_pp_rank_11_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44fa07a46b1ea8f51b6831cb2e4871752ec3079b92c43269a39cc56b216987b9
3
+ size 90923
global_step33600/zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5972c466f05dad1bbc3d874182d92effac6ed4e49324f3f1584061ff48f7fcad
3
+ size 32506595
global_step33600/zero_pp_rank_12_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6571337aebdb6aba973406c7d80ae1f2480cfe156f287f70478c8087f059df6a
3
+ size 90923
global_step33600/zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:249563be085753d2421df21d551647fb13655cc7015223a0c84ac53ecab6e935
3
+ size 32506595
global_step33600/zero_pp_rank_13_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:038a26826e806123847f7a40d8ade8c7b114ff4f39ae112a3f6afaacdded59f9
3
+ size 90923
global_step33600/zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d92287935dbd5501e6007e7af651e721dd5c7902786b58a7f23cda643289b1fd
3
+ size 32506595
global_step33600/zero_pp_rank_14_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f02f1bc0d515c83d1d3bd02f46c7af129655e5ffae33977aaec6e68144352ea2
3
+ size 90923
global_step33600/zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c8a66911dbe7bde33ede5512bf24cb87bc092a1a2d3a80e37e10575b1d079fd
3
+ size 32506595
global_step33600/zero_pp_rank_15_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44fa07a46b1ea8f51b6831cb2e4871752ec3079b92c43269a39cc56b216987b9
3
+ size 90923
global_step33600/zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e439617b7a7e337e7fe680f8a7ef56d2a9fe8668f2882097995d3edda2442d1
3
+ size 32506595
global_step33600/zero_pp_rank_16_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6571337aebdb6aba973406c7d80ae1f2480cfe156f287f70478c8087f059df6a
3
+ size 90923
global_step33600/zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc436060be9eb164755a7a4a9515698de02b1003e0f21399878d803380b1cabb
3
+ size 32506595
global_step33600/zero_pp_rank_17_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:038a26826e806123847f7a40d8ade8c7b114ff4f39ae112a3f6afaacdded59f9
3
+ size 90923
global_step33600/zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:237b949572a2354c6fbe4fd39baeb419f389fc709ea833b2233a97b94b07bbf8
3
+ size 32506595
global_step33600/zero_pp_rank_18_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f02f1bc0d515c83d1d3bd02f46c7af129655e5ffae33977aaec6e68144352ea2
3
+ size 90923
global_step33600/zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a02494879c8f84e724e8bd0a698bf4411ceab53f81a4dcfcde2d578082686676
3
+ size 32506595
global_step33600/zero_pp_rank_19_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44fa07a46b1ea8f51b6831cb2e4871752ec3079b92c43269a39cc56b216987b9
3
+ size 90923
global_step33600/zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abbd45b5bb67f1ebc1d47f02cd463bfaaccd60b510e14453774fc0edf24e560e
3
+ size 32506595
global_step33600/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:038a26826e806123847f7a40d8ade8c7b114ff4f39ae112a3f6afaacdded59f9
3
+ size 90923
global_step33600/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8939388ce074e5382210ac243f68397f5055742918b94da2a587e711de523f7d
3
+ size 32506595
global_step33600/zero_pp_rank_20_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6571337aebdb6aba973406c7d80ae1f2480cfe156f287f70478c8087f059df6a
3
+ size 90923
global_step33600/zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8fa7884f9711dc9b93bc1d5d294ef9fb4aec3586c1edb481807b2ecd1f92b0a
3
+ size 32506595
global_step33600/zero_pp_rank_21_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:038a26826e806123847f7a40d8ade8c7b114ff4f39ae112a3f6afaacdded59f9
3
+ size 90923
global_step33600/zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b79961522f504dc9a19c58e63ec42f004b06165a66a9c7149e93fd160e81e10
3
+ size 32506595
global_step33600/zero_pp_rank_22_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f02f1bc0d515c83d1d3bd02f46c7af129655e5ffae33977aaec6e68144352ea2
3
+ size 90923
global_step33600/zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4fe94086404e58cf687eb4c6a12f6d6b5a5fdc808344ab4e6cd8164edc273f8
3
+ size 32506595
global_step33600/zero_pp_rank_23_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44fa07a46b1ea8f51b6831cb2e4871752ec3079b92c43269a39cc56b216987b9
3
+ size 90923
global_step33600/zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48450a8b10092a71d5b09907e1384b230170d0e4e88b86b40145cca28030c7b8
3
+ size 32506595
global_step33600/zero_pp_rank_24_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6571337aebdb6aba973406c7d80ae1f2480cfe156f287f70478c8087f059df6a
3
+ size 90923
global_step33600/zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:893d681adcf8ee7ee80060c4c95c7c49d8ca61a4a173de7034f9186ec0741c90
3
+ size 32506595
global_step33600/zero_pp_rank_25_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:038a26826e806123847f7a40d8ade8c7b114ff4f39ae112a3f6afaacdded59f9
3
+ size 90923
global_step33600/zero_pp_rank_25_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b3bc5119f119b9fc63fc3b7ac75f1e3aa0cc92e176ecd6f80d04a52f9827e83
3
+ size 32506595
global_step33600/zero_pp_rank_26_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f02f1bc0d515c83d1d3bd02f46c7af129655e5ffae33977aaec6e68144352ea2
3
+ size 90923
global_step33600/zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d7d3a26990507663123d7d970a02382e117b6ea23f10be32e2b96788f13513d
3
+ size 32506595
global_step33600/zero_pp_rank_27_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44fa07a46b1ea8f51b6831cb2e4871752ec3079b92c43269a39cc56b216987b9
3
+ size 90923
global_step33600/zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb0d9f47877b324d8298a42f540a2c7d9c8582754a7bc444166654375d9f17e6
3
+ size 32506595
global_step33600/zero_pp_rank_28_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6571337aebdb6aba973406c7d80ae1f2480cfe156f287f70478c8087f059df6a
3
+ size 90923
global_step33600/zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a57886739dd9b26e8737e37f080c71a58e827ef6b59a2137fc5c5c8d8dcffaa3
3
+ size 32506595
global_step33600/zero_pp_rank_29_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:038a26826e806123847f7a40d8ade8c7b114ff4f39ae112a3f6afaacdded59f9
3
+ size 90923
global_step33600/zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b866e44c3aa88740ee619bc41880dcfad3c6c3a34a6a4c4f5b509d7419a25e89
3
+ size 32506595
global_step33600/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f02f1bc0d515c83d1d3bd02f46c7af129655e5ffae33977aaec6e68144352ea2
3
+ size 90923
global_step33600/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:469da73c05f12d5142d587346b58ce7ff7d05565c34032047f8ff3f4ce68c161
3
+ size 32506595
global_step33600/zero_pp_rank_30_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f02f1bc0d515c83d1d3bd02f46c7af129655e5ffae33977aaec6e68144352ea2
3
+ size 90923
global_step33600/zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:834358210e0fe86239d8110c23188648c47d2cd823f708ed12ad1d4467d01958
3
+ size 32506595
global_step33600/zero_pp_rank_31_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44fa07a46b1ea8f51b6831cb2e4871752ec3079b92c43269a39cc56b216987b9
3
+ size 90923