ZongqianLi committed on
Commit
d5c8b75
1 Parent(s): ca62e53

Upload 130 files

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +32 -0
  2. global_step1100/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  3. global_step1100/zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  4. global_step1100/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
  5. global_step1100/zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  6. global_step1100/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
  7. global_step1100/zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  8. global_step1100/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
  9. global_step1100/zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  10. global_step1100/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
  11. global_step1100/zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  12. global_step1100/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
  13. global_step1100/zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  14. global_step1100/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
  15. global_step1100/zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  16. global_step1100/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
  17. global_step1100/zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  18. global_step1100/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
  19. global_step1100/zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  20. global_step1100/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
  21. global_step1100/zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  22. global_step1100/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
  23. global_step1100/zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  24. global_step1100/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
  25. global_step1100/zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  26. global_step1100/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
  27. global_step1100/zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  28. global_step1100/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
  29. global_step1100/zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  30. global_step1100/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
  31. global_step1100/zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  32. global_step1100/zero_pp_rank_23_mp_rank_00_model_states.pt +3 -0
  33. global_step1100/zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  34. global_step1100/zero_pp_rank_24_mp_rank_00_model_states.pt +3 -0
  35. global_step1100/zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  36. global_step1100/zero_pp_rank_25_mp_rank_00_model_states.pt +3 -0
  37. global_step1100/zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
  38. global_step1100/zero_pp_rank_26_mp_rank_00_model_states.pt +3 -0
  39. global_step1100/zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  40. global_step1100/zero_pp_rank_27_mp_rank_00_model_states.pt +3 -0
  41. global_step1100/zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  42. global_step1100/zero_pp_rank_28_mp_rank_00_model_states.pt +3 -0
  43. global_step1100/zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  44. global_step1100/zero_pp_rank_29_mp_rank_00_model_states.pt +3 -0
  45. global_step1100/zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  46. global_step1100/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
  47. global_step1100/zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  48. global_step1100/zero_pp_rank_30_mp_rank_00_model_states.pt +3 -0
  49. global_step1100/zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  50. global_step1100/zero_pp_rank_31_mp_rank_00_model_states.pt +3 -0
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "bert-large-cased",
3
+ "architectures": [
4
+ "BertForQuestionAnswering"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "directionality": "bidi",
9
+ "gradient_checkpointing": false,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 1024,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 4096,
15
+ "layer_norm_eps": 1e-12,
16
+ "max_position_embeddings": 512,
17
+ "model_type": "bert",
18
+ "num_attention_heads": 16,
19
+ "num_hidden_layers": 24,
20
+ "pad_token_id": 0,
21
+ "pooler_fc_size": 768,
22
+ "pooler_num_attention_heads": 12,
23
+ "pooler_num_fc_layers": 3,
24
+ "pooler_size_per_head": 128,
25
+ "pooler_type": "first_token_transform",
26
+ "position_embedding_type": "absolute",
27
+ "torch_dtype": "float32",
28
+ "transformers_version": "4.25.1",
29
+ "type_vocab_size": 2,
30
+ "use_cache": true,
31
+ "vocab_size": 28996
32
+ }
global_step1100/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a3bdf866fbb1dd51923d9b658f7165ebdf88b34f2483f04978d7bf225d2e329
3
+ size 170673
global_step1100/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:568a86f7888adaf0abf29dcccac236f6caa26d457fac5c7d6ea15d3a710d6618
3
+ size 99764579
global_step1100/zero_pp_rank_10_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0db399c8cc9e77874c895ecef8ace2da4ad90eddec98b1e281c79e057abe2c6
3
+ size 170673
global_step1100/zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2d91d76016d0a9acc950d3e6a879f6856562605eac17601e780ca8ebfb5bf02
3
+ size 99764579
global_step1100/zero_pp_rank_11_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:952f9ab15c7c4a3515531b1412f02c9a14ef7ffb8f7568883a2a170282e5b4eb
3
+ size 170673
global_step1100/zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18a1cd850e9127a199921750c5005e0ae149450e50a11bd39585a23cb7883658
3
+ size 99764579
global_step1100/zero_pp_rank_12_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a3bdf866fbb1dd51923d9b658f7165ebdf88b34f2483f04978d7bf225d2e329
3
+ size 170673
global_step1100/zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce3ce71e1e0d57709957a76707e01f851360e703a145033f3dcd40f995798175
3
+ size 99764579
global_step1100/zero_pp_rank_13_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3006fd795f8ee5a367bc41c06d1fca00de3503069dfbdb44f32543f5a49a894c
3
+ size 170673
global_step1100/zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b5a2c3ab18b32d7ad9ab81cba0983e10f8534eb2a8c49cd54d26dc7b5e14eab
3
+ size 99764579
global_step1100/zero_pp_rank_14_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0db399c8cc9e77874c895ecef8ace2da4ad90eddec98b1e281c79e057abe2c6
3
+ size 170673
global_step1100/zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69f82e6085f8d0d58368e2771918d29f4491337b7a3e089b3b1f683bec255dfc
3
+ size 99764579
global_step1100/zero_pp_rank_15_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:952f9ab15c7c4a3515531b1412f02c9a14ef7ffb8f7568883a2a170282e5b4eb
3
+ size 170673
global_step1100/zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54f3740266bcaaa39ed93af5d9f40333db0ce0208354561b963d82f76b5a2a67
3
+ size 99764579
global_step1100/zero_pp_rank_16_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a3bdf866fbb1dd51923d9b658f7165ebdf88b34f2483f04978d7bf225d2e329
3
+ size 170673
global_step1100/zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03324a9ba9c86591c121b25f754075185c6999773141d0b35ca33778748546b3
3
+ size 99764579
global_step1100/zero_pp_rank_17_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3006fd795f8ee5a367bc41c06d1fca00de3503069dfbdb44f32543f5a49a894c
3
+ size 170673
global_step1100/zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7acf1fc24e7d9c11b18f5bcfe75a48e62eecfbf1c2cdca15a068ad53c9c35c4
3
+ size 99764579
global_step1100/zero_pp_rank_18_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0db399c8cc9e77874c895ecef8ace2da4ad90eddec98b1e281c79e057abe2c6
3
+ size 170673
global_step1100/zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:086d75243f35dc9299cbb76687e473377da2186fb02286e4e6c53c27b9d431a8
3
+ size 99764579
global_step1100/zero_pp_rank_19_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:952f9ab15c7c4a3515531b1412f02c9a14ef7ffb8f7568883a2a170282e5b4eb
3
+ size 170673
global_step1100/zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:633bd6d20b35bfa77ca33d1f71268e9c49510119dba1e9e0cea7d90bfa7d84cc
3
+ size 99764579
global_step1100/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3006fd795f8ee5a367bc41c06d1fca00de3503069dfbdb44f32543f5a49a894c
3
+ size 170673
global_step1100/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee7ab894fab06bd772b79a0cbcec170f3dfb05958b159a8112cb4b8404e8dbdd
3
+ size 99764579
global_step1100/zero_pp_rank_20_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a3bdf866fbb1dd51923d9b658f7165ebdf88b34f2483f04978d7bf225d2e329
3
+ size 170673
global_step1100/zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95f4daba2c08f5845d15d1565e0905b0268bebb355f6adc71b3b7354448bc22f
3
+ size 99764579
global_step1100/zero_pp_rank_21_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3006fd795f8ee5a367bc41c06d1fca00de3503069dfbdb44f32543f5a49a894c
3
+ size 170673
global_step1100/zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:651cc71531aba63e02fb86a721f096f93402f49ac77e70f35b81fd6004c687da
3
+ size 99764579
global_step1100/zero_pp_rank_22_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0db399c8cc9e77874c895ecef8ace2da4ad90eddec98b1e281c79e057abe2c6
3
+ size 170673
global_step1100/zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3034b912833b9a4876618daf5eb231133b9a9e55f727a4f96deea01285a5fb9
3
+ size 99764579
global_step1100/zero_pp_rank_23_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:952f9ab15c7c4a3515531b1412f02c9a14ef7ffb8f7568883a2a170282e5b4eb
3
+ size 170673
global_step1100/zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf45a6a02d1e5845808c6b399363b230f19d78dc910db0f2b24d5cc94c7c2a47
3
+ size 99764579
global_step1100/zero_pp_rank_24_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a3bdf866fbb1dd51923d9b658f7165ebdf88b34f2483f04978d7bf225d2e329
3
+ size 170673
global_step1100/zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ae593c29034f20b9fa29ff779c2be63e7aa336a7947f0200e03535839480e0c
3
+ size 99764579
global_step1100/zero_pp_rank_25_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3006fd795f8ee5a367bc41c06d1fca00de3503069dfbdb44f32543f5a49a894c
3
+ size 170673
global_step1100/zero_pp_rank_25_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b92b84108131f586636fa1e32e6464510b5db6de7b21d5d3eea5a0eaddb7adf2
3
+ size 99764579
global_step1100/zero_pp_rank_26_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0db399c8cc9e77874c895ecef8ace2da4ad90eddec98b1e281c79e057abe2c6
3
+ size 170673
global_step1100/zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:337073d6a8cad34ad2be55daca96c29757e63ab008c5f782b718a266ce3ef670
3
+ size 99764579
global_step1100/zero_pp_rank_27_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:952f9ab15c7c4a3515531b1412f02c9a14ef7ffb8f7568883a2a170282e5b4eb
3
+ size 170673
global_step1100/zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85c9e75dc184150431a5bd5b03320091fb83b63167e2efbd2b173e3e62757da5
3
+ size 99764579
global_step1100/zero_pp_rank_28_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a3bdf866fbb1dd51923d9b658f7165ebdf88b34f2483f04978d7bf225d2e329
3
+ size 170673
global_step1100/zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c78be946903e6b0fed3eb7cb262a77545e14332678830835b1698352dd38057e
3
+ size 99764579
global_step1100/zero_pp_rank_29_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3006fd795f8ee5a367bc41c06d1fca00de3503069dfbdb44f32543f5a49a894c
3
+ size 170673
global_step1100/zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c173da8b62c12b52593442042fbaa74e7bc88108b143f50bd8906d637aca59bf
3
+ size 99764579
global_step1100/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0db399c8cc9e77874c895ecef8ace2da4ad90eddec98b1e281c79e057abe2c6
3
+ size 170673
global_step1100/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a42f05f44692bc629560b3e9355f5cd4077ebf05d12393d4c6a8a3ed14fb7d36
3
+ size 99764579
global_step1100/zero_pp_rank_30_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0db399c8cc9e77874c895ecef8ace2da4ad90eddec98b1e281c79e057abe2c6
3
+ size 170673
global_step1100/zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b368cfb66876252a26710010d75467936a097cefb61b1a29f04de69ae9292f7
3
+ size 99764579
global_step1100/zero_pp_rank_31_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:952f9ab15c7c4a3515531b1412f02c9a14ef7ffb8f7568883a2a170282e5b4eb
3
+ size 170673