Upload folder using huggingface_hub
Browse files- .gitignore +3 -0
- config.json +63 -0
- generation_config.json +7 -0
- onnx/decoder_model.onnx +3 -0
- onnx/decoder_model_bnb4.onnx +3 -0
- onnx/decoder_model_fp16.onnx +3 -0
- onnx/decoder_model_int8.onnx +3 -0
- onnx/decoder_model_merged.onnx +3 -0
- onnx/decoder_model_merged_bnb4.onnx +3 -0
- onnx/decoder_model_merged_fp16.onnx +3 -0
- onnx/decoder_model_merged_int8.onnx +3 -0
- onnx/decoder_model_merged_q4.onnx +3 -0
- onnx/decoder_model_merged_q4f16.onnx +3 -0
- onnx/decoder_model_merged_quantized.onnx +3 -0
- onnx/decoder_model_merged_uint8.onnx +3 -0
- onnx/decoder_model_q4.onnx +3 -0
- onnx/decoder_model_q4f16.onnx +3 -0
- onnx/decoder_model_quantized.onnx +3 -0
- onnx/decoder_model_uint8.onnx +3 -0
- onnx/decoder_with_past_model.onnx +3 -0
- onnx/decoder_with_past_model_bnb4.onnx +3 -0
- onnx/decoder_with_past_model_fp16.onnx +3 -0
- onnx/decoder_with_past_model_int8.onnx +3 -0
- onnx/decoder_with_past_model_q4.onnx +3 -0
- onnx/decoder_with_past_model_q4f16.onnx +3 -0
- onnx/decoder_with_past_model_quantized.onnx +3 -0
- onnx/decoder_with_past_model_uint8.onnx +3 -0
- onnx/encoder_model.onnx +3 -0
- onnx/encoder_model_bnb4.onnx +3 -0
- onnx/encoder_model_fp16.onnx +3 -0
- onnx/encoder_model_int8.onnx +3 -0
- onnx/encoder_model_q4.onnx +3 -0
- onnx/encoder_model_q4f16.onnx +3 -0
- onnx/encoder_model_quantized.onnx +3 -0
- onnx/encoder_model_uint8.onnx +3 -0
- quantize_config.json +18 -0
.gitignore
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
node_modules
|
2 |
+
.DS_Store
|
3 |
+
.cache
|
config.json
ADDED
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_attn_implementation_autoset": true,
|
3 |
+
"_name_or_path": "allenai/unifiedqa-v2-t5-large-1363200",
|
4 |
+
"architectures": [
|
5 |
+
"T5ForConditionalGeneration"
|
6 |
+
],
|
7 |
+
"classifier_dropout": 0.0,
|
8 |
+
"d_ff": 4096,
|
9 |
+
"d_kv": 64,
|
10 |
+
"d_model": 1024,
|
11 |
+
"decoder_start_token_id": 0,
|
12 |
+
"dense_act_fn": "relu",
|
13 |
+
"dropout_rate": 0.1,
|
14 |
+
"eos_token_id": 1,
|
15 |
+
"feed_forward_proj": "relu",
|
16 |
+
"gradient_checkpointing": false,
|
17 |
+
"initializer_factor": 1.0,
|
18 |
+
"is_encoder_decoder": true,
|
19 |
+
"is_gated_act": false,
|
20 |
+
"layer_norm_epsilon": 1e-06,
|
21 |
+
"model_type": "t5",
|
22 |
+
"n_positions": 512,
|
23 |
+
"num_decoder_layers": 24,
|
24 |
+
"num_heads": 16,
|
25 |
+
"num_layers": 24,
|
26 |
+
"output_past": true,
|
27 |
+
"pad_token_id": 0,
|
28 |
+
"relative_attention_max_distance": 128,
|
29 |
+
"relative_attention_num_buckets": 32,
|
30 |
+
"task_specific_params": {
|
31 |
+
"summarization": {
|
32 |
+
"early_stopping": true,
|
33 |
+
"length_penalty": 2.0,
|
34 |
+
"max_length": 200,
|
35 |
+
"min_length": 30,
|
36 |
+
"no_repeat_ngram_size": 3,
|
37 |
+
"num_beams": 4,
|
38 |
+
"prefix": "summarize: "
|
39 |
+
},
|
40 |
+
"translation_en_to_de": {
|
41 |
+
"early_stopping": true,
|
42 |
+
"max_length": 300,
|
43 |
+
"num_beams": 4,
|
44 |
+
"prefix": "translate English to German: "
|
45 |
+
},
|
46 |
+
"translation_en_to_fr": {
|
47 |
+
"early_stopping": true,
|
48 |
+
"max_length": 300,
|
49 |
+
"num_beams": 4,
|
50 |
+
"prefix": "translate English to French: "
|
51 |
+
},
|
52 |
+
"translation_en_to_ro": {
|
53 |
+
"early_stopping": true,
|
54 |
+
"max_length": 300,
|
55 |
+
"num_beams": 4,
|
56 |
+
"prefix": "translate English to Romanian: "
|
57 |
+
}
|
58 |
+
},
|
59 |
+
"torch_dtype": "float32",
|
60 |
+
"transformers_version": "4.49.0",
|
61 |
+
"use_cache": true,
|
62 |
+
"vocab_size": 32128
|
63 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"decoder_start_token_id": 0,
|
4 |
+
"eos_token_id": 1,
|
5 |
+
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.49.0"
|
7 |
+
}
|
onnx/decoder_model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2eacf36c151a0e80a5e56b29a12b13d7d141442903ec2c440e05e5ba397e41c2
|
3 |
+
size 1743103924
|
onnx/decoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9aa43fde0b81236f5c19188832203c5bdcc2f12f93353f97fb11d3be8866b200
|
3 |
+
size 359021207
|
onnx/decoder_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:199acf8fe1137d1a7f9f6ec5c0a3e88dd981d8dcd267351923d68c1dec95b9e8
|
3 |
+
size 871854042
|
onnx/decoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18e01e1399486daca9a148552d65db1412e95fac90ffe52cc30cd78546ed2589
|
3 |
+
size 569935579
|
onnx/decoder_model_merged.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9767947c33e56c3dbd086b185445d1941caf8a22afd5212ffacda88b91350bf2
|
3 |
+
size 1743785138
|
onnx/decoder_model_merged_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f87a8b0cc6e48d5b5f003a3ef4fc979550cbcdefd43de613dd7399aba3dd96f
|
3 |
+
size 359730549
|
onnx/decoder_model_merged_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4195cb679d9f618bd9203b904e6a011e44cfca24c8fe2a24a69a82e5f88d962
|
3 |
+
size 872566908
|
onnx/decoder_model_merged_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:484ca47766b2241f1807858cd0d6bfd0bb19a13963d55e03bf9610598f4a3566
|
3 |
+
size 570861604
|
onnx/decoder_model_merged_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da10cc93d24f1ca402f2b32d43d7123aed6dd62d61423b899a9a6c001ba030af
|
3 |
+
size 384892701
|
onnx/decoder_model_merged_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3fc819145cd9839b886e68e49a2f73ad200d591a43ca1eb3e180a75ad691e76
|
3 |
+
size 293815015
|
onnx/decoder_model_merged_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:484ca47766b2241f1807858cd0d6bfd0bb19a13963d55e03bf9610598f4a3566
|
3 |
+
size 570861604
|
onnx/decoder_model_merged_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:607702c5c1d4fd0e2ee1cdab2edfe85afa6b8ac20b4b5182dc832e3b3bba1d66
|
3 |
+
size 570861604
|
onnx/decoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aae945492b9bba23ef0c1d863df7946bff8fbad584a3dff9f39a59545c6d74d0
|
3 |
+
size 384185087
|
onnx/decoder_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:327f23c1e68b5eb084e90b62bcee01469318695fb647cbe50a92556ca8169d0e
|
3 |
+
size 293075749
|
onnx/decoder_model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18e01e1399486daca9a148552d65db1412e95fac90ffe52cc30cd78546ed2589
|
3 |
+
size 569935579
|
onnx/decoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:191f9704159093a716b39479931466b12625630a59231a5607e63e1783669513
|
3 |
+
size 569935579
|
onnx/decoder_with_past_model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bbb87cf546c27752e74c802c04a5253a5508aba37f3f2ec47ae005a6cbd7ead
|
3 |
+
size 1541646646
|
onnx/decoder_with_past_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fc098bef6dca1af77318e403751b64507d1cf3b603535c2805acb73aee07386
|
3 |
+
size 330571481
|
onnx/decoder_with_past_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0c78f732bd579ccff6fcec98c7e28bc87de1575425f21998679b9980d6ef84f
|
3 |
+
size 771079836
|
onnx/decoder_with_past_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6643652ea9240ead5db02803c60ca2c9d104991af18a8ae889249f396b323d78
|
3 |
+
size 519180586
|
onnx/decoder_with_past_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7a537a2c85646e84ca7d4f85c666a2e40aa7e2f8b5c35b4d5fc870f0df0ccc2
|
3 |
+
size 352590017
|
onnx/decoder_with_past_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d886a4c3a9647217b8506b93581a291091e99a782dd95d9fab4c146fd8123569
|
3 |
+
size 264646182
|
onnx/decoder_with_past_model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6643652ea9240ead5db02803c60ca2c9d104991af18a8ae889249f396b323d78
|
3 |
+
size 519180586
|
onnx/decoder_with_past_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bb934a16f22b01e5e889a563bdb236ac526b0911156225e72d9d2748a26f050
|
3 |
+
size 519180586
|
onnx/encoder_model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d035485c1b20d730ac894b55da61fefdf834ab86c3f4e6f8f59753f511ff0c9
|
3 |
+
size 1340052960
|
onnx/encoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8440235cd98a04e0b0ff7f5c9dd7debc7e179a1757cf10b7bb92ab96b7292e44
|
3 |
+
size 301985347
|
onnx/encoder_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5292fa2c69d3e7453809bd34ec396f78059988a74c56d156ee2db5138a6c9333
|
3 |
+
size 670174435
|
onnx/encoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b8b952c6fd418a9c59778cfc9ce31c3aee8c6707edc3ae70db77d63486a61ce
|
3 |
+
size 336656192
|
onnx/encoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb98fdc7d0e0a39f3c35a952ad718554da185d3b6286ede5d644cbf307c2b390
|
3 |
+
size 320858539
|
onnx/encoder_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc89605ea50f72c21a3a8b546aa60c8b1527849368a9075e6e04a9f4b5d7f2bf
|
3 |
+
size 236085421
|
onnx/encoder_model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b8b952c6fd418a9c59778cfc9ce31c3aee8c6707edc3ae70db77d63486a61ce
|
3 |
+
size 336656192
|
onnx/encoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a880fdd6d7847448eb6f87b8def9e02da3024c090aeaaadd55ce86c2543be76
|
3 |
+
size 336656192
|
quantize_config.json
ADDED
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"modes": [
|
3 |
+
"fp16",
|
4 |
+
"q8",
|
5 |
+
"int8",
|
6 |
+
"uint8",
|
7 |
+
"q4",
|
8 |
+
"q4f16",
|
9 |
+
"bnb4"
|
10 |
+
],
|
11 |
+
"per_channel": true,
|
12 |
+
"reduce_range": true,
|
13 |
+
"block_size": null,
|
14 |
+
"is_symmetric": true,
|
15 |
+
"accuracy_level": null,
|
16 |
+
"quant_type": 1,
|
17 |
+
"op_block_list": null
|
18 |
+
}
|