tomasmcm committed on
Commit
530cc48
·
verified ·
1 Parent(s): d01def5

Upload folder using huggingface_hub

Browse files
.gitignore ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ node_modules
2
+ .DS_Store
3
+ .cache
config.json ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_attn_implementation_autoset": true,
3
+ "_name_or_path": "allenai/unifiedqa-v2-t5-large-1363200",
4
+ "architectures": [
5
+ "T5ForConditionalGeneration"
6
+ ],
7
+ "classifier_dropout": 0.0,
8
+ "d_ff": 4096,
9
+ "d_kv": 64,
10
+ "d_model": 1024,
11
+ "decoder_start_token_id": 0,
12
+ "dense_act_fn": "relu",
13
+ "dropout_rate": 0.1,
14
+ "eos_token_id": 1,
15
+ "feed_forward_proj": "relu",
16
+ "gradient_checkpointing": false,
17
+ "initializer_factor": 1.0,
18
+ "is_encoder_decoder": true,
19
+ "is_gated_act": false,
20
+ "layer_norm_epsilon": 1e-06,
21
+ "model_type": "t5",
22
+ "n_positions": 512,
23
+ "num_decoder_layers": 24,
24
+ "num_heads": 16,
25
+ "num_layers": 24,
26
+ "output_past": true,
27
+ "pad_token_id": 0,
28
+ "relative_attention_max_distance": 128,
29
+ "relative_attention_num_buckets": 32,
30
+ "task_specific_params": {
31
+ "summarization": {
32
+ "early_stopping": true,
33
+ "length_penalty": 2.0,
34
+ "max_length": 200,
35
+ "min_length": 30,
36
+ "no_repeat_ngram_size": 3,
37
+ "num_beams": 4,
38
+ "prefix": "summarize: "
39
+ },
40
+ "translation_en_to_de": {
41
+ "early_stopping": true,
42
+ "max_length": 300,
43
+ "num_beams": 4,
44
+ "prefix": "translate English to German: "
45
+ },
46
+ "translation_en_to_fr": {
47
+ "early_stopping": true,
48
+ "max_length": 300,
49
+ "num_beams": 4,
50
+ "prefix": "translate English to French: "
51
+ },
52
+ "translation_en_to_ro": {
53
+ "early_stopping": true,
54
+ "max_length": 300,
55
+ "num_beams": 4,
56
+ "prefix": "translate English to Romanian: "
57
+ }
58
+ },
59
+ "torch_dtype": "float32",
60
+ "transformers_version": "4.49.0",
61
+ "use_cache": true,
62
+ "vocab_size": 32128
63
+ }
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "decoder_start_token_id": 0,
4
+ "eos_token_id": 1,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "4.49.0"
7
+ }
onnx/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2eacf36c151a0e80a5e56b29a12b13d7d141442903ec2c440e05e5ba397e41c2
3
+ size 1743103924
onnx/decoder_model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9aa43fde0b81236f5c19188832203c5bdcc2f12f93353f97fb11d3be8866b200
3
+ size 359021207
onnx/decoder_model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:199acf8fe1137d1a7f9f6ec5c0a3e88dd981d8dcd267351923d68c1dec95b9e8
3
+ size 871854042
onnx/decoder_model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18e01e1399486daca9a148552d65db1412e95fac90ffe52cc30cd78546ed2589
3
+ size 569935579
onnx/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9767947c33e56c3dbd086b185445d1941caf8a22afd5212ffacda88b91350bf2
3
+ size 1743785138
onnx/decoder_model_merged_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f87a8b0cc6e48d5b5f003a3ef4fc979550cbcdefd43de613dd7399aba3dd96f
3
+ size 359730549
onnx/decoder_model_merged_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4195cb679d9f618bd9203b904e6a011e44cfca24c8fe2a24a69a82e5f88d962
3
+ size 872566908
onnx/decoder_model_merged_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:484ca47766b2241f1807858cd0d6bfd0bb19a13963d55e03bf9610598f4a3566
3
+ size 570861604
onnx/decoder_model_merged_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da10cc93d24f1ca402f2b32d43d7123aed6dd62d61423b899a9a6c001ba030af
3
+ size 384892701
onnx/decoder_model_merged_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3fc819145cd9839b886e68e49a2f73ad200d591a43ca1eb3e180a75ad691e76
3
+ size 293815015
onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:484ca47766b2241f1807858cd0d6bfd0bb19a13963d55e03bf9610598f4a3566
3
+ size 570861604
onnx/decoder_model_merged_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:607702c5c1d4fd0e2ee1cdab2edfe85afa6b8ac20b4b5182dc832e3b3bba1d66
3
+ size 570861604
onnx/decoder_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aae945492b9bba23ef0c1d863df7946bff8fbad584a3dff9f39a59545c6d74d0
3
+ size 384185087
onnx/decoder_model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:327f23c1e68b5eb084e90b62bcee01469318695fb647cbe50a92556ca8169d0e
3
+ size 293075749
onnx/decoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18e01e1399486daca9a148552d65db1412e95fac90ffe52cc30cd78546ed2589
3
+ size 569935579
onnx/decoder_model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:191f9704159093a716b39479931466b12625630a59231a5607e63e1783669513
3
+ size 569935579
onnx/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bbb87cf546c27752e74c802c04a5253a5508aba37f3f2ec47ae005a6cbd7ead
3
+ size 1541646646
onnx/decoder_with_past_model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fc098bef6dca1af77318e403751b64507d1cf3b603535c2805acb73aee07386
3
+ size 330571481
onnx/decoder_with_past_model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0c78f732bd579ccff6fcec98c7e28bc87de1575425f21998679b9980d6ef84f
3
+ size 771079836
onnx/decoder_with_past_model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6643652ea9240ead5db02803c60ca2c9d104991af18a8ae889249f396b323d78
3
+ size 519180586
onnx/decoder_with_past_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7a537a2c85646e84ca7d4f85c666a2e40aa7e2f8b5c35b4d5fc870f0df0ccc2
3
+ size 352590017
onnx/decoder_with_past_model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d886a4c3a9647217b8506b93581a291091e99a782dd95d9fab4c146fd8123569
3
+ size 264646182
onnx/decoder_with_past_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6643652ea9240ead5db02803c60ca2c9d104991af18a8ae889249f396b323d78
3
+ size 519180586
onnx/decoder_with_past_model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bb934a16f22b01e5e889a563bdb236ac526b0911156225e72d9d2748a26f050
3
+ size 519180586
onnx/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d035485c1b20d730ac894b55da61fefdf834ab86c3f4e6f8f59753f511ff0c9
3
+ size 1340052960
onnx/encoder_model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8440235cd98a04e0b0ff7f5c9dd7debc7e179a1757cf10b7bb92ab96b7292e44
3
+ size 301985347
onnx/encoder_model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5292fa2c69d3e7453809bd34ec396f78059988a74c56d156ee2db5138a6c9333
3
+ size 670174435
onnx/encoder_model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b8b952c6fd418a9c59778cfc9ce31c3aee8c6707edc3ae70db77d63486a61ce
3
+ size 336656192
onnx/encoder_model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb98fdc7d0e0a39f3c35a952ad718554da185d3b6286ede5d644cbf307c2b390
3
+ size 320858539
onnx/encoder_model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc89605ea50f72c21a3a8b546aa60c8b1527849368a9075e6e04a9f4b5d7f2bf
3
+ size 236085421
onnx/encoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b8b952c6fd418a9c59778cfc9ce31c3aee8c6707edc3ae70db77d63486a61ce
3
+ size 336656192
onnx/encoder_model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a880fdd6d7847448eb6f87b8def9e02da3024c090aeaaadd55ce86c2543be76
3
+ size 336656192
quantize_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "modes": [
3
+ "fp16",
4
+ "q8",
5
+ "int8",
6
+ "uint8",
7
+ "q4",
8
+ "q4f16",
9
+ "bnb4"
10
+ ],
11
+ "per_channel": true,
12
+ "reduce_range": true,
13
+ "block_size": null,
14
+ "is_symmetric": true,
15
+ "accuracy_level": null,
16
+ "quant_type": 1,
17
+ "op_block_list": null
18
+ }