Xenova HF Staff committed on
Commit
09fbb30
·
verified ·
1 Parent(s): aad6418

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -40,3 +40,5 @@ onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
40
  onnx/model_fp16.onnx_data_1 filter=lfs diff=lfs merge=lfs -text
41
  onnx/model_q4.onnx_data filter=lfs diff=lfs merge=lfs -text
42
  onnx/model_q8.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
 
40
  onnx/model_fp16.onnx_data_1 filter=lfs diff=lfs merge=lfs -text
41
  onnx/model_q4.onnx_data filter=lfs diff=lfs merge=lfs -text
42
  onnx/model_q8.onnx_data filter=lfs diff=lfs merge=lfs -text
43
+ onnx/model_q4f16.onnx_data filter=lfs diff=lfs merge=lfs -text
44
+ onnx/model_quantized.onnx_data filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -53,14 +53,19 @@
53
  "rope_type": "default"
54
  },
55
  "tie_embedding": true,
56
- "transformers_version": "5.0.0.dev0",
 
57
  "use_cache": true,
58
  "use_pos_enc": true,
59
  "vocab_size": 65536,
60
  "transformers.js_config": {
61
- "kv_cache_dtype": {
62
- "fp32": "float32"
 
63
  },
64
- "use_external_data_format": true
 
 
 
65
  }
66
  }
 
53
  "rope_type": "default"
54
  },
55
  "tie_embedding": true,
56
+ "tie_word_embeddings": true,
57
+ "transformers_version": "5.1.0",
58
  "use_cache": true,
59
  "use_pos_enc": true,
60
  "vocab_size": 65536,
61
  "transformers.js_config": {
62
+ "use_external_data_format": {
63
+ "model.onnx": 3,
64
+ "model_fp16.onnx": 2
65
  },
66
+ "kv_cache_dtype": {
67
+ "q4f16": "float16",
68
+ "fp16": "float16"
69
+ }
70
  }
71
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "bos_token_id": 1,
4
  "eos_token_id": 7,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.54.0"
7
- }
 
3
  "bos_token_id": 1,
4
  "eos_token_id": 7,
5
  "pad_token_id": 0,
6
+ "transformers_version": "5.1.0"
7
+ }
onnx/model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48f0ef6fc4a205c0d7228c7d2a92443114b4c471a8a588efd47474f3ba9d0043
3
- size 145492
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf4a28589b70ad89e2a7bd4bb96673388c83f84e0cee024a68edd50a26452fa8
3
+ size 140810
onnx/model.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e71dc1e6ac7522e29d454772e0799945d3ca327b7f0ca7f8f46f2cd17ef161f5
3
- size 2130132992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81d09021f0d84568e3cc5f8420b0940a390698db3a2dd976aa737846b73fa4f3
3
+ size 2063007744
onnx/model.onnx_data_1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b61a4574a61fcf7295ed5ed729ae601f7f35199123355031ec0ba3ae5db517c5
3
- size 2139348992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fea31f1d31cae36c22dc152158929e11166d5fec564ed5ac593708e5949f6a84
3
+ size 2072240128
onnx/model.onnx_data_2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:066a0b34a6a8279687c652d6282b55e512e01d92f3e84d97b44c2bde0608c9c1
3
- size 444645376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b691a34d2969fce9abed636a029951c579964d8f899d62a0d6ca43d24df2121f
3
+ size 578879488
onnx/model_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb5c5524c9da2bb3b6c816be4f9881df60f8f61b6b7acc3cd2aa2b17b366cb31
3
- size 151225
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:112553fae9673ec1f71aadc3530c741abed58cdead71b9c19dd5d721417f0a40
3
+ size 140027
onnx/model_fp16.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:99cbdb07dee247db39a63f479d92be89572792a7a9a6c65f113d0bf5134306bd
3
- size 2134740992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e29e346d8cecb9555b4b5abb1f5ab66fca8bda6eab075505261a22bfd3d0b12
3
+ size 2067623936
onnx/model_fp16.onnx_data_1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39440614fe3459ceffe3dc6edd54f988ea03554af831b9a34645d291a3ae2875
3
- size 222322688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5382e7baed997a1106686033dbf7bd31278b37ffb61ceb87de6458a0c1c79d4
3
+ size 289439744
onnx/model_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e8088d6d8f0cd84887f0a1c79b5f78379a876a529a9a5e75bb973aa74cb73e2
3
- size 172944
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5bc6cf550a03b3af4e7b4cde18760cfc5a8b68d50f6213a8c91461bb7ed5eee
3
+ size 183173
onnx/model_q4.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb7185ee124d2bec30fdd28a6e6726aba1d32daa7fd4b128899d6fa1b8cd1d6c
3
- size 1217650688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ac2808138dc4e1c1d4e7bf1dcde0a8551305ac827641a68360a5984c79d37ce
3
+ size 850059264
onnx/model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:047e8393e85292a885d7443509d571e25441db7c31559195b67db0b1607ab0bc
3
+ size 182795
onnx/model_q4f16.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da02a690901817926fe4b8cda11e3fddc42604729dd4ce62c39df53a3ec2094d
3
+ size 760279040
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:916f4d713725879067f40eac140a9b93d9a74c50c3c00bf4f9b0e88d1c247c71
3
+ size 185703
onnx/model_quantized.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20753c26acaa4ae486b5e3c9a0c7b3abd4d6608029763c9ea83cdf56aea0a4f9
3
+ size 1520558080
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "additional_special_tokens": null,
3
  "backend": "tokenizers",
4
  "bos_token": "<|startoftext|>",
5
  "clean_up_tokenization_spaces": false,
@@ -11,7 +10,6 @@
11
  "attention_mask"
12
  ],
13
  "model_max_length": 1000000000000000019884624838656,
14
- "model_specific_special_tokens": {},
15
  "pad_token": "<|pad|>",
16
  "sp_model_kwargs": {},
17
  "spaces_between_special_tokens": false,
 
1
  {
 
2
  "backend": "tokenizers",
3
  "bos_token": "<|startoftext|>",
4
  "clean_up_tokenization_spaces": false,
 
10
  "attention_mask"
11
  ],
12
  "model_max_length": 1000000000000000019884624838656,
 
13
  "pad_token": "<|pad|>",
14
  "sp_model_kwargs": {},
15
  "spaces_between_special_tokens": false,