Xenova HF Staff committed on
Commit
f6a3e33
·
verified ·
1 Parent(s): 59d85ac

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -39,3 +39,4 @@ onnx/model_q4.onnx_data filter=lfs diff=lfs merge=lfs -text
39
  onnx/model_q4f16.onnx_data filter=lfs diff=lfs merge=lfs -text
40
  onnx/model_q4f32.onnx_data filter=lfs diff=lfs merge=lfs -text
41
  onnx/model_q8.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
39
  onnx/model_q4f16.onnx_data filter=lfs diff=lfs merge=lfs -text
40
  onnx/model_q4f32.onnx_data filter=lfs diff=lfs merge=lfs -text
41
  onnx/model_q8.onnx_data filter=lfs diff=lfs merge=lfs -text
42
+ onnx/model_quantized.onnx_data filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -4,7 +4,6 @@
4
  ],
5
  "block_auto_adjust_ff_dim": true,
6
  "block_dim": 1024,
7
- "block_ff_dim": 6656,
8
  "block_ffn_dim_multiplier": 1.0,
9
  "block_mlp_init_scale": 1.0,
10
  "block_multiple_of": 256,
@@ -19,6 +18,7 @@
19
  "conv_use_xavier_init": true,
20
  "dtype": "bfloat16",
21
  "eos_token_id": 7,
 
22
  "hidden_size": 1024,
23
  "initializer_range": 0.02,
24
  "intermediate_size": 6656,
@@ -52,15 +52,16 @@
52
  "rope_theta": 1000000.0,
53
  "rope_type": "default"
54
  },
55
- "tie_embedding": true,
56
- "transformers_version": "5.0.0.dev0",
57
  "use_cache": true,
58
  "use_pos_enc": true,
59
  "vocab_size": 65536,
60
  "transformers.js_config": {
 
61
  "kv_cache_dtype": {
62
- "fp32": "float32"
63
- },
64
- "use_external_data_format": true
65
  }
66
  }
 
4
  ],
5
  "block_auto_adjust_ff_dim": true,
6
  "block_dim": 1024,
 
7
  "block_ffn_dim_multiplier": 1.0,
8
  "block_mlp_init_scale": 1.0,
9
  "block_multiple_of": 256,
 
18
  "conv_use_xavier_init": true,
19
  "dtype": "bfloat16",
20
  "eos_token_id": 7,
21
+ "full_attn_idxs": null,
22
  "hidden_size": 1024,
23
  "initializer_range": 0.02,
24
  "intermediate_size": 6656,
 
52
  "rope_theta": 1000000.0,
53
  "rope_type": "default"
54
  },
55
+ "tie_word_embeddings": true,
56
+ "transformers_version": "5.5.0.dev0",
57
  "use_cache": true,
58
  "use_pos_enc": true,
59
  "vocab_size": 65536,
60
  "transformers.js_config": {
61
+ "use_external_data_format": true,
62
  "kv_cache_dtype": {
63
+ "q4f16": "float16",
64
+ "fp16": "float16"
65
+ }
66
  }
67
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "bos_token_id": 1,
4
  "eos_token_id": 7,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.54.0"
7
- }
 
3
  "bos_token_id": 1,
4
  "eos_token_id": 7,
5
  "pad_token_id": 0,
6
+ "transformers_version": "5.5.0.dev0"
7
+ }
onnx/model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c43efd6be4b93b69676b8d6c9699042cd0aef76329eea1934636111103880ff
3
- size 145288
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccbf08c2e3a752af056182733da1ce9f0b0ad4961d1bc0fc97ef4a6f064c6e5b
3
+ size 141116
onnx/model.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00ec28c8f2c6e5cbca8c5e6b15d6b51cf849a91b5f51a4f495f7fbc3dc6ca0dc
3
  size 1450700800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6401d6753c3e299b0dbe7778489339c0aa3af480b2446d47c4d4a46b18c32d8
3
  size 1450700800
onnx/model_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea5f5fa192a5c3dae08ffbcaa3c8eeeeffb417aa3ac7d9e51ae71a8c5b108f64
3
- size 151040
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:feb1c4a52e2756183f5ec7dd8d2c2d53d31465ba5050765b6c9f9c7a0a6c4705
3
+ size 140155
onnx/model_fp16.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdca4e312c904c91527ad62299d4c17e5e9b699938cd1fb18c8a7d90c8468ddc
3
  size 725350400
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02f0ed790a23eafc73b1c5a77cf85628b4c04294fdc391aea387b58ad3b52f36
3
  size 725350400
onnx/model_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ff97f8b65726cf78aff596b82a61e8dc1bc86745310023badec30568dda94a5
3
- size 173505
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1a705712e93aafaba1346b32245fa59e7857a46e2272003c0e8c524977e0de8
3
+ size 183442
onnx/model_q4.onnx_data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae94bc207a6d5e4d3f9f3ef3334f62374c452414d5d783ae367dc33f3154a7d5
3
- size 289140736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71ec6ad38a4c463dcb3dba671d06a1d9861be3a23e51290d818b95c0b7d2a5db
3
+ size 293629952
onnx/model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3012c28a119828561c90196331435d91c43c1a6ab4898ac79715585fff1dff85
3
+ size 182827
onnx/model_q4f16.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9256ecd417b801b441d926ebe5ead4ebf50ac1a5a0f8f7914cf60d9d6452ef69
3
+ size 254965760
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb7d0a2b14c7ffc8031d306e7d4dacb88f14070082c5708b673afe05013adde3
3
+ size 185941
onnx/model_quantized.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a37d3df8609169f802eb7ca3b8d19669bf9367f292ab46696c84bbe3b19cbd9
3
+ size 509931520
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -3,6 +3,7 @@
3
  "bos_token": "<|startoftext|>",
4
  "clean_up_tokenization_spaces": false,
5
  "eos_token": "<|im_end|>",
 
6
  "is_local": false,
7
  "legacy": false,
8
  "model_input_names": [
 
3
  "bos_token": "<|startoftext|>",
4
  "clean_up_tokenization_spaces": false,
5
  "eos_token": "<|im_end|>",
6
+ "extra_special_tokens": [],
7
  "is_local": false,
8
  "legacy": false,
9
  "model_input_names": [