riczhou committed on
Commit
6751d10
·
verified ·
1 Parent(s): 30938fd

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
mlc-chat-config.json ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "deepseek_v2",
4
+ "quantization": "q0f16",
5
+ "model_config": {
6
+ "vocab_size": 102400,
7
+ "hidden_size": 2048,
8
+ "intermediate_size": 10944,
9
+ "moe_intermediate_size": 1408,
10
+ "num_hidden_layers": 27,
11
+ "num_attention_heads": 16,
12
+ "num_key_value_heads": 16,
13
+ "n_shared_experts": 2,
14
+ "n_routed_experts": 64,
15
+ "num_experts_per_tok": 6,
16
+ "norm_topk_prob": false,
17
+ "first_k_dense_replace": 1,
18
+ "moe_layer_freq": 1,
19
+ "routed_scaling_factor": 1.0,
20
+ "attention_bias": false,
21
+ "kv_lora_rank": 512,
22
+ "qk_rope_head_dim": 64,
23
+ "v_head_dim": 128,
24
+ "qk_nope_head_dim": 128,
25
+ "rms_norm_eps": 1e-06,
26
+ "rope_theta": 10000,
27
+ "q_lora_rank": null,
28
+ "rope_scaling": {
29
+ "beta_fast": 32,
30
+ "beta_slow": 1,
31
+ "factor": 40,
32
+ "mscale": 0.707,
33
+ "mscale_all_dim": 0.707,
34
+ "original_max_position_embeddings": 4096,
35
+ "type": "yarn"
36
+ },
37
+ "context_window_size": 163840,
38
+ "prefill_chunk_size": 8192,
39
+ "tensor_parallel_shards": 1,
40
+ "dtype": "float32",
41
+ "max_batch_size": 128
42
+ },
43
+ "vocab_size": 102400,
44
+ "context_window_size": 163840,
45
+ "sliding_window_size": -1,
46
+ "prefill_chunk_size": 8192,
47
+ "attention_sink_size": -1,
48
+ "tensor_parallel_shards": 1,
49
+ "pipeline_parallel_stages": 1,
50
+ "temperature": 0.3,
51
+ "presence_penalty": 0.0,
52
+ "frequency_penalty": 0.0,
53
+ "repetition_penalty": 1.0,
54
+ "top_p": 0.95,
55
+ "tokenizer_files": [
56
+ "tokenizer.json",
57
+ "tokenizer_config.json"
58
+ ],
59
+ "tokenizer_info": {
60
+ "token_postproc_method": "byte_level",
61
+ "prepend_space_in_encode": false,
62
+ "strip_space_in_decode": false
63
+ },
64
+ "conv_template": {
65
+ "name": "deepseek_v2",
66
+ "system_template": "{system_message}",
67
+ "system_message": "",
68
+ "system_prefix_token_ids": [
69
+ 100000
70
+ ],
71
+ "add_role_after_system_message": true,
72
+ "roles": {
73
+ "user": "User",
74
+ "assistant": "Assistant"
75
+ },
76
+ "role_templates": {
77
+ "user": "{user_message}",
78
+ "assistant": "{assistant_message}",
79
+ "tool": "{tool_message}"
80
+ },
81
+ "messages": [],
82
+ "seps": [
83
+ "\n\n",
84
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
85
+ ],
86
+ "role_content_sep": ": ",
87
+ "role_empty_sep": ":",
88
+ "stop_str": [
89
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
90
+ ],
91
+ "stop_token_ids": [
92
+ 100001
93
+ ],
94
+ "function_string": "",
95
+ "use_function_calling": false
96
+ },
97
+ "pad_token_id": 0,
98
+ "bos_token_id": 100000,
99
+ "eos_token_id": 100001
100
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a679f69648082b612a453de560fa6a77d17bf1e0464e08613a52cf308c7af0cc
3
+ size 419430400
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23c0c0f57a106b2136d9d60e2c813a05f8134d4774f7ed1e63fa7b32a80806a0
3
+ size 419430400
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc3c55dcc1d79327637200fef13300eb71d3d628712c30d04f818ea1e02d1255
3
+ size 31719424
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3a63582ed1419f8305c2e6debb993a2aa3168350ae3ee9cc62c7ad6ecd67160
3
+ size 369098752
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:931262ad80fb84c03aea977a5879a7263bcd2caf7455f0e71e52445eb70d36bc
3
+ size 30680064
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81729321620b57eb90e9333d34a99c5a0f4b6a4a2f1ae2cddba946d3982964ba
3
+ size 31719424
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58a95c00587eafb512c8ffb488c9d14f2833f3f5fde46bc6379e720ead7bae55
3
+ size 738197504
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62381460c63fad20e764e65e938684eae7b0e23f6d99b1a69617cbbc9576c71b
3
+ size 369098752
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a05b024c74815180671dc21d6498e3d5e854a5ce41bafef241685b62fc782ced
3
+ size 30680064
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2fba23491568f81ffad108ad6975e54e84e8a763df3f886096794fc3b98dd99
3
+ size 31719424
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34002213ea405c42149fdb8b89f890c362e3f40d16f62de006b2335777836c2d
3
+ size 738197504
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf6177b8af596559ed4b8f0523bc50b62d59094604c920ae021542db861146b4
3
+ size 369098752
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecc65b84320ae8a790cdb6cb322f99aaa8e9596ef7ade219f6856a6de34c6b68
3
+ size 11542528
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d95ad7970200415f0a1e0b267e17db358966d137ada9514e92e990c639ecad8a
3
+ size 738197504
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b57a42566032bfd69448cea521112e43f58d97dd01c83d05626e5624b5fec9ac
3
+ size 369098752
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:378ee55a3db1e7bd4d30bf1a3cde16993e9127f9c44593e08326f74b4551a4b3
3
+ size 30680064
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f37481caab0470865bbed70bc92a1ec85676a2903d6777c3bb4c037cd12b9e37
3
+ size 31719424
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:383d6a2964a7689cc2433e9a00134e0b2a649a4e3027c6ab86e02eedede704af
3
+ size 738197504
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef49552dfc191f8bfea513c3c48f53cd16ca91a45b68a50a6cac77797f63f796
3
+ size 369098752
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6f1cd81f86495fa9737985c4c9d6cff4c35f27dce7f48b9697dd646830057ec
3
+ size 30680064
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4ba2c7c80430214aeec0a1a9622255d6bf0668bd20f63b286c173bacdf89698
3
+ size 31719424
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bac3165de1e60085127aa7710568e0e828972fc7fb26c90340d779a7209efaf
3
+ size 738197504
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6aa8cb4a4dc989e0b6e87e86a69abff151c679c7b8c801ebec0d1654a73481e9
3
+ size 89653248
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfa4b0cc4ea7135732b0f50f2cf5ac215c7b50f7b57063898515f6f046b62568
3
+ size 369098752
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3efdb6b8cc87bb2ba77189f06be8c19615593f77b64257c97742ab4b5197be06
3
+ size 30680064
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5310be629d3f30292eadbc368d4db9fd7e48e457c3ded51dc80277f4e727141c
3
+ size 31719424
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:834a2f54db36d7f2d4a746f670cb6bc20d9f98b930c240710ee7aac5d11b124d
3
+ size 738197504
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f242f51fecbdd7e9fb3c2bd48b5d26e4c90ef0fd40decad45439e2933f7a5197
3
+ size 369098752
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9e4512e449a83e9093f4e0ed305db06fa5ab2a22d5fcdf9c0673607a4e5da1f
3
+ size 30680064
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a8f251bec25719559ca7438fd60c0c806d1cfe5d23d17eb975b978cdf4bb782
3
+ size 31719424
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62a59cfb5661db2326b8c67ed36461bbeeb457108eb49a4380d708e527ac2334
3
+ size 738197504
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7971bd82a72a0c8433b4dcfe884efd313c79f792cadd3d03eaee1773d554ff1
3
+ size 369098752
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30aff8e7e28cdcd63bb62955accf9ff19b3f964ab5fd51aa3ac029bfbcf78f14
3
+ size 30680064
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:accb12da31d09964b677d4b22d4e79f07d38bc7be041cac4bb2c0b15bf7ad50d
3
+ size 44826624
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eca83b9ba47d55c5d753bb29ea043c9cd97263ffc835ff97559448e8c3958e02
3
+ size 31719424
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5cfbfd0adf5ab2b1aaad8bdf4bc6009cab8420bda580be073353e0b0ccb579e
3
+ size 738197504
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb5d8ba7b4ce33d1d85f14073b294394294dc02a29561402a93ccd6b7b426edc
3
+ size 369098752
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f77c48d7438d2fb5ac98f51305cb5ad3768eb45e2dba562ec9f60f7367d6c69c
3
+ size 30680064
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53fa5494535856142ee52307ce3074768e18aa22d4b6c332717ee5796a4bf247
3
+ size 31719424
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50d97d02700fa7a84256be423535565e40847b9a920d7a33abfa0e8ea08ed461
3
+ size 738197504
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:280d8a938ae204f00496c4fae0be0812ce1837787c99704e4d3452be78ebb5d4
3
+ size 369098752
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6314488142da4fa7aa0841ac62f43696ff48e118d7ea267d2910d047735e7da9
3
+ size 30680064
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00e012cb4c89578529d85a121cb36caf9fc6084704549865fa268980e36eb5a2
3
+ size 31719424
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01b6018f587b2104a9d61d6993ad6933631c665357a8f71d1967d800c888c001
3
+ size 738197504
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7e2001f0ee1b1f74612ddb58ed758504bcbd2f99c191570a9467839da093fc1
3
+ size 27538432
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3fa027b5710fc0d0dc761aadb5cd48eba9b5a848597b059339a9bb13aefc319
3
+ size 369098752
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bba210d408ac2f3408a6dcf883ba9ad68a215a55b4095f550814476e87f04445
3
+ size 30680064
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ad07ab71cbe62bb0cafc5b074e3ae868fd2d7c1ca5a620a81618e6187e6c7f2
3
+ size 31719424