Add files using upload-large-folder tool
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .msc +0 -0
- .mv +1 -0
- config.json +40 -0
- configuration.json +1 -0
- merges.txt +0 -0
- model-00001-of-00118.safetensors +3 -0
- model-00002-of-00118.safetensors +3 -0
- model-00003-of-00118.safetensors +3 -0
- model-00004-of-00118.safetensors +3 -0
- model-00005-of-00118.safetensors +3 -0
- model-00006-of-00118.safetensors +3 -0
- model-00007-of-00118.safetensors +3 -0
- model-00008-of-00118.safetensors +3 -0
- model-00009-of-00118.safetensors +3 -0
- model-00010-of-00118.safetensors +3 -0
- model-00011-of-00118.safetensors +3 -0
- model-00012-of-00118.safetensors +3 -0
- model-00013-of-00118.safetensors +3 -0
- model-00014-of-00118.safetensors +3 -0
- model-00015-of-00118.safetensors +3 -0
- model-00016-of-00118.safetensors +3 -0
- model-00017-of-00118.safetensors +3 -0
- model-00018-of-00118.safetensors +3 -0
- model-00019-of-00118.safetensors +3 -0
- model-00020-of-00118.safetensors +3 -0
- model-00021-of-00118.safetensors +3 -0
- model-00022-of-00118.safetensors +3 -0
- model-00023-of-00118.safetensors +3 -0
- model-00024-of-00118.safetensors +3 -0
- model-00025-of-00118.safetensors +3 -0
- model-00026-of-00118.safetensors +3 -0
- model-00027-of-00118.safetensors +3 -0
- model-00028-of-00118.safetensors +3 -0
- model-00029-of-00118.safetensors +3 -0
- model-00030-of-00118.safetensors +3 -0
- model-00031-of-00118.safetensors +3 -0
- model-00032-of-00118.safetensors +3 -0
- model-00033-of-00118.safetensors +3 -0
- model-00034-of-00118.safetensors +3 -0
- model-00035-of-00118.safetensors +3 -0
- model-00036-of-00118.safetensors +3 -0
- model-00037-of-00118.safetensors +3 -0
- model-00038-of-00118.safetensors +3 -0
- model-00039-of-00118.safetensors +3 -0
- model-00040-of-00118.safetensors +3 -0
- model-00041-of-00118.safetensors +3 -0
- model-00042-of-00118.safetensors +3 -0
- model-00043-of-00118.safetensors +3 -0
- model-00044-of-00118.safetensors +3 -0
- model-00045-of-00118.safetensors +3 -0
.msc
ADDED
Binary file (10.7 kB). View file
|
|
.mv
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
Revision:master,CreatedAt:1753414958
|
config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"Qwen2MoeForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_dropout": 0.0,
|
6 |
+
"bos_token_id": 151643,
|
7 |
+
"decoder_sparse_step": 1,
|
8 |
+
"eos_token_id": 151645,
|
9 |
+
"head_dim": 128,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 4096,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 16384,
|
14 |
+
"max_position_embeddings": 131072,
|
15 |
+
"max_window_layers": 28,
|
16 |
+
"mlp_only_layers": [],
|
17 |
+
"model_type": "qwen2_moe",
|
18 |
+
"moe_intermediate_size": 1536,
|
19 |
+
"norm_topk_prob": true,
|
20 |
+
"num_attention_heads": 64,
|
21 |
+
"num_experts": 128,
|
22 |
+
"num_experts_per_tok": 8,
|
23 |
+
"num_hidden_layers": 94,
|
24 |
+
"num_key_value_heads": 4,
|
25 |
+
"output_router_logits": false,
|
26 |
+
"qkv_bias": false,
|
27 |
+
"rms_norm_eps": 1e-06,
|
28 |
+
"rope_scaling": null,
|
29 |
+
"rope_theta": 5000000.0,
|
30 |
+
"router_aux_loss_coef": 0.001,
|
31 |
+
"shared_expert_intermediate_size": 0,
|
32 |
+
"sliding_window": null,
|
33 |
+
"tie_word_embeddings": false,
|
34 |
+
"torch_dtype": "bfloat16",
|
35 |
+
"transformers_version": "4.51.3",
|
36 |
+
"use_cache": true,
|
37 |
+
"use_qk_norm": true,
|
38 |
+
"use_sliding_window": false,
|
39 |
+
"vocab_size": 151936
|
40 |
+
}
|
configuration.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"framework":"Pytorch","task":"text-generation"}
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model-00001-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6ee892b96983b30c2ab6aabfb507625b05071991129515aff658db9691419ef
|
3 |
+
size 3991955880
|
model-00002-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50f3690d9ca2fc491af3c8e68b3fe39155b8b4745c17356e60aa1f86bf5e68dd
|
3 |
+
size 3994081856
|
model-00003-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7abec76f18b0ed4c37b0bc7d1a990bd1abbad2684476edd2657a53f06756b58
|
3 |
+
size 3994081856
|
model-00004-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0907c3204f7a4658427db5fd4e61398eddf63c10615c0610e43cb3c5b371eb05
|
3 |
+
size 3988822448
|
model-00005-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c40ca3e04508ca33cba860330220ba183b268f144a7e38799b80841b714f985
|
3 |
+
size 3994081784
|
model-00006-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0792ddfc132f64d67ac19cd49c7063c6a273afe065528a22b66ffef69425aa03
|
3 |
+
size 3994081856
|
model-00007-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e3af0e36505455968544d21dd27958bd67c970cebd0dd378d1cb380a3070518
|
3 |
+
size 3994081856
|
model-00008-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18bce9478549f2372efdf291781c73fe59b18d9d99d7883bc77876fe51854c11
|
3 |
+
size 3994081856
|
model-00009-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:876a530bb2f165eebc8d4299a3bd6ca7e2fbff6fffffadf0664d8dc60cb32792
|
3 |
+
size 3988822456
|
model-00010-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4db039290306c7aaefc7b73f21b5dfc69d45eec9561e9686fc133fb51960c72a
|
3 |
+
size 3994081784
|
model-00011-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03028ca3c973564b0edb3e2281945c8b70e67726658a51e0df25cf9b698e5410
|
3 |
+
size 3994081856
|
model-00012-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8e514e48ae0abecf540a30cb3c25a0279f574a8dc41a37bfd3fc61166499742
|
3 |
+
size 3994081856
|
model-00013-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a57ba3900a6316de2a1ee2c838362db932edd2d51737c0ec91d0ca950e2a7a7
|
3 |
+
size 3994081944
|
model-00014-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c342f94a08e9b8c77b26b7036ba6d5e5f0a6286435ed8c48e448bf0ac3150701
|
3 |
+
size 3988822776
|
model-00015-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b00942677bfe7109f470115fcc2627cebc506eb6cf293950a7f7ea6f363c8fe
|
3 |
+
size 3994082088
|
model-00016-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b5a535d7ac5ff335234cc5a45fcbb683ed125f81a359dd1db0e56a561f3982f
|
3 |
+
size 3994082176
|
model-00017-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:135c454ab6608988e77ec0c7bbdcd293ece38493a7ce44049569a6d4d2944ba6
|
3 |
+
size 3994082176
|
model-00018-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5323a2c977d2a674fbc1c873d45261f4e4ffbf8a7be4a057453e290d7523ae4
|
3 |
+
size 3994082176
|
model-00019-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58b9be7051da0e391b23e22a2a356d3e4528164cfc3899494e84f0246a5981f0
|
3 |
+
size 3988822776
|
model-00020-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b503c8a0d9160f8adcf038df6963b1a370d41e47f4cef0a49a6267b796b7b4c4
|
3 |
+
size 3994082088
|
model-00021-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a0b41f3f89a1ffb0df85cd5c14be463c9c4e4a255ed19e7e96f2641d7e1929b
|
3 |
+
size 3994082160
|
model-00022-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c952bbbd0300c1f3ab8e034a080ae4eb0016e90ed2274dcd22d3786972e36c23
|
3 |
+
size 3994082176
|
model-00023-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:315abaf08128196616024ffc3bccb2fdeda1c2864094fc8967faf5ef329561e3
|
3 |
+
size 3994082176
|
model-00024-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05666d803688653bab3925d79f2975c2d980458a445f2498d1655f5f91013a88
|
3 |
+
size 3939555920
|
model-00025-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d6fecef7d06b9fd15fa66f19fb8710b412a8ee82fb00277c90c781d8e9b1658
|
3 |
+
size 3993016808
|
model-00026-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcc0c8b1b5b720b2aa4a26dd31c8727957f2319a303fc77016c917aa0e88952b
|
3 |
+
size 3994082160
|
model-00027-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fba38162368a55d486e8f8f930c5c43fe4651e9ed5108a243b873f66fdb247bd
|
3 |
+
size 3994082176
|
model-00028-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6d86f488816c479e1c29e5abb1b1978bc72897fc59a2a9f48510351cccefbf5
|
3 |
+
size 3994082176
|
model-00029-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:607ed19a00bb8acbeb0e0e42aa87dbc53801f39db0037863ef213ad4d290e4ae
|
3 |
+
size 3998276288
|
model-00030-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5aaea852a8075473f82655a63a2eb0e52959b513d59d545af9cc3db45b5f50d
|
3 |
+
size 3997211632
|
model-00031-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d6b5cd3ab1edab6cee36c1e9d247947b6df28c0819649c8ca1bd86a550e5386
|
3 |
+
size 3994082160
|
model-00032-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5a66bcb5cc879678781f1067edc00646419ec2edd756439775491ce3a7b3acf
|
3 |
+
size 3994082176
|
model-00033-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21db193b373d1b60ed5817faa1a71305f2e7b67860dc101eac60ac1638c9f506
|
3 |
+
size 3994082176
|
model-00034-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e06bde20e529c528bba181b2bd28d0d9672511c5b61e625d17e5af970eb3257
|
3 |
+
size 3994082200
|
model-00035-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c0715d00097c2fc1ecaa6db8b64f18bdef8d2ed9ee7289664fc6c07b9b9b626
|
3 |
+
size 3988822680
|
model-00036-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4157226ad6f09e701ab1aa4c3ca1f91225ba3d8b55b34fded8b3c85ab1ff02f
|
3 |
+
size 3994082152
|
model-00037-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a89bdb91088163e30a1ec12a116942c856ae03d2cf6da35c19c89b161544ce42
|
3 |
+
size 3994082176
|
model-00038-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:557c3c9f000a9c668c79f3aa828cdbbc6bd9964ca07ae5aed41e6854539ee131
|
3 |
+
size 3994082176
|
model-00039-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10d8c34441a5ce1167ac67d120ce89e76c41b61be75a5fe74c81e6e86f273058
|
3 |
+
size 3994082200
|
model-00040-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44cb269ce442ce8daf8e003ead6be0028aebfa876dca71875c69a4c45aabf89a
|
3 |
+
size 3988822696
|
model-00041-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87c5e1830ece3874be1aa0061ea948450b6db1968e15fee3a9e1b513bfa6502c
|
3 |
+
size 3994082144
|
model-00042-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df37f6a28d209e5a16d7948b63ac1be8aa3b4ec0c2b896393de3dcda34d2e831
|
3 |
+
size 3994082176
|
model-00043-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:665987ad9c57e64681dacdd1e720f44b65615ac00c0c433f72f79d98fa118c4b
|
3 |
+
size 3994082176
|
model-00044-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9b5fe4a1265f48826c67878c5c692f4b6044b9f2e2c5be9db35eeeb3aceabea
|
3 |
+
size 3994082192
|
model-00045-of-00118.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b4843915f9148142c23e5edeb1c21d356d773a78edab4c4dc9f1c1eecc24f60
|
3 |
+
size 3988822704
|