littlebird13 committed on
Commit
8546b01
·
verified ·
1 Parent(s): 501220d

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .msc +0 -0
  2. .mv +1 -0
  3. config.json +40 -0
  4. configuration.json +1 -0
  5. merges.txt +0 -0
  6. model-00001-of-00118.safetensors +3 -0
  7. model-00002-of-00118.safetensors +3 -0
  8. model-00003-of-00118.safetensors +3 -0
  9. model-00004-of-00118.safetensors +3 -0
  10. model-00005-of-00118.safetensors +3 -0
  11. model-00006-of-00118.safetensors +3 -0
  12. model-00007-of-00118.safetensors +3 -0
  13. model-00008-of-00118.safetensors +3 -0
  14. model-00009-of-00118.safetensors +3 -0
  15. model-00010-of-00118.safetensors +3 -0
  16. model-00011-of-00118.safetensors +3 -0
  17. model-00012-of-00118.safetensors +3 -0
  18. model-00013-of-00118.safetensors +3 -0
  19. model-00014-of-00118.safetensors +3 -0
  20. model-00015-of-00118.safetensors +3 -0
  21. model-00016-of-00118.safetensors +3 -0
  22. model-00017-of-00118.safetensors +3 -0
  23. model-00018-of-00118.safetensors +3 -0
  24. model-00019-of-00118.safetensors +3 -0
  25. model-00020-of-00118.safetensors +3 -0
  26. model-00021-of-00118.safetensors +3 -0
  27. model-00022-of-00118.safetensors +3 -0
  28. model-00023-of-00118.safetensors +3 -0
  29. model-00024-of-00118.safetensors +3 -0
  30. model-00025-of-00118.safetensors +3 -0
  31. model-00026-of-00118.safetensors +3 -0
  32. model-00027-of-00118.safetensors +3 -0
  33. model-00028-of-00118.safetensors +3 -0
  34. model-00029-of-00118.safetensors +3 -0
  35. model-00030-of-00118.safetensors +3 -0
  36. model-00031-of-00118.safetensors +3 -0
  37. model-00032-of-00118.safetensors +3 -0
  38. model-00033-of-00118.safetensors +3 -0
  39. model-00034-of-00118.safetensors +3 -0
  40. model-00035-of-00118.safetensors +3 -0
  41. model-00036-of-00118.safetensors +3 -0
  42. model-00037-of-00118.safetensors +3 -0
  43. model-00038-of-00118.safetensors +3 -0
  44. model-00039-of-00118.safetensors +3 -0
  45. model-00040-of-00118.safetensors +3 -0
  46. model-00041-of-00118.safetensors +3 -0
  47. model-00042-of-00118.safetensors +3 -0
  48. model-00043-of-00118.safetensors +3 -0
  49. model-00044-of-00118.safetensors +3 -0
  50. model-00045-of-00118.safetensors +3 -0
.msc ADDED
Binary file (10.7 kB). View file
 
.mv ADDED
@@ -0,0 +1 @@
 
 
1
+ Revision:master,CreatedAt:1753414958
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen2MoeForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 151643,
7
+ "decoder_sparse_step": 1,
8
+ "eos_token_id": 151645,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 4096,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 16384,
14
+ "max_position_embeddings": 131072,
15
+ "max_window_layers": 28,
16
+ "mlp_only_layers": [],
17
+ "model_type": "qwen2_moe",
18
+ "moe_intermediate_size": 1536,
19
+ "norm_topk_prob": true,
20
+ "num_attention_heads": 64,
21
+ "num_experts": 128,
22
+ "num_experts_per_tok": 8,
23
+ "num_hidden_layers": 94,
24
+ "num_key_value_heads": 4,
25
+ "output_router_logits": false,
26
+ "qkv_bias": false,
27
+ "rms_norm_eps": 1e-06,
28
+ "rope_scaling": null,
29
+ "rope_theta": 5000000.0,
30
+ "router_aux_loss_coef": 0.001,
31
+ "shared_expert_intermediate_size": 0,
32
+ "sliding_window": null,
33
+ "tie_word_embeddings": false,
34
+ "torch_dtype": "bfloat16",
35
+ "transformers_version": "4.51.3",
36
+ "use_cache": true,
37
+ "use_qk_norm": true,
38
+ "use_sliding_window": false,
39
+ "vocab_size": 151936
40
+ }
configuration.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"framework":"Pytorch","task":"text-generation"}
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6ee892b96983b30c2ab6aabfb507625b05071991129515aff658db9691419ef
3
+ size 3991955880
model-00002-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50f3690d9ca2fc491af3c8e68b3fe39155b8b4745c17356e60aa1f86bf5e68dd
3
+ size 3994081856
model-00003-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7abec76f18b0ed4c37b0bc7d1a990bd1abbad2684476edd2657a53f06756b58
3
+ size 3994081856
model-00004-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0907c3204f7a4658427db5fd4e61398eddf63c10615c0610e43cb3c5b371eb05
3
+ size 3988822448
model-00005-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c40ca3e04508ca33cba860330220ba183b268f144a7e38799b80841b714f985
3
+ size 3994081784
model-00006-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0792ddfc132f64d67ac19cd49c7063c6a273afe065528a22b66ffef69425aa03
3
+ size 3994081856
model-00007-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e3af0e36505455968544d21dd27958bd67c970cebd0dd378d1cb380a3070518
3
+ size 3994081856
model-00008-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18bce9478549f2372efdf291781c73fe59b18d9d99d7883bc77876fe51854c11
3
+ size 3994081856
model-00009-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:876a530bb2f165eebc8d4299a3bd6ca7e2fbff6fffffadf0664d8dc60cb32792
3
+ size 3988822456
model-00010-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4db039290306c7aaefc7b73f21b5dfc69d45eec9561e9686fc133fb51960c72a
3
+ size 3994081784
model-00011-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03028ca3c973564b0edb3e2281945c8b70e67726658a51e0df25cf9b698e5410
3
+ size 3994081856
model-00012-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8e514e48ae0abecf540a30cb3c25a0279f574a8dc41a37bfd3fc61166499742
3
+ size 3994081856
model-00013-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a57ba3900a6316de2a1ee2c838362db932edd2d51737c0ec91d0ca950e2a7a7
3
+ size 3994081944
model-00014-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c342f94a08e9b8c77b26b7036ba6d5e5f0a6286435ed8c48e448bf0ac3150701
3
+ size 3988822776
model-00015-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b00942677bfe7109f470115fcc2627cebc506eb6cf293950a7f7ea6f363c8fe
3
+ size 3994082088
model-00016-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b5a535d7ac5ff335234cc5a45fcbb683ed125f81a359dd1db0e56a561f3982f
3
+ size 3994082176
model-00017-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:135c454ab6608988e77ec0c7bbdcd293ece38493a7ce44049569a6d4d2944ba6
3
+ size 3994082176
model-00018-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5323a2c977d2a674fbc1c873d45261f4e4ffbf8a7be4a057453e290d7523ae4
3
+ size 3994082176
model-00019-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58b9be7051da0e391b23e22a2a356d3e4528164cfc3899494e84f0246a5981f0
3
+ size 3988822776
model-00020-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b503c8a0d9160f8adcf038df6963b1a370d41e47f4cef0a49a6267b796b7b4c4
3
+ size 3994082088
model-00021-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a0b41f3f89a1ffb0df85cd5c14be463c9c4e4a255ed19e7e96f2641d7e1929b
3
+ size 3994082160
model-00022-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c952bbbd0300c1f3ab8e034a080ae4eb0016e90ed2274dcd22d3786972e36c23
3
+ size 3994082176
model-00023-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:315abaf08128196616024ffc3bccb2fdeda1c2864094fc8967faf5ef329561e3
3
+ size 3994082176
model-00024-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05666d803688653bab3925d79f2975c2d980458a445f2498d1655f5f91013a88
3
+ size 3939555920
model-00025-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d6fecef7d06b9fd15fa66f19fb8710b412a8ee82fb00277c90c781d8e9b1658
3
+ size 3993016808
model-00026-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcc0c8b1b5b720b2aa4a26dd31c8727957f2319a303fc77016c917aa0e88952b
3
+ size 3994082160
model-00027-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fba38162368a55d486e8f8f930c5c43fe4651e9ed5108a243b873f66fdb247bd
3
+ size 3994082176
model-00028-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6d86f488816c479e1c29e5abb1b1978bc72897fc59a2a9f48510351cccefbf5
3
+ size 3994082176
model-00029-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:607ed19a00bb8acbeb0e0e42aa87dbc53801f39db0037863ef213ad4d290e4ae
3
+ size 3998276288
model-00030-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5aaea852a8075473f82655a63a2eb0e52959b513d59d545af9cc3db45b5f50d
3
+ size 3997211632
model-00031-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d6b5cd3ab1edab6cee36c1e9d247947b6df28c0819649c8ca1bd86a550e5386
3
+ size 3994082160
model-00032-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5a66bcb5cc879678781f1067edc00646419ec2edd756439775491ce3a7b3acf
3
+ size 3994082176
model-00033-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21db193b373d1b60ed5817faa1a71305f2e7b67860dc101eac60ac1638c9f506
3
+ size 3994082176
model-00034-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e06bde20e529c528bba181b2bd28d0d9672511c5b61e625d17e5af970eb3257
3
+ size 3994082200
model-00035-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c0715d00097c2fc1ecaa6db8b64f18bdef8d2ed9ee7289664fc6c07b9b9b626
3
+ size 3988822680
model-00036-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4157226ad6f09e701ab1aa4c3ca1f91225ba3d8b55b34fded8b3c85ab1ff02f
3
+ size 3994082152
model-00037-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a89bdb91088163e30a1ec12a116942c856ae03d2cf6da35c19c89b161544ce42
3
+ size 3994082176
model-00038-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:557c3c9f000a9c668c79f3aa828cdbbc6bd9964ca07ae5aed41e6854539ee131
3
+ size 3994082176
model-00039-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10d8c34441a5ce1167ac67d120ce89e76c41b61be75a5fe74c81e6e86f273058
3
+ size 3994082200
model-00040-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44cb269ce442ce8daf8e003ead6be0028aebfa876dca71875c69a4c45aabf89a
3
+ size 3988822696
model-00041-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87c5e1830ece3874be1aa0061ea948450b6db1968e15fee3a9e1b513bfa6502c
3
+ size 3994082144
model-00042-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df37f6a28d209e5a16d7948b63ac1be8aa3b4ec0c2b896393de3dcda34d2e831
3
+ size 3994082176
model-00043-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:665987ad9c57e64681dacdd1e720f44b65615ac00c0c433f72f79d98fa118c4b
3
+ size 3994082176
model-00044-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9b5fe4a1265f48826c67878c5c692f4b6044b9f2e2c5be9db35eeeb3aceabea
3
+ size 3994082192
model-00045-of-00118.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b4843915f9148142c23e5edeb1c21d356d773a78edab4c4dc9f1c1eecc24f60
3
+ size 3988822704