Kebob committed on
Commit
5bb9142
·
verified ·
1 Parent(s): 8defcde

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +66 -0
  2. model-00001.safetensors +3 -0
  3. model-00002.safetensors +3 -0
  4. model-00003.safetensors +3 -0
  5. model-00004.safetensors +3 -0
  6. model-00005.safetensors +3 -0
  7. model-00006.safetensors +3 -0
  8. model-00007.safetensors +3 -0
  9. model-00008.safetensors +3 -0
  10. model-00009.safetensors +3 -0
  11. model-00010.safetensors +3 -0
  12. model-00011.safetensors +3 -0
  13. model-00012.safetensors +3 -0
  14. model-00013.safetensors +3 -0
  15. model-00014.safetensors +3 -0
  16. model-00015.safetensors +3 -0
  17. model-00016.safetensors +3 -0
  18. model-00017.safetensors +3 -0
  19. model-00018.safetensors +3 -0
  20. model-00019.safetensors +3 -0
  21. model-00020.safetensors +3 -0
  22. model-00021.safetensors +3 -0
  23. model-00022.safetensors +3 -0
  24. model-00023.safetensors +3 -0
  25. model-00024.safetensors +3 -0
  26. model-00025.safetensors +3 -0
  27. model-00026.safetensors +3 -0
  28. model-00027.safetensors +3 -0
  29. model-00028.safetensors +3 -0
  30. model-00029.safetensors +3 -0
  31. model-00030.safetensors +3 -0
  32. model-00031.safetensors +3 -0
  33. model-00032.safetensors +3 -0
  34. model-00033.safetensors +3 -0
  35. model-00034.safetensors +3 -0
  36. model-00035.safetensors +3 -0
  37. model-00036.safetensors +3 -0
  38. model-00037.safetensors +3 -0
  39. model-00038.safetensors +3 -0
  40. model-00039.safetensors +3 -0
  41. model-00040.safetensors +3 -0
  42. model-00041.safetensors +3 -0
  43. model-00042.safetensors +3 -0
  44. model-00043.safetensors +3 -0
  45. model-00044.safetensors +3 -0
  46. model-00045.safetensors +3 -0
  47. model-00046.safetensors +3 -0
  48. model-00047.safetensors +3 -0
  49. model-00048.safetensors +3 -0
  50. model-00049.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "DeepseekV32ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 0,
8
+ "eos_token_id": 1,
9
+ "ep_size": 1,
10
+ "first_k_dense_replace": 3,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 7168,
13
+ "index_head_dim": 128,
14
+ "index_n_heads": 64,
15
+ "index_topk": 2048,
16
+ "initializer_range": 0.02,
17
+ "intermediate_size": 18432,
18
+ "kv_lora_rank": 512,
19
+ "max_position_embeddings": 163840,
20
+ "model_type": "deepseek_v32",
21
+ "moe_intermediate_size": 2048,
22
+ "moe_layer_freq": 1,
23
+ "n_group": 8,
24
+ "n_routed_experts": 256,
25
+ "n_shared_experts": 1,
26
+ "norm_topk_prob": true,
27
+ "num_attention_heads": 128,
28
+ "num_experts_per_tok": 8,
29
+ "num_hidden_layers": 61,
30
+ "num_key_value_heads": 128,
31
+ "num_nextn_predict_layers": 1,
32
+ "q_lora_rank": 1536,
33
+ "qk_nope_head_dim": 128,
34
+ "qk_rope_head_dim": 64,
35
+ "quantization_config": {
36
+ "activation_scheme": "dynamic",
37
+ "fmt": "e4m3",
38
+ "quant_method": "fp8",
39
+ "scale_fmt": "ue8m0",
40
+ "weight_block_size": [
41
+ 128,
42
+ 128
43
+ ]
44
+ },
45
+ "rms_norm_eps": 1e-06,
46
+ "rope_scaling": {
47
+ "beta_fast": 32,
48
+ "beta_slow": 1,
49
+ "factor": 40,
50
+ "mscale": 1.0,
51
+ "mscale_all_dim": 1.0,
52
+ "original_max_position_embeddings": 4096,
53
+ "type": "yarn"
54
+ },
55
+ "rope_theta": 10000,
56
+ "routed_scaling_factor": 2.5,
57
+ "scoring_func": "sigmoid",
58
+ "tie_word_embeddings": false,
59
+ "topk_group": 4,
60
+ "topk_method": "noaux_tc",
61
+ "torch_dtype": "bfloat16",
62
+ "transformers_version": "4.44.2",
63
+ "use_cache": true,
64
+ "v_head_dim": 128,
65
+ "vocab_size": 129280
66
+ }
model-00001.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d36338ab918d1b8fa2c2a29d9ed0aab51c7454bdd36f435d478f4fd84e1d513
3
+ size 5523776832
model-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e47efe57203ff5496bc23b2c39217cf8ff5ad8bce1ca520b0c87e52e19e2fef
3
+ size 5523776752
model-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f98ea78f18177a1d541caf9828eb04164f0ea729aaba111e3a16801db6ead414
3
+ size 5523776672
model-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75211301451d8d919350dfbe5b56ffb2e1d57575f5dea12e2dbf871e7f4dbf7f
3
+ size 5523776712
model-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:041cecde1e61482ff226a631891f941c15ee2a383352f23819906a769548298d
3
+ size 5523776672
model-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c312d1613552fa5b5b1494c3975dadc60d2c4624541848e2e3ff05597ad92534
3
+ size 5523776632
model-00007.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e37aa4646a2375def7dae972e797bf22d0c4cb1f9956650d14ac673791192cb5
3
+ size 5523776584
model-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c61c0bdcfe15bef27ff980e07d87d44d2d4fda837868c9d894f36d300146501
3
+ size 5523779328
model-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a4506b83e8f71241ffdcc0a1371549cbe7e52ccc2868336fd2d34bbdda6bac7
3
+ size 5523779504
model-00010.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d189023a74bb90490dd9f6205c85929d3fe4faf5a27f3240f71ce521a0c5817a
3
+ size 5523779464
model-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5ad637153e3e039a8388bba1a1c508950b960067184b419d0bead0d8354619f
3
+ size 5523779424
model-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71eab587006cbd6eb389f8189766787abd8874602ed0137add7da01749ff321b
3
+ size 5523779384
model-00013.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:019e6ba59a515258be26f3aa628378739531ffa9e6b113069aafd4575e798853
3
+ size 5523779344
model-00014.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8809251c367081a99718cc34de9868e223c6152213bdb1aa2362c6f7123c97ea
3
+ size 5523779368
model-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16ec01666879b2e0eac7d3cfe7edccab711148c230be33bb47249337ed6176f6
3
+ size 5523779328
model-00016.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfb8dba61c3ac56244009765e20cc39f5a14003815b051aef3477ad3b0ab912a
3
+ size 5523779288
model-00017.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a8aa97b21326365372cf43fb4f05e726cecd919c1a6dbe2836fd6a0ff4a2def
3
+ size 5523779248
model-00018.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24f71b169ee9a422e46e3d51be1401717a7daa73da9725dedded0324395351b6
3
+ size 5523779208
model-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c31960fb1233fbaedae5ae1b13cdbfff59a5003b090d0e26aa03f7a1b5b82e36
3
+ size 5523779168
model-00020.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fd8d1816feb0f4703b050c037a2ae3a3e4c5461af849aa4a3bd70e3fdeccdf6
3
+ size 5523779128
model-00021.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:946ad2e0a519f2fd6565f369e7cec85df8ea3e4ce959a703c9060e2cb51c64a4
3
+ size 5523779120
model-00022.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88e3cfdce082344a6e685d2aff22158dd819691509b6675bbfcffd0abacd1b19
3
+ size 5523779016
model-00023.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30c21a8dd896d5bcec34831b880f53803f5b8022926fb315bb62b49da5253c32
3
+ size 5523778928
model-00024.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:762dc5d4ebda529b2e47a3bda1ef7068361bf49c423a9f6d26032e79f2522af8
3
+ size 5523778960
model-00025.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9abd42b2af251d3f6640496aa11225792c20bc0f969bae29127a9147615593f
3
+ size 5523779104
model-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b1378dc3358d9b646143cff1cd4bcfd36cc5da3895257aa4ffa187b419aaf4f
3
+ size 5523779248
model-00027.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3d29ce502d4796f5e8e7c1c2d7a902b821df507ffc4e89392c3111888a55ef1
3
+ size 5523779392
model-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3d9280264d97881cff4b0354be0b517b2ab187b620ef99ee164238a9f2424a0
3
+ size 5523779536
model-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18cadfe29c0c5a230a4482f402e0d1c3295d87954c2eb34a9cdc91ee4679d38a
3
+ size 5523779680
model-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:035734ee7f4b2a3f7e2f418b20d36df4bc9ff9f334b880a1d1a3d72bf2e907c8
3
+ size 5523779824
model-00031.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43aa7f3b3b2729f44462148560fd1018dd98a316641ccf458c0978684caa4080
3
+ size 5523779832
model-00032.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:703d8e79df30f537bc3e6899db05fa03843dfdbceb8e8e4a7985175533af9c52
3
+ size 5523779832
model-00033.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1038bab1413b7fe012896e03aeb5eb9580be0d742894dcb4836d22571d12eb4c
3
+ size 5523779832
model-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc9d360b6a783a6b834daa1e182e6cd36f3304194ee30296f06d57121bf1bbeb
3
+ size 5523779832
model-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6372f93ea4b0c40204e08cee331ae538e318df309e698093a1aada6f74309462
3
+ size 5523779880
model-00036.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f366c80ac4855605ac252c07d1f18ad2e7ceea53fc97127ddd4e71b9f50c9619
3
+ size 5523779904
model-00037.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faa956b05c8a873b874ccde8c152df1ebb2434fc4dab92ca4b3864bb97130b7c
3
+ size 5523779904
model-00038.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0862558cf51ac33b599fdb287522fc3fc0189525211441e39acc1af5dcbfd6fc
3
+ size 5523779904
model-00039.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2a6afbaa95cff6b4caf73d03c1520f6d49dafc7d515c4564b4e607e5bb2df2a
3
+ size 5523779904
model-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b393d885aa04420c3c58829662782a9a43861f88dcd84576e37b19736af6da35
3
+ size 5523779904
model-00041.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3865d5c4ff10aa4408f306d23c74ff58ea9c0b32db59c0b36204e96cd523c851
3
+ size 5523779904
model-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53123643c5d79f0c107b9f9cb6301c7c0473165dc6968118413b059691415082
3
+ size 5523779920
model-00043.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92c41a277f86ed44e069ec931244ab7ef3d032a3d1f32380c63e277d4e19c053
3
+ size 5523779928
model-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed75a19bc6cd8a2dd8626a0891bb439cc209133ce770ec8b224a18a7056cd6d6
3
+ size 5523779808
model-00045.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c190201750ff84632ada5af74c6c3f85ee6ed4eb6254cee030e818de9265060
3
+ size 5523779720
model-00046.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f4dcc1ea0fc0dd8f96b49533814e2cb9aa02d567c37810132420b1c92dab5b7
3
+ size 5523779656
model-00047.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f239edafaf7b901fe8574e9da0c9ae610dc22aca4113b374b0129ff37e3ac3a9
3
+ size 5523779696
model-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74f82acbd8d5e50a662332b1886b42f7195efeeec558181c394f64272c3e8844
3
+ size 5523779656
model-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f70db73a1fc08a81529b5ed17da5c6ff497cb5cc2ceb8931ab2ccdc7c4e65834
3
+ size 5523779616