Upload DeepseekV3ForCausalLM
Browse files
- config.json +1 -1
- model-00001-of-00003.safetensors +1 -1
- model-00002-of-00003.safetensors +1 -1
- model-00003-of-00003.safetensors +1 -1
config.json
CHANGED
|
@@ -18,7 +18,7 @@
|
|
| 18 |
"initializer_range": 0.02,
|
| 19 |
"intermediate_size": 5632,
|
| 20 |
"kv_lora_rank": 128,
|
| 21 |
-
"max_position_embeddings":
|
| 22 |
"model_type": "deepseek_v3",
|
| 23 |
"moe_intermediate_size": 1024,
|
| 24 |
"moe_layer_freq": 1,
|
|
|
|
| 18 |
"initializer_range": 0.02,
|
| 19 |
"intermediate_size": 5632,
|
| 20 |
"kv_lora_rank": 128,
|
| 21 |
+
"max_position_embeddings": 163840,
|
| 22 |
"model_type": "deepseek_v3",
|
| 23 |
"moe_intermediate_size": 1024,
|
| 24 |
"moe_layer_freq": 1,
|
model-00001-of-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4997707928
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c3e1cec8a1aca895ace36650331267ec973c21a7d31befccfe5d09020a40c872
|
| 3 |
size 4997707928
|
model-00002-of-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4997719544
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ba967f5043ad40af1e981dc5cea2fe56942f9ae7e8ffaa01078dbf21cf2e3b6
|
| 3 |
size 4997719544
|
model-00003-of-00003.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2289388312
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f949df8d995a821fe44e3ce6b24a7e19e915f5d7ee34d3149668952ab5b518d5
|
| 3 |
size 2289388312
|