smohammadi committed on
Commit
65dfbbd
·
verified ·
1 Parent(s): db45587

Upload DeepseekV3ForCausalLM

Browse files
config.json CHANGED
@@ -18,7 +18,7 @@
18
  "initializer_range": 0.02,
19
  "intermediate_size": 5632,
20
  "kv_lora_rank": 128,
21
- "max_position_embeddings": 32768,
22
  "model_type": "deepseek_v3",
23
  "moe_intermediate_size": 1024,
24
  "moe_layer_freq": 1,
 
18
  "initializer_range": 0.02,
19
  "intermediate_size": 5632,
20
  "kv_lora_rank": 128,
21
+ "max_position_embeddings": 163840,
22
  "model_type": "deepseek_v3",
23
  "moe_intermediate_size": 1024,
24
  "moe_layer_freq": 1,
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01da893cf5e85147bfdfc17018fc80850ebf0d174ef8a959ff6539caf0dfd22f
3
  size 4997707928
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3e1cec8a1aca895ace36650331267ec973c21a7d31befccfe5d09020a40c872
3
  size 4997707928
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac058872184b435943db1c6cf3dc0bd5bc05113df6e4e0f421a22185929f07f9
3
  size 4997719544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ba967f5043ad40af1e981dc5cea2fe56942f9ae7e8ffaa01078dbf21cf2e3b6
3
  size 4997719544
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cded5196bf0cbd614664d8785d2b0e489d844dcea1174ff4b65dd4beba8f271f
3
  size 2289388312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f949df8d995a821fe44e3ce6b24a7e19e915f5d7ee34d3149668952ab5b518d5
3
  size 2289388312