sky-2002 committed on
Commit
9af308d
·
verified ·
1 Parent(s): d8ad225

Upload config.json

Browse files
Files changed (1) hide show
  1. config.json +16 -0
config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "num_attention_heads": 8,
3
+ "input_dim": 512,
4
+ "embed_dim": 512,
5
+ "q_latent_dim": 128,
6
+ "kv_latent_dim": 128,
7
+ "max_token_len": 512,
8
+ "num_shared_experts": 2,
9
+ "num_routed_experts": 4,
10
+ "moe_top_k": 2,
11
+ "expert_intermediate_dim": 1536,
12
+ "num_dense_ffn": 1,
13
+ "num_moe_ffn": 2,
14
+ "vocab_size": 50257,
15
+ "max_batch_size": 24
16
+ }