We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b04970f · commit 7064fc6 · Copy full SHA for 7064fc6
configs/qwen3-8b-eagle3.json
@@ -11,7 +11,7 @@
11
"hidden_size": 4096,
12
"initializer_range": 0.02,
13
"intermediate_size": 12288,
14
- "max_position_embeddings": 2048,
+ "max_position_embeddings": 40960,
15
"max_window_layers": 36,
16
"model_type": "llama",
17
"num_attention_heads": 32,
0 commit comments