Add command-line argument to disable the RoPE cache

This commit is contained in:
Iwan Kawrakow
2025-11-03 08:20:03 +02:00
parent aa76ff2c9d
commit 525dda2e80
8 changed files with 77 additions and 95 deletions

View File

@@ -427,6 +427,7 @@ extern "C" {
bool grouped_expert_routing; // whether to use grouped expert routing (BailingMoeV2 arch)
bool fused_up_gate; // whether to use fused up/gate op [EXPERIMENTAL]
bool fused_mmad; // whether to use fused mul+multi_add op [EXPERIMENTAL]
bool rope_cache; // whether to use RoPE cache [EXPERIMENTAL]
int min_experts;
float thresh_experts;
bool only_active_experts;