Adding small comment for source of calculation.

2025-09-11 12:24:53 +00:00 · 2024-12-09 10:48:20 +01:00 · 2024-12-09 10:48:20 +01:00 · d701f9e866
commit d701f9e866
parent 36ed43c920
1 changed file with 2 additions and 0 deletions
--- a/launcher/src/main.rs
+++ b/launcher/src/main.rs
@@ -295,6 +295,8 @@ impl Config {
        // TODO This calculation depends on the actual implementation
        let dtype_size = 2;
        let mlp_size = self.intermediate_size?;
+        // calculation is overshooting here.
+        // Coming from here: https://github.com/vllm-project/vllm/blob/d1c2e15eb31ef12e688ce0cb71895f88eaf4cd4f/vllm/model_executor/layers/fused_moe/fused_moe.py#L618-L624
        Some((mlp_size + mlp_size / 2) * self.num_experts * dtype_size * 3)
    }