llm-d · namasl · Feb 6, 2026 · Feb 6, 2026
diff --git a/config_explorer/Capacity_Planner.py b/config_explorer/Capacity_Planner.py
@@ -326,7 +326,7 @@ def workload_specification():
         with st.expander("See how KV cache is calculated below"):
             st.write(f"""First, the per-token memory requirement is estimated given the following inputs:
 - KV cache data type: `{kv_details.kv_data_type}` = {kv_details.precision_in_bytes} bytes in memory
-- Hidden layers: {model_config.num_hidden_layers}
+- Hidden layers: {text_config.num_hidden_layers}
 
 This model uses _{kv_details.attention_type}_. The relevant parameters are:
 """)