Update modeling_gpt_oss.py: add SM 103 to the SM-version check in compute_gate_output

dongfengy · dongfengy · commit 7f753d94d4bc · 2025-10-08T09:41:31.000-07:00
Signed-off-by: dongfengy <99041270+dongfengy@users.noreply.github.com>
diff --git a/tensorrt_llm/_torch/models/modeling_gpt_oss.py b/tensorrt_llm/_torch/models/modeling_gpt_oss.py
@@ -227,7 +227,7 @@ def _create_ideal_expert_load_balanced_logits(
 
     def compute_gate_output(self, x: torch.Tensor) -> torch.Tensor:
         if get_sm_version() in [
-                90, 100
+                90, 100, 103
         ] and x.shape[0] <= MIN_LATENCY_TINYGEMM_NUM_TOKENS:
             weight = self.gate.weight
             bias = self.gate.bias