mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2025-12-24 13:28:13 +08:00
fix scaled_gemm_f8_i4_f16_weight_quantize input (#3685)
This commit is contained in:
@@ -217,7 +217,7 @@ std::vector<paddle::DataType> Fp8Int4WeightQuantizeInferDtype(

 PD_BUILD_STATIC_OP(scaled_gemm_f8_i4_f16_weight_quantize)
-    .Inputs({"intput"})
+    .Inputs({"input"})
     .Attrs({"groupsize: int",
             "scale_dtype: std::string"})
     .Outputs({"output", "scale"})
Reference in New Issue
Block a user