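Fix CI: remove the pre-allocation Resize in WeightDequantizeKernel, make the post-dequantize Resize unconditional, and drop the manual reshape from the int4 PIR test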

FlamingoPg · FlamingoPg · commit 45b13ac68a4d · 2024-07-09T00:11:58.000+08:00
diff --git a/paddle/phi/kernels/gpu/weight_dequantize_kernel.cu b/paddle/phi/kernels/gpu/weight_dequantize_kernel.cu
@@ -33,12 +33,9 @@ void WeightDequantizeKernel(const Context& dev_ctx,
                             DenseTensor* out) {
 #if defined(PADDLE_WITH_CUTLASS)
   auto out_dims = out->dims();
-  out->Resize({{out_dims[1], out_dims[0] * 2}});
   dev_ctx.template Alloc<T>(out);
   WeightDequantize<T, Context>(dev_ctx, x, scale, algo, true, group_size, out);
-  if (algo == "weight_only_int8") {
-    out->Resize({{out_dims[1], out_dims[0]}});
-  }
+  out->Resize({{out_dims[1], out_dims[0]}});
   auto out_tmp = Transpose<T, Context>(dev_ctx, *out, {1, 0});
   out->ShareDataWith(out_tmp);
 #else
diff --git a/test/quantization/test_weight_only_linear.py b/test/quantization/test_weight_only_linear.py
@@ -688,7 +688,6 @@ def test_weight_quantize_and_dequantize_int4_pir(
                 / math.sqrt(4096)
             )
             quant_weight, quant_scale = Q.weight_quantize(x=weight, algo=algo)
-            quant_weight = quant_weight.reshape([12288, 2048])
             dequant_weight = Q.weight_dequantize(
                 quant_weight, quant_scale, algo=algo
             )

Original file line number	Diff line number	Diff line change
`@@ -688,7 +688,6 @@ def test_weight_quantize_and_dequantize_int4_pir(`
`688`	`688`	`/ math.sqrt(4096)`
`689`	`689`	`)`
`690`	`690`	`quant_weight, quant_scale = Q.weight_quantize(x=weight, algo=algo)`
`691`		`- quant_weight = quant_weight.reshape([12288, 2048])`
`692`	`691`	`dequant_weight = Q.weight_dequantize(`
`693`	`692`	`quant_weight, quant_scale, algo=algo`
`694`	`693`	`)`