Skip to content

Commit 45b13ac

Browse files
committed
fix ci
1 parent d9d8a77 commit 45b13ac

File tree

2 files changed

+1
-5
lines changed

2 files changed

+1
-5
lines changed

paddle/phi/kernels/gpu/weight_dequantize_kernel.cu

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -33,12 +33,9 @@ void WeightDequantizeKernel(const Context& dev_ctx,
                             DenseTensor* out) {
 #if defined(PADDLE_WITH_CUTLASS)
   auto out_dims = out->dims();
-  out->Resize({{out_dims[1], out_dims[0] * 2}});
   dev_ctx.template Alloc<T>(out);
   WeightDequantize<T, Context>(dev_ctx, x, scale, algo, true, group_size, out);
-  if (algo == "weight_only_int8") {
-    out->Resize({{out_dims[1], out_dims[0]}});
-  }
+  out->Resize({{out_dims[1], out_dims[0]}});
   auto out_tmp = Transpose<T, Context>(dev_ctx, *out, {1, 0});
   out->ShareDataWith(out_tmp);
 #else

test/quantization/test_weight_only_linear.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -688,7 +688,6 @@ def test_weight_quantize_and_dequantize_int4_pir(
             / math.sqrt(4096)
         )
         quant_weight, quant_scale = Q.weight_quantize(x=weight, algo=algo)
-        quant_weight = quant_weight.reshape([12288, 2048])
         dequant_weight = Q.weight_dequantize(
             quant_weight, quant_scale, algo=algo
         )

0 commit comments

Comments
 (0)