Skip to content

Commit 78db1bd

Browse files
committed
up
1 parent bcfc520 commit 78db1bd

File tree

2 files changed

+505
-251
lines changed

2 files changed

+505
-251
lines changed

torchao/experimental/quant_api.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -780,11 +780,11 @@ def _int8_dynamic_activation_intx_weight_transform(
780 780   x,
781 781   mapping_type=act_mapping_type,
782 782   block_size=_get_per_token_block_size(x),
783     - target_dtype=torch.int32,
    783 + target_dtype=torch.int8,
784 784   quant_min=-128, # lower bound of int8
785 785   quant_max=127, # upper bound of int8
786 786   scale_dtype=torch.float32,
787     - zero_point_dtype=torch.int32,
    787 + zero_point_dtype=torch.int8,
788 788   )
789 789   weight = to_linear_activation_quantized(weight, activation_quant_func)
790 790

0 commit comments

Comments
 (0)