Skip to content

Commit 19febb6

Browse files
committed
update
1 parent ab9c054 commit 19febb6

File tree

1 file changed

+5
-1
lines changed

1 file changed

+5
-1
lines changed

nncf/quantization/algorithms/weight_compression/onnx_backend.py

+5-1
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@
3232
from nncf.onnx.graph.metatypes.groups import MATMUL_METATYPES
3333
from nncf.onnx.graph.model_transformer import remove_initializer
3434
from nncf.onnx.graph.model_transformer import set_initializer
35-
from nncf.onnx.graph.node_utils import get_weight_quantization_axis
35+
from nncf.onnx.graph.node_utils import get_act_quantization_axis, get_weight_quantization_axis
3636
from nncf.onnx.graph.onnx_helper import ONNX_DTYPE_TO_NNCF_DTYPE
3737
from nncf.onnx.graph.onnx_helper import get_name_to_node_map
3838
from nncf.onnx.graph.onnx_helper import get_node_index
@@ -239,6 +239,10 @@ def filter_func(point: StatisticPoint) -> bool:
239239
)
240240

241241
return filter_func
242+
243+
@staticmethod
def get_activation_channel_axis(node: NNCFNode, port_id: int, input_shape: tuple[int]) -> int:
    """
    Returns the activation channel axis for the given node and input port.

    The lookup is delegated entirely to `get_act_quantization_axis`.

    :param node: Node passed through to `get_act_quantization_axis`.
    :param port_id: Input port id passed through to `get_act_quantization_axis`.
    :param input_shape: Accepted as part of the signature but not used by this implementation.
    :return: The axis reported by `get_act_quantization_axis` for `node` and `port_id`.
    """
    channel_axis = get_act_quantization_axis(node, port_id)
    return channel_axis
242246

243247
def insert_adapters(
244248
self, wc_params: WeightCompressionParameters, lora_A: Tensor, lora_B: Tensor, int8_lora: bool

0 commit comments

Comments
 (0)