diff --git a/backends/cadence/aot/quantizer/patterns.py b/backends/cadence/aot/quantizer/patterns.py index a7026cbf26c..9897d443725 100644 --- a/backends/cadence/aot/quantizer/patterns.py +++ b/backends/cadence/aot/quantizer/patterns.py @@ -1092,9 +1092,6 @@ def fuse(self, gm: fx.GraphModule, anchor_node: fx.Node) -> fx.Node | None: return None mask_shape = list(mask_shape) # Softmax mask is packed 16 elements per int32 word. - assert ( - mask_shape[-1] % 16 == 0 - ), f"Softmax mask dimension must be divisible by 16, got {mask_shape[-1]}" mask_shape[-1] = mask_shape[-1] // 16 mask_tensor = insert_node_with_meta( gm,