From 88e5fc899f4360c431dcf9c6dfa1bf57483b77f4 Mon Sep 17 00:00:00 2001 From: Mengwei Liu Date: Fri, 19 Apr 2024 08:53:06 -0700 Subject: [PATCH] Fix embedding_4bit out variant (#3151) Summary: In #3095 there's an issue with the embedding_4bit schema, which causes a mismatch between the functional and out variants. P1217884556 Differential Revision: D56357762 --- exir/passes/_quant_patterns_and_replacements.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/exir/passes/_quant_patterns_and_replacements.py b/exir/passes/_quant_patterns_and_replacements.py index ec543560b86..c6ec40269f6 100644 --- a/exir/passes/_quant_patterns_and_replacements.py +++ b/exir/passes/_quant_patterns_and_replacements.py @@ -179,7 +179,7 @@ def embedding_byte_dtype_out_meta( quantized_decomposed_lib.define( "embedding_4bit.dtype(Tensor weight, Tensor weight_scales, Tensor? weight_zero_points, " - "int weight_quant_min, int weight_quant_max, Tensor indices, ScalarType? dtype=None) -> Tensor", + "int weight_quant_min, int weight_quant_max, Tensor indices, *, ScalarType? dtype=None) -> Tensor", ) quantized_decomposed_lib.define(