IBMZ-Linux-OSS-Python
diff --git a/tensorflow/compiler/mlir/quantization/stablehlo/BUILD b/tensorflow/compiler/mlir/quantization/stablehlo/BUILD
Lines changed: 4 additions & 35 deletions
diff --git a/tensorflow/compiler/mlir/quantization/stablehlo/passes/quantization_patterns.cc b/tensorflow/compiler/mlir/quantization/stablehlo/passes/quantization_patterns.cc
Lines changed: 27 additions & 19 deletions
diff --git a/tensorflow/compiler/mlir/quantization/stablehlo/passes/quantization_patterns.h b/tensorflow/compiler/mlir/quantization/stablehlo/passes/quantization_patterns.h
Lines changed: 7 additions & 3 deletions
@@ -94,9 +94,9 @@ cc_library(
         ":optimize_graph_inc_gen",
         ":quantization_config_proto_cc",
         ":quantization_options_proto_cc",
+        ":quantization_patterns",
         ":remove_sharding_custom_call_inc_gen",
         ":stablehlo_type_utils",
-        ":tf_quantization_patterns",
         ":tf_stablehlo_passes_inc_gen",
         "//tensorflow/compiler/mlir/quantization/common:func",
         "//tensorflow/compiler/mlir/quantization/common:tf_attrs_and_constraints",
@@ -260,10 +260,10 @@ cc_library(
 )
 
 cc_library(
-    name = "tf_quantization_patterns",
-    srcs = ["passes/tf_quantization_patterns.cc"],
+    name = "quantization_patterns",
+    srcs = ["passes/quantization_patterns.cc"],
     hdrs = [
-        "passes/tf_quantization_patterns.h",
+        "passes/quantization_patterns.h",
     ],
     compatible_with = get_compatible_with_portable(),
     deps = [
@@ -289,37 +289,6 @@ cc_library(
     ],
 )
 
-cc_library(
-    name = "quantization_patterns",
-    srcs = ["passes/quantization_patterns.cc"],
-    hdrs = [
-        "passes/quantization_patterns.h",
-    ],
-    compatible_with = get_compatible_with_portable(),
-    deps = [
-        ":quantization_config_proto_cc",
-        "//tensorflow/compiler/mlir/lite/quantization/ir:QuantOps",
-        "//tensorflow/compiler/mlir/quantization/common:attrs_and_constraints",
-        "//tensorflow/compiler/mlir/quantization/common:lift_as_function_call",
-        "//tensorflow/compiler/mlir/quantization/common:uniform_quantized_types",
-        "//tensorflow/compiler/mlir/quantization/common/quantization_lib",
-        "//tensorflow/compiler/mlir/quantization/stablehlo/ops:stablehlo_op_quant_spec",
-        "//tensorflow/compiler/mlir/quantization/tensorflow:passes",
-        "//tensorflow/compiler/mlir/quantization/tensorflow:quantization_options_proto_cc",
-        "//tensorflow/compiler/mlir/tensorflow",
-        "//tensorflow/core:protos_all_cc",
-        "//tensorflow/core/platform:path",
-        "@com_google_absl//absl/container:flat_hash_set",
-        "@llvm-project//llvm:Support",
-        "@llvm-project//mlir:FuncDialect",
-        "@llvm-project//mlir:IR",
-        "@llvm-project//mlir:Pass",
-        "@llvm-project//mlir:QuantOps",
-        "@llvm-project//mlir:Support",
-        "@stablehlo//:stablehlo_ops",
-    ],
-)
-
 td_library(
     name = "quant_td_files",
     srcs = [
 
@@ -46,12 +46,11 @@ limitations under the License.
 #include "mlir/Support/LLVM.h"  // from @llvm-project
 #include "mlir/Support/LogicalResult.h"  // from @llvm-project
 #include "stablehlo/dialect/StablehloOps.h"  // from @stablehlo  // IWYU pragma: keep
-#include "tensorflow/compiler/mlir/lite/quantization/ir/QuantOps.h"
-#include "tensorflow/compiler/mlir/quantization/common/attrs_and_constraints.h"
-#include "tensorflow/compiler/mlir/quantization/common/lift_as_function_call.h"
-#include "tensorflow/compiler/mlir/quantization/common/quantization_lib/quantization_utils.h"
+#include "tensorflow/compiler/mlir/quantization/common/ir/QuantOps.h"
+#include "tensorflow/compiler/mlir/quantization/common/tf_attrs_and_constraints.h"
+#include "tensorflow/compiler/mlir/quantization/common/tf_lift_as_function_call.h"
+#include "tensorflow/compiler/mlir/quantization/common/tf_quantization_lib/tf_quantization_utils.h"
 #include "tensorflow/compiler/mlir/quantization/common/uniform_quantized_types.h"
-#include "tensorflow/compiler/mlir/quantization/stablehlo/ops/stablehlo_op_quant_spec.h"
 #include "tensorflow/compiler/mlir/quantization/stablehlo/quantization_config.pb.h"
 #include "tensorflow/compiler/mlir/quantization/tensorflow/quantization_options.pb.h"
 #include "tensorflow/compiler/mlir/tensorflow/ir/tf_ops.h"
@@ -62,8 +61,6 @@ namespace mlir::quant::stablehlo {
 
 namespace {
 
-using ::mlir::quant::FindUserOfType;
-using ::mlir::quant::TryCast;
 using ::mlir::stablehlo::AddOp;
 using ::mlir::stablehlo::BroadcastInDimOp;
 using ::mlir::stablehlo::ConcatenateOp;
@@ -74,6 +71,16 @@ using ::mlir::stablehlo::GatherOp;
 using ::mlir::stablehlo::GetDimensionSizeOp;
 using ::mlir::stablehlo::ReshapeOp;
 using ::mlir::stablehlo::UniformQuantizeOp;
+using ::mlir::tf_quant::FindUserOfType;
+using ::mlir::tf_quant::GetDotGeneralQuantizationDim;
+using ::mlir::tf_quant::GetQuantizationMethodOrDefault;
+using ::mlir::tf_quant::HasWeightOnlyPtqMethod;
+using ::mlir::tf_quant::IsHybridQuantizedOp;
+using ::mlir::tf_quant::kCompositeFuncPrefix;
+using ::mlir::tf_quant::kQuantizationMethodAttr;
+using ::mlir::tf_quant::kQuantizedFuncPrefix;
+using ::mlir::tf_quant::kQuantTraitAttrName;
+using ::mlir::tf_quant::TryCast;
 using ::stablehlo::quantization::Method;
 using ::stablehlo::quantization::QuantizedDimension;
 using ::stablehlo::quantization::QuantizedType;
@@ -724,12 +731,12 @@ class XlaCallModuleOpToCallOp : public OpRewritePattern<TF::XlaCallModuleOp> {
 // Quantizes only when the nested region consists of ops whose quantization
 // parameters can be propagated from outside.
 class QuantizeOpWithRegionPattern
-    : public OpRewritePattern<quantfork::DequantizeCastOp> {
+    : public OpRewritePattern<mlir::quant::ir::DequantizeCastOp> {
  public:
   explicit QuantizeOpWithRegionPattern(MLIRContext& ctx)
-      : OpRewritePattern<quantfork::DequantizeCastOp>(&ctx) {};
+      : OpRewritePattern<mlir::quant::ir::DequantizeCastOp>(&ctx) {};
 
-  LogicalResult matchAndRewrite(quantfork::DequantizeCastOp op,
+  LogicalResult matchAndRewrite(mlir::quant::ir::DequantizeCastOp op,
                                 PatternRewriter& rewriter) const final {
     if (match(op).failed()) {
       return failure();
@@ -739,7 +746,7 @@ class QuantizeOpWithRegionPattern
   }
 
  private:
-  LogicalResult match(quantfork::DequantizeCastOp op) const {
+  LogicalResult match(mlir::quant::ir::DequantizeCastOp op) const {
     // Match only when there is one user of the dequantize op.
     if (!op.getResult().hasOneUse()) {
       return failure();
@@ -767,7 +774,7 @@ class QuantizeOpWithRegionPattern
     return success();
   }
 
-  void rewrite(quantfork::DequantizeCastOp op,
+  void rewrite(mlir::quant::ir::DequantizeCastOp op,
                PatternRewriter& rewriter) const {
     // Rewrite the floating-point ops to the quantized version, by fusing
     // preceding dequantize ops and succeding quantize ops.
@@ -785,7 +792,7 @@ class QuantizeOpWithRegionPattern
 
         const Type element_type =
             mlir::cast<TensorType>(operand.getType()).getElementType();
-        if (auto dq_op = dyn_cast_or_null<quantfork::DequantizeCastOp>(
+        if (auto dq_op = dyn_cast_or_null<mlir::quant::ir::DequantizeCastOp>(
                 operand.getDefiningOp())) {
           inputs.push_back(dq_op.getOperand());
         } else if (isa<IntegerType>(element_type)) {
@@ -813,8 +820,9 @@ class QuantizeOpWithRegionPattern
             mlir::cast<TensorType>(result.getType()).getElementType();
         // If the user is the QuantizeOp, it must be the only user.
         if (result.hasOneUse() &&
-            isa<quantfork::QuantizeCastOp>(*result.user_begin())) {
-          auto user = cast<quantfork::QuantizeCastOp>(*result.user_begin());
+            isa<mlir::quant::ir::QuantizeCastOp>(*result.user_begin())) {
+          auto user =
+              cast<mlir::quant::ir::QuantizeCastOp>(*result.user_begin());
           outputs_replaced.push_back(user.getResult());
           output_types.push_back(user.getType());
         } else if (isa<IntegerType>(result_element_type)) {
@@ -944,8 +952,8 @@ bool IsQuantizedCompositeFunction(func::CallOp call_op) {
 
 bool IsConnectedWithQuantizedCompsiteFunction(Operation* same_scale_op) {
   for (const Value operand : same_scale_op->getOperands()) {
-    auto dq_op =
-        dyn_cast_or_null<quantfork::DequantizeCastOp>(operand.getDefiningOp());
+    auto dq_op = dyn_cast_or_null<mlir::quant::ir::DequantizeCastOp>(
+        operand.getDefiningOp());
     if (!dq_op) continue;
 
     Operation* preceding_op = dq_op.getArg().getDefiningOp();
@@ -973,11 +981,11 @@ bool IsConnectedWithQuantizedCompsiteFunction(Operation* same_scale_op) {
   for (const Value result : same_scale_op->getResults()) {
     // If the user is the Quantize op, it must be the only user.
     if (!result.hasOneUse() ||
-        !isa<quantfork::QuantizeCastOp>(*result.user_begin())) {
+        !isa<mlir::quant::ir::QuantizeCastOp>(*result.user_begin())) {
       continue;
     }
 
-    auto q_op = cast<quantfork::QuantizeCastOp>(*result.user_begin());
+    auto q_op = cast<mlir::quant::ir::QuantizeCastOp>(*result.user_begin());
     for (Operation* following_op : q_op->getUsers()) {
       // Check whether the following op is a quantized composite function.
       if (isa<func::CallOp>(following_op)) {
 
@@ -40,13 +40,17 @@ limitations under the License.
 #include "mlir/Support/LLVM.h"  // from @llvm-project
 #include "mlir/Support/LogicalResult.h"  // from @llvm-project
 #include "stablehlo/dialect/StablehloOps.h"  // from @stablehlo
-#include "tensorflow/compiler/mlir/quantization/common/lift_as_function_call.h"
-#include "tensorflow/compiler/mlir/quantization/common/quantization_lib/quantization_utils.h"
-#include "tensorflow/compiler/mlir/quantization/stablehlo/ops/stablehlo_op_quant_spec.h"
+#include "tensorflow/compiler/mlir/quantization/common/tf_lift_as_function_call.h"
+#include "tensorflow/compiler/mlir/quantization/common/tf_quantization_lib/tf_quantization_utils.h"
+#include "tensorflow/compiler/mlir/quantization/stablehlo/ops/tf_stablehlo_op_quant_spec.h"
 #include "tensorflow/core/framework/types.pb.h"
 
 namespace mlir::quant::stablehlo {
 
+using ::mlir::tf_quant::IsWeightOnlyQuantizableOp;
+using ::mlir::tf_quant::stablehlo::GetStableHloQuantConstraints;
+using ::mlir::tf_quant::stablehlo::IsOpQuantizableStableHlo;
+
 // Checks whether an op is connected with a quantized composite function. If
 // not, the same-scale op will not be quantized. This decision is based on the
 // current assumption that the performance gain of the same-scale op itself