ROCm
diff --git a/‎tensorflow/compiler/mlir/BUILD‎
Lines changed: 1 addition & 0 deletions b/‎tensorflow/compiler/mlir/BUILD‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎tensorflow/compiler/mlir/lite/quantization/quantization_utils.cc‎
Lines changed: 30 additions & 43 deletions b/‎tensorflow/compiler/mlir/lite/quantization/quantization_utils.cc‎
Lines changed: 30 additions & 43 deletions
diff --git a/‎tensorflow/compiler/mlir/lite/quantization/quantization_utils.h‎
Lines changed: 5 additions & 11 deletions b/‎tensorflow/compiler/mlir/lite/quantization/quantization_utils.h‎
Lines changed: 5 additions & 11 deletions
diff --git a/‎tensorflow/compiler/mlir/lite/tests/debuginfo/BUILD‎
Lines changed: 26 additions & 1 deletion b/‎tensorflow/compiler/mlir/lite/tests/debuginfo/BUILD‎
Lines changed: 26 additions & 1 deletion
diff --git a/‎tensorflow/compiler/mlir/lite/tests/debuginfo/concrete_function_error.py‎
Lines changed: 77 additions & 0 deletions b/‎tensorflow/compiler/mlir/lite/tests/debuginfo/concrete_function_error.py‎
Lines changed: 77 additions & 0 deletions
diff --git a/‎tensorflow/compiler/mlir/lite/tests/debuginfo/saved_model_error.py‎
Lines changed: 87 additions & 0 deletions b/‎tensorflow/compiler/mlir/lite/tests/debuginfo/saved_model_error.py‎
Lines changed: 87 additions & 0 deletions
diff --git a/‎tensorflow/compiler/mlir/lite/tests/prepare-tf.mlir‎
Lines changed: 6 additions & 2 deletions b/‎tensorflow/compiler/mlir/lite/tests/prepare-tf.mlir‎
Lines changed: 6 additions & 2 deletions
diff --git a/‎tensorflow/compiler/mlir/lite/transforms/legalize_patterns.td‎
Lines changed: 1 addition & 1 deletion b/‎tensorflow/compiler/mlir/lite/transforms/legalize_patterns.td‎
Lines changed: 1 addition & 1 deletion
@@ -29,6 +29,7 @@ cc_library(
     srcs = ["op_or_arg_name_mapper.cc"],
     hdrs = ["op_or_arg_name_mapper.h"],
     deps = [
+        "@com_google_absl//absl/strings",
         "@llvm//:support",
         "@local_config_mlir//:IR",
     ],
 
@@ -45,13 +45,14 @@ static Type GetQuantizedType(Builder builder, Type input_type,
       quant::ExpressedToQuantizedConverter::forInputType(input_type);
 
   quant::QuantizedType quantizedEleType;
-  if (min.size() == 1 && max.size() == 1) {
+  if (min.size() == 1 && max.size() == 1 && quant_dim == -1) {
     quantizedEleType = quant::fakeQuantAttrsToType(
         builder.getUnknownLoc(), storage_type_width, min[0], max[0],
         narrow_range, converter.expressedType, is_signed);
   } else if (min.size() == max.size()) {
     auto shape = input_type.dyn_cast<ShapedType>();
-    if (!shape || min.size() != shape.getDimSize(quant_dim)) {
+    if (!shape || shape.getRank() <= quant_dim ||
+        min.size() != shape.getDimSize(quant_dim)) {
       return {};
     }
     // TODO(b/141508873): the quantization dim is set to the last dimension.
@@ -92,33 +93,39 @@ TypeAttr GetQuantizedTypeAttr(Builder builder, Type input_type, Attribute min,
   Type final_type =
       GetQuantizedType(builder, input_type, min_value, max_value, quant_dim,
                        num_bits.getInt(), narrow_range.getValue(), is_signed);
+  if (!final_type) return {};
   return TypeAttr::get(final_type);
 }
 
-// TODO(fengliuai): expose the `quant_dim` argument.
-TypeAttr GetQuantizedTypeAttr(Builder builder, Type input_type, Attribute min,
-                              Attribute max, IntegerAttr num_bits,
-                              BoolAttr narrow_range, bool is_signed) {
-  // When input_type isn't a ranked shaped type, it shouldn't be per-axis
-  // quantizatied, and `quant_dim` shouldn't be used, otherwise, set it to the
-  // last dimension.
-  int quant_dim = 0;
-  if (auto shape = input_type.dyn_cast<RankedTensorType>()) {
-    quant_dim = shape.getRank() - 1;
+// Repeats the content of `data` as a whole until it holds `target_size`
+// elements; `data` is left untouched when it already has that size. Note that
+// this only broadcasts across one dimension.
+//
+// Returns true on FAILURE and false on success. The broadcast fails when
+// `data` is empty or when `target_size` is not a positive multiple of the
+// current size. Rejecting a zero or negative `target_size` matters: the repeat
+// loop below counts up from 1 and would never reach such a bound.
+// NOTE(review): a dynamic dimension is presumably reported as a negative size
+// by the caller's `getDimSize` - confirm.
+template <typename T>
+static bool BroadcastVector(int target_size, SmallVectorImpl<T>& data) {
+  int size = data.size();
+  if (size != target_size) {
+    // `size == 0` would divide by zero below; `target_size < size` covers zero
+    // and negative targets as well as shrinking, none of which is a broadcast.
+    if (size == 0 || target_size < size || target_size % size != 0) {
+      return true;
+    }
+    data.reserve(target_size);
+    // One copy is already present, so the repeat count starts at 1.
+    for (int i = 1, e = target_size / size; i != e; ++i) {
+      data.insert(data.end(), data.begin(), data.begin() + size);
+    }
   }
-  return GetQuantizedTypeAttr(builder, input_type, min, max, quant_dim,
-                              num_bits, narrow_range, is_signed);
+  return false;
 }
 
 // Changes the axis of the input per-channel quantized type to match the
 // dimension of the target type. Returns nullptr if it fails.
 static quant::UniformQuantizedPerAxisType ResetAxisAndBroadcast(
-    quant::UniformQuantizedPerAxisType qtype, Type target, int axis) {
-  auto shaped = target.dyn_cast<ShapedType>();
+    quant::UniformQuantizedPerAxisType qtype, Type target, int quant_dim) {
+  auto shaped = target.dyn_cast<RankedTensorType>();
   if (!shaped) return {};
 
-  // Broadcast the scales and zero points to match the length of the axis-th
-  // dimension of the target type. Currently, it covers two cases:
+  SmallVector<double, 4> scales(qtype.getScales().begin(),
+                                qtype.getScales().end());
+  SmallVector<int64_t, 4> zero_points(qtype.getZeroPoints().begin(),
+                                      qtype.getZeroPoints().end());
+  // Broadcast the scales and zero points to match the target size, which is
+  // usually the axis-th dimension of the target type. Currently, it covers two
+  // cases:
   // - for Transpose, the data layout is changed so the `dim[axis]` still equals
   // to the `scales_size`. The broadcast skips;
   // - for Reshape, the data layout isn't changed but the innermost dimension is
@@ -127,33 +134,13 @@ static quant::UniformQuantizedPerAxisType ResetAxisAndBroadcast(
   //
   // TODO(b/141709944): after the fix, the `scales` can be for dim[2], thus we
   // have to repeat each elements in the `scales` locally dim[3] times.
-  auto scales = qtype.getScales();
-  auto zero_points = qtype.getZeroPoints();
-  int target_size = shaped.getDimSize(axis);
-  int scales_size = scales.size();
-  int zero_points_size = zero_points.size();
-
-  SmallVector<double, 4> new_scales;
-  SmallVector<int64_t, 4> new_zero_points;
-  if (scales_size != target_size) {
-    if (target_size % scales_size != 0) return {};
-    for (int i = 0, e = target_size / scales_size; i != e; ++i) {
-      new_scales.insert(new_scales.end(), scales.begin(), scales.end());
-    }
-    scales = new_scales;
+  if (BroadcastVector<double>(shaped.getDimSize(quant_dim), scales) ||
+      BroadcastVector<int64_t>(shaped.getDimSize(quant_dim), zero_points)) {
+    return {};
   }
-  if (zero_points_size != target_size) {
-    if (target_size % zero_points_size != 0) return {};
-    for (int i = 0, e = target_size / zero_points_size; i != e; ++i) {
-      new_zero_points.insert(new_zero_points.end(), zero_points.begin(),
-                             zero_points.end());
-    }
-    zero_points = new_zero_points;
-  }
-
   return quant::UniformQuantizedPerAxisType::get(
       qtype.getFlags(), qtype.getStorageType(), qtype.getExpressedType(),
-      scales, zero_points, axis, qtype.getStorageTypeMin(),
+      scales, zero_points, quant_dim, qtype.getStorageTypeMin(),
       qtype.getStorageTypeMax());
 }
 
@@ -208,7 +195,7 @@ Type GetUniformQuantizedTypeForWeight(ElementsAttr attr, unsigned num_bits,
     }
   }
   auto type =
-      GetQuantizedType(builder, attr.getType(), min, max, /*quant_dim=*/0,
+      GetQuantizedType(builder, attr.getType(), min, max, /*quant_dim=*/-1,
                        num_bits, narrow_range, is_signed);
   if (auto ele_type = type.dyn_cast_or_null<TensorType>())
     return ele_type.getElementType();
 
@@ -307,22 +307,16 @@ struct ConvertUnsignedToSigned : public OpRewritePattern<Q> {
 // `narrow_range` is set to true for weights and `is_signed` is set to true
 // if it is using signed int symmetric quantization.
 //
-// Note that this method doesn't modify min and max, so they needs to be
-// adjusted before calling this method if symmetric quantized type needs to be
-// returned.
+// Note that this method may broadcast min and max to match the dimension length
+// of `input_type`, if the `quant_dim` is valid. On the other hand, the
+// symmetry of min and max is not adjusted by this method. The QAT workflow
+// should set min/max correctly (and use `narrow_range`=true, `is_signed`=true)
+// if symmetric quantization is required.
 TypeAttr GetQuantizedTypeAttr(Builder builder, Type input_type, Attribute min,
                               Attribute max, int quant_dim,
                               IntegerAttr num_bits, BoolAttr narrow_range,
                               bool is_signed);
 
-// Same above, but the `channel_dim` is hardcoded to the last dimension to match
-// the behavior of tf.FakeQuantWithMinMaxVarsPerChannel. This method is called
-// when converting tf.FakeQuant* ops to MLIR's quant parameter representation,
-// aka. quant::QuantType.
-TypeAttr GetQuantizedTypeAttr(Builder builder, Type input_type, Attribute min,
-                              Attribute max, IntegerAttr num_bits,
-                              BoolAttr narrow_range, bool is_signed);
-
 // Casts the `target` type to a quantized type by using the quantization
 // parameters from the type in the `source` type attribute.
 // Examples:
 
@@ -8,7 +8,10 @@ glob_lit_tests(
         ":test_utilities",
     ],
     driver = "@local_config_mlir//:run_lit.sh",
-    test_file_exts = ["pbtxt"],
+    test_file_exts = [
+        "pbtxt",
+        "py",
+    ],
 )
 
 # Bundle together all the debug info files that are used by the tests.
@@ -24,8 +27,30 @@ filegroup(
     name = "test_utilities",
     testonly = True,
     data = [
+        ":concrete_function_error",
+        ":saved_model_error",
         "//tensorflow/compiler/mlir/lite:flatbuffer_to_string",
         "//tensorflow/compiler/mlir/lite:tf_tfl_translate",
         "@llvm//:FileCheck",
     ],
 )
+
+# Driver binary for the lit test of the same name: saved_model_error.py invokes
+# this target and pipes its output to FileCheck.
+py_binary(
+    name = "saved_model_error",
+    srcs = ["saved_model_error.py"],
+    main = "saved_model_error.py",
+    python_version = "PY3",
+    deps = [
+        "//tensorflow:tensorflow_py",
+    ],
+)
+
+# Driver binary for the lit test of the same name: concrete_function_error.py
+# invokes this target and pipes its output to FileCheck.
+py_binary(
+    name = "concrete_function_error",
+    srcs = ["concrete_function_error.py"],
+    main = "concrete_function_error.py",
+    python_version = "PY3",
+    deps = [
+        "//tensorflow:tensorflow_py",
+    ],
+)
@@ -0,0 +1,77 @@
+# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Test file to display the error message and verify it with FileCheck."""
+
+# RUN: %p/concrete_function_error | FileCheck %s
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import sys
+from absl import app
+
+from tensorflow import enable_v2_behavior
+import tensorflow.compat.v2 as tf
+
+enable_v2_behavior()
+
+
+class TestGraphDebugInfo(object):
+  """Test stack trace can be displayed."""
+
+  def testConcreteFunctionDebugInfo(self):
+    """Create a concrete func with unsupported ops, and convert it."""
+    @tf.function(
+        input_signature=[tf.TensorSpec(shape=[3, 3], dtype=tf.float32)])
+    def model(x):
+      # NOTE: the FileCheck directives further down in this file match the text
+      # of the next source line verbatim (including its trailing comment), so
+      # keep it unchanged.
+      y = tf.math.reciprocal(x)  # Not supported
+      return y + y
+
+    func = model.get_concrete_function()
+    converter = tf.lite.TFLiteConverter.from_concrete_functions([func])
+    # Opt in to the experimental converter before converting.
+    converter.experimental_new_converter = True
+    # The conversion is expected to fail on the unsupported op; main() catches
+    # the exception and prints its message for FileCheck to inspect.
+    converter.convert()
+
+# pylint: disable=line-too-long
+
+# CHECK-LABEL: testConcreteFunctionDebugInfo
+# CHECK: error: 'tf.Reciprocal' op is neither a custom op nor a flex op
+# CHECK:                                  attrs=attr_protos, op_def=op_def)
+# CHECK:                                  ^
+# CHECK: {{.*tensorflow/python/ops/gen_math_ops.py:[0-9]+:[0-9]+: note: called from}}
+# CHECK:         "Reciprocal", x=x, name=name)
+# CHECK:         ^
+# CHECK: {{.*tensorflow/compiler/mlir/lite/tests/debuginfo/concrete_function_error.py:[0-9]+:[0-9]+: note: called from}}
+# CHECK:     y = tf.math.reciprocal(x)  # Not supported
+# CHECK:     ^
+# CHECK: <unknown>:0: error: failed while converting: 'main'
+
+# pylint: enable=line-too-long
+
+
+def main(argv):
+  """Runs the conversion and echoes the resulting error text to stdout.
+
+  Args:
+    argv: command-line arguments; anything beyond the program name is rejected.
+
+  Raises:
+    app.UsageError: if extra command-line arguments are supplied.
+  """
+  extra_args = argv[1:]
+  if extra_args:
+    raise app.UsageError('Too many command-line arguments.')
+
+  try:
+    test_case = TestGraphDebugInfo()
+    test_case.testConcreteFunctionDebugInfo()
+  except Exception as error:  # pylint: disable=broad-except
+    # Emit the test label first, then the message that FileCheck inspects.
+    out = sys.stdout
+    out.write('testConcreteFunctionDebugInfo')
+    out.write(str(error))
+
+
+if __name__ == '__main__':
+  app.run(main)
@@ -0,0 +1,87 @@
+# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Test file to display the error message and verify it with FileCheck."""
+
+# RUN: %p/saved_model_error | FileCheck %s
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import sys
+from absl import app
+
+from tensorflow import enable_v2_behavior
+import tensorflow.compat.v2 as tf
+
+enable_v2_behavior()
+
+
+class TestModule(tf.Module):
+  """The test model has an unsupported op."""
+
+  @tf.function(input_signature=[tf.TensorSpec(shape=[3, 3], dtype=tf.float32)])
+  def model(self, x):
+    # NOTE: the FileCheck directives further down in this file match the text of
+    # the next source line verbatim (including its trailing comment), so keep
+    # it unchanged.
+    y = tf.math.reciprocal(x)  # Not supported
+    return y + y
+
+
+class TestGraphDebugInfo(object):
+  """Test stack trace can be displayed."""
+
+  def testSavedModelDebugInfo(self):
+    """Save a saved model with unsupported ops, and then load and convert it.
+
+    The model is written to a freshly created temporary directory rather than a
+    fixed path, so concurrent or repeated runs cannot see each other's files.
+    The conversion at the end is expected to fail on the unsupported op; the
+    caller is responsible for catching the exception.
+    """
+    # Imported here so the change stays local to this test method.
+    import tempfile  # pylint: disable=g-import-not-at-top
+
+    # Save the model together with its debug info.
+    test_model = TestModule()
+    saved_model_path = tempfile.mkdtemp(suffix='.saved_model')
+    save_options = tf.saved_model.SaveOptions(save_debug_info=True)
+    tf.saved_model.save(test_model, saved_model_path, options=save_options)
+
+    # Load the model back and convert it with the experimental converter.
+    converter = tf.lite.TFLiteConverter.from_saved_model(saved_model_path)
+    converter.experimental_new_converter = True
+    converter.convert()
+
+# pylint: disable=line-too-long
+
+# CHECK-LABEL: testSavedModelDebugInfo
+# CHECK: error: 'tf.Reciprocal' op is neither a custom op nor a flex op
+# CHECK:                                  attrs=attr_protos, op_def=op_def)
+# CHECK:                                  ^
+# CHECK: {{.*tensorflow/python/ops/gen_math_ops.py:[0-9]+:[0-9]+: note: called from}}
+# CHECK:         "Reciprocal", x=x, name=name)
+# CHECK:         ^
+# CHECK: {{.*tensorflow/compiler/mlir/lite/tests/debuginfo/saved_model_error.py:[0-9]+:[0-9]+: note: called from}}
+# CHECK:     y = tf.math.reciprocal(x)  # Not supported
+# CHECK:     ^
+# CHECK: <unknown>:0: error: failed while converting: 'main'
+
+# pylint: enable=line-too-long
+
+
+def main(argv):
+  """Runs the saved-model conversion and echoes the error text to stdout.
+
+  Args:
+    argv: command-line arguments; anything beyond the program name is rejected.
+
+  Raises:
+    app.UsageError: if extra command-line arguments are supplied.
+  """
+  extra_args = argv[1:]
+  if extra_args:
+    raise app.UsageError('Too many command-line arguments.')
+
+  try:
+    test_case = TestGraphDebugInfo()
+    test_case.testSavedModelDebugInfo()
+  except Exception as error:  # pylint: disable=broad-except
+    # Emit the test label first, then the message that FileCheck inspects.
+    out = sys.stdout
+    out.write('testSavedModelDebugInfo')
+    out.write(str(error))
+
+
+if __name__ == '__main__':
+  app.run(main)
@@ -296,7 +296,8 @@ func @perChannelFakeQuantWithConv2D(tensor<256x32x32x3xf32>) -> (tensor<256x30x3
 
 // CHECK: %[[CONSTANT:.*]] = constant dense<0.000000e+00> : tensor<16xf32>
 // CHECK: %[[CONSTANT0:.*]] = constant dense<0.000000e+00> : tensor<16x3x3x3xf32>
-// CHECK: %[[QUANTIZE:.*]] = "tfl.quantize"(%[[CONSTANT0]]) {qtype = tensor<16x3x3x3x!quant.uniform<u8:f32:0, {1.000000e+00
+// CHECK: %[[QUANTIZE:.*]] = "tfl.quantize"(%[[CONSTANT0]]) {qtype = tensor<16x3x3x3x!quant.uniform<u8:f32:0,
+// CHECK-SAME: {1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00}>>
 // CHECK: %[[DEQUANTIZE:.*]] = "tfl.dequantize"(%[[QUANTIZE]])
 // CHECK: %[[CONV:.*]] = "tfl.conv_2d"(%arg0, %[[DEQUANTIZE]], %[[CONSTANT]])
 // CHECK: return %[[CONV]] : tensor<256x30x30x16xf32>
@@ -336,7 +337,10 @@ func @perChannelFakeQuantWithDepthwiseConv2D(tensor<256x32x32x3xf32>) -> (tensor
 
 // CHECK: %[[CONSTANT:.*]] = constant dense<0.000000e+00> : tensor<48xf32>
 // CHECK: %[[CONSTANT0:.*]] = constant dense<0.000000e+00> : tensor<1x3x3x48xf32>
-// CHECK: %[[QUANTIZE:.*]] = "tfl.quantize"(%[[CONSTANT0]]) {qtype = tensor<1x3x3x48x!quant.uniform<u8:f32:3, {1.000000e+00
+// CHECK: %[[QUANTIZE:.*]] = "tfl.quantize"(%[[CONSTANT0]]) {qtype = tensor<1x3x3x48x!quant.uniform<u8:f32:3,
+// CHECK-SAME: {1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,
+// CHECK-SAME:  1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,
+// CHECK-SAME:  1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00,1.000000e+00}>>}
 // CHECK: %[[DEQUANTIZE:.*]] = "tfl.dequantize"(%[[QUANTIZE]])
 // CHECK: %[[CONV:.*]] = "tfl.depthwise_conv_2d"(%arg0, %[[DEQUANTIZE]], %[[CONSTANT]])
 // CHECK: return %[[CONV]]
 
@@ -39,7 +39,7 @@ def Merge2AttrsToArray : NativeCodeCall<"$_builder.getArrayAttr({$0, $1})">;
 // Use the tensor type information from $0 and convert min $1, max $2 and
 // numBits $3 and narrowRange $4 to a QuantizedType.
+// The literal -1 fills the `quant_dim` parameter of GetQuantizedTypeAttr, and
+// `is_signed` is hard-coded to false.
 def ConvertToQuantTypeFromAttrs : NativeCodeCall<
-    "GetQuantizedTypeAttr($_builder, $0->getType(), $1, $2, $3, $4, /*is_signed=*/false)">;
+    "GetQuantizedTypeAttr($_builder, $0->getType(), $1, $2, -1, $3, $4, /*is_signed=*/false)">;
 
 // Converts an integer attribute $0 to 32-bit with builder.
 def convertIntAttrTo32Bit : NativeCodeCall<