Add per-tensor quantization into dynamic range quantization execution path for TRANSPOSE_CONV layer (https://github.com/tensorflow/tensorflow/issues/76624)

PiperOrigin-RevId: 682438954
This commit is contained in:
Artsiom Ablavatski 2024-10-04 13:50:51 -07:00 committed by TensorFlower Gardener
parent fa74dd087d
commit dde5634061
2 changed files with 18 additions and 6 deletions

View File

@@ -99,6 +99,7 @@ This release contains contributions from many people at Google, as well as:
 * Add support for `stablehlo.composite`.
 * `EmbeddingLookup` op supports per-channel quantization and `TensorType_INT4` values.
 * `FullyConnected` op supports `TensorType_INT16` activation and `TensorType_Int4` weight per-channel quantization.
+* Enable per-tensor quantization support in dynamic range quantization of `TRANSPOSE_CONV` layer. Fixes TFLite converter [bug](https://github.com/tensorflow/tensorflow/issues/76624).
 * `tf.tensor_scatter_update`, `tf.tensor_scatter_add` and of other reduce types.
 * Support `bad_indices_policy`.

View File

@@ -477,14 +477,25 @@ TfLiteStatus Prepare(TfLiteContext* context, TfLiteNode* node) {
                                       scaling_factors_size));
       }
-      const auto* affine_quantization =
-          reinterpret_cast<TfLiteAffineQuantization*>(
-              weights->quantization.params);
+      auto* affine_quantization = reinterpret_cast<TfLiteAffineQuantization*>(
+          weights->quantization.params);
       TF_LITE_ENSURE(context, affine_quantization);
       TF_LITE_ENSURE(context, affine_quantization->scale);
-      TF_LITE_ENSURE_EQ(
-          context, affine_quantization->scale->size,
-          weights->dims->data[affine_quantization->quantized_dimension]);
+
+      const int channels_out =
+          weights->dims->data[affine_quantization->quantized_dimension];
+      if (affine_quantization->scale->size != channels_out) {
+        TF_LITE_ENSURE_EQ(context, affine_quantization->scale->size, 1);
+        TfLiteFloatArrayFree(affine_quantization->scale);
+        affine_quantization->scale = TfLiteFloatArrayCreate(channels_out);
+        for (int i = 0; i < channels_out; ++i) {
+          affine_quantization->scale->data[i] = weights->params.scale;
+        }
+      } else {
+        TF_LITE_ENSURE_EQ(context, affine_quantization->scale->size,
+                          channels_out);
+      }
       node->temporaries->data[data->input_offset_index] = data->input_offset_id;
       TfLiteTensor* input_offsets;
       TF_LITE_ENSURE_OK(context,