edloper
diff --git a/‎RELEASE.md
+1 b/‎RELEASE.md
+1
diff --git a/‎tensorflow/compiler/mlir/lite/ir/tfl_ops.td
+22 b/‎tensorflow/compiler/mlir/lite/ir/tfl_ops.td
+22
diff --git a/‎tensorflow/compiler/mlir/lite/tests/legalize-tf.mlir
+7 b/‎tensorflow/compiler/mlir/lite/tests/legalize-tf.mlir
+7
diff --git a/‎tensorflow/compiler/mlir/lite/tests/mlir2flatbuffer/bucketize.mlir
+67 b/‎tensorflow/compiler/mlir/lite/tests/mlir2flatbuffer/bucketize.mlir
+67
diff --git a/‎tensorflow/compiler/mlir/lite/transforms/legalize_patterns.td
+4 b/‎tensorflow/compiler/mlir/lite/transforms/legalize_patterns.td
+4
diff --git a/‎tensorflow/lite/builtin_ops.h
+1 b/‎tensorflow/lite/builtin_ops.h
+1
diff --git a/‎tensorflow/lite/c/builtin_op_data.h
+7 b/‎tensorflow/lite/c/builtin_op_data.h
+7
diff --git a/‎tensorflow/lite/core/api/flatbuffer_conversions.cc
+13 b/‎tensorflow/lite/core/api/flatbuffer_conversions.cc
+13
diff --git a/‎tensorflow/lite/core/shims/builtin_ops_list.inc
+1 b/‎tensorflow/lite/core/shims/builtin_ops_list.inc
+1
diff --git a/‎tensorflow/lite/kernels/BUILD
+15 b/‎tensorflow/lite/kernels/BUILD
+15
diff --git a/‎tensorflow/lite/kernels/bucketize.cc
+149 b/‎tensorflow/lite/kernels/bucketize.cc
+149
@@ -17,6 +17,7 @@
 * `tf.lite`:
   * Where operation support is added for these data types
     'int32/uint32/int8/uint8/int64'
+  * Add builtin support for `Bucketize` op on CPU.
 
 *<INSERT MAJOR FEATURE HERE, USING MARKDOWN SYNTAX>
 *<IF RELEASE CONTAINS MULTIPLE FEATURES FROM SAME AREA, GROUP THEM TOGETHER>
 
@@ -5125,6 +5125,28 @@ broadcasted shape. `s0`, `s1` and `r0` are all integer vectors.
   );
 }
 
+def TFL_BucketizeOp
+    : TFL_Op<"bucketize", [NoSideEffect, SameOperandsAndResultShape]> {
+  let summary = "Bucketizes 'input' based on 'boundaries'.";
+
+  let description = [{
+Example:
+
+If the inputs are `boundaries = [0, 10, 100]` and
+`input = [[-5, 10000][150, 10][5, 100]]`,
+then the output will be `output = [[0, 3][3, 2][1, 3]]`.
+  }];
+
+  let arguments = (ins
+    TFL_TensorOf<[F32, F64, I32, I64]>:$input,  // Values to place into buckets.
+    F32ArrayAttr:$boundaries  // Bucket edges, carried as an f32 array attribute (not an operand).
+  );
+
+  let results = (outs
+    TFL_TensorOf<[I32]>:$output  // One i32 bucket index per input element.
+  );
+}
+
 #endif // TFL_OPS
 
 // LINT.ThenChange(//tensorflow/lite/tools/versioning/op_version.cc)
@@ -2233,3 +2233,10 @@ func @select_v2_with_high_dims_dynamic_shape_both_sides(%arg0: tensor<8x7x6x5x?x
   // CHECK: return %[[SELECT_V2]] : tensor<8x7x6x5x?x3x2x1xf32>
 }
 
+func @Bucketize(%arg0: tensor<3x2xf32>) -> tensor<3x2xi32> {  // Legalization test: the tf op below must become the tfl op with the same boundaries.
+  %0 = "tf.Bucketize"(%arg0) {boundaries = [1.0 : f32, 10.0 : f32, 100.0 : f32]} : (tensor<3x2xf32>) -> tensor<3x2xi32>
+  return %0: tensor<3x2xi32>
+
+// CHECK-LABEL: Bucketize
+// CHECK:  "tfl.bucketize"(%arg0) {boundaries = [1.000000e+00 : f32, 1.000000e+01 : f32, 1.000000e+02 : f32]} : (tensor<3x2xf32>) -> tensor<3x2xi32>
+}
@@ -0,0 +1,67 @@
+// RUN: flatbuffer_translate -mlir-to-tflite-flatbuffer %s -o - | flatbuffer_to_string - | FileCheck %s
+
+func @main(tensor<3x2xf32>) -> tensor<3x2xi32> {  // Export test: one constant fed through one bucketize op, compared against the expected flatbuffer text.
+^bb0(%arg0: tensor<3x2xf32>):
+  // CHECK:      {
+  // CHECK-NEXT:     version: 3,
+  // CHECK-NEXT:     operator_codes: [ {
+  // CHECK-NEXT:       deprecated_builtin_code: 127,
+  // CHECK-NEXT:       version: 1,
+  // CHECK-NEXT:       builtin_code: BUCKETIZE
+  // CHECK-NEXT:     } ],
+  // CHECK-NEXT:     subgraphs: [ {
+  // CHECK-NEXT:       tensors: [ {
+  // CHECK-NEXT:         shape: [ 3, 2 ],
+  // CHECK-NEXT:         buffer: 1,
+  // CHECK-NEXT:         name: "arg0",
+  // CHECK-NEXT:         quantization: {
+  // CHECK-EMPTY:
+  // CHECK-NEXT:         }
+  // CHECK-NEXT:       }, {
+  // CHECK-NEXT:         shape: [ 3, 2 ],
+  // CHECK-NEXT:         buffer: 2,
+  // CHECK-NEXT:         name: "Const",
+  // CHECK-NEXT:         quantization: {
+  // CHECK-EMPTY:
+  // CHECK-NEXT:         }
+  // CHECK-NEXT:       }, {
+  // CHECK-NEXT:         shape: [ 3, 2 ],
+  // CHECK-NEXT:         type: INT32,
+  // CHECK-NEXT:         buffer: 3,
+  // CHECK-NEXT:         name: "bucketize",
+  // CHECK-NEXT:         quantization: {
+  // CHECK-EMPTY:
+  // CHECK-NEXT:         }
+  // CHECK-NEXT:       } ],
+  // CHECK-NEXT:       inputs: [ 0 ],
+  // CHECK-NEXT:       outputs: [ 2 ],
+  // CHECK-NEXT:       operators: [ {
+  // CHECK-NEXT:         inputs: [ 1 ],
+  // CHECK-NEXT:         outputs: [ 2 ]
+  // CHECK-NEXT:       } ],
+  // CHECK-NEXT:       name: "main"
+  // CHECK-NEXT:     } ],
+  // CHECK-NEXT:     description: "MLIR Converted.",
+  // CHECK-NEXT:     buffers: [ {
+  // CHECK-EMPTY:
+  // CHECK-NEXT:     }, {
+  // CHECK-EMPTY:
+  // CHECK-NEXT:     }, {
+  // CHECK-NEXT:       data: [ 0, 0, 160, 192, 0, 64, 28, 70, 0, 0, 22, 67, 0, 0, 32, 65, 0, 0, 160, 64, 0, 0, 200, 66 ]
+  // CHECK-NEXT:     }, {
+  // CHECK-EMPTY:
+  // CHECK-NEXT:     }, {
+  // CHECK-NEXT:       data: [ 50, 46, 56, 46, 48, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 ]
+  // CHECK-NEXT:     } ],
+  // CHECK-NEXT:     metadata: [ {
+  // CHECK-NEXT:       name: "min_runtime_version",
+  // CHECK-NEXT:       buffer: 4
+  // CHECK-NEXT:     } ],
+  // CHECK-NEXT:     signature_defs: [  ]
+  // CHECK-NEXT: }
+  // CHECK-EMPTY:
+
+  %0 = "tfl.pseudo_const" () {value = dense<[[-5.0, 10000.0], [150.0, 10.0], [5.0, 100.0]]> : tensor<3x2xf32>} : () -> tensor<3x2xf32> loc("Const")
+  %1 = "tfl.bucketize"(%0) {boundaries = [0.0 : f32, 10.0 : f32, 100.0 : f32]} : (tensor<3x2xf32>) -> tensor<3x2xi32> loc("bucketize")
+  return %1 : tensor<3x2xi32>
+}
@@ -513,3 +513,7 @@ def LegalizeComplexAbs : Pat<(TF_ComplexAbsOp $arg), (TFL_ComplexAbsOp $arg)>;
 def LegalizeReal : Pat<(TF_RealOp $arg), (TFL_RealOp $arg)>;
 
 def LegalizeImag : Pat<(TF_ImagOp $arg), (TFL_ImagOp $arg)>;
+
+def LegalizeBucketize : Pat<  // Rewrites TF_BucketizeOp to TFL_BucketizeOp, forwarding the input and the f32 boundaries attribute.
+  (TF_BucketizeOp $input, F32ArrayAttr:$boundaries),
+  (TFL_BucketizeOp $input, $boundaries)>;
@@ -174,6 +174,7 @@ typedef enum {
   kTfLiteBuiltinAssignVariable = 144,
   kTfLiteBuiltinBroadcastArgs = 145,
   kTfLiteBuiltinRandomStandardNormal = 146,
+  kTfLiteBuiltinBucketize = 147,
 } TfLiteBuiltinOperator;
 
 #ifdef __cplusplus
 
@@ -507,6 +507,13 @@ typedef struct {
   int seed2;
 } TfLiteRandomParams;
 
+typedef struct {  // Builtin parameters for the BUCKETIZE op.
+  int num_boundaries;  // Number of floats readable through `boundaries`.
+  // This points to the memory stored in the model (flatbuffer),
+  // and is not owned.
+  const float* boundaries;
+} TfLiteBucketizeParams;
+
 #ifdef __cplusplus
 }  // extern "C"
 #endif  // __cplusplus
 
@@ -797,6 +797,19 @@ TfLiteStatus ParseOpDataTfLite(const Operator* op, BuiltinOperator op_type,
       *builtin_data = params.release();
       return kTfLiteOk;
     }
+    // Fills a TfLiteBucketizeParams from the operator's BucketizeOptions.
+    // The params only borrow the boundaries array; it is not copied.
+    case BuiltinOperator_BUCKETIZE: {
+      auto params = safe_allocator.Allocate<TfLiteBucketizeParams>();
+      TF_LITE_ENSURE(error_reporter, params != nullptr);
+      if (const auto* bucketize_params =
+              op->builtin_options_as_BucketizeOptions()) {
+        const flatbuffers::Vector<float>* boundaries =
+            bucketize_params->boundaries();
+        // The accessor yields nullptr when the model omits the vector, so
+        // report a parse error instead of dereferencing it below.
+        TF_LITE_ENSURE(error_reporter, boundaries != nullptr);
+        params->num_boundaries = boundaries->size();
+        params->boundaries = boundaries->data();
+      }
+      *builtin_data = params.release();
+      return kTfLiteOk;
+    }
     // Below are the ops with no builtin_data structure.
     // TODO(aselle): Implement call in BuiltinOptions, but nullptrs are
     // ok for now, since there is no call implementation either.
 
@@ -159,3 +159,4 @@ TFLITE_OP(Register_READ_VARIABLE)
 TFLITE_OP(Register_ASSIGN_VARIABLE)
 TFLITE_OP(Register_BROADCAST_ARGS)
 TFLITE_OP(Register_RANDOM_STANDARD_NORMAL)
+TFLITE_OP(Register_BUCKETIZE)
@@ -556,6 +556,7 @@ BUILTIN_KERNEL_SRCS = [
     "bidirectional_sequence_rnn.cc",
     "broadcast_args.cc",
     "broadcast_to.cc",
+    "bucketize.cc",
     "call_once.cc",
     "cast.cc",
     "ceil.cc",
@@ -1118,6 +1119,20 @@ cc_test(
     ],
 )
 
+cc_test(  # Builds bucketize_test.cc and links it against ":builtin_ops".
+    name = "bucketize_test",
+    size = "small",
+    srcs = ["bucketize_test.cc"],
+    deps = [
+        ":builtin_ops",
+        ":test_main",
+        ":test_util",
+        "//tensorflow/lite/schema:schema_fbs",
+        "//tensorflow/lite/testing:util",
+        "@com_google_googletest//:gtest",
+    ],
+)
+
 cc_test(
     name = "cast_test",
     size = "small",
 
@@ -0,0 +1,149 @@
+/* Copyright 2021 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include <stdint.h>
+
+#include <algorithm>
+
+#include "tensorflow/lite/c/builtin_op_data.h"
+#include "tensorflow/lite/c/common.h"
+#include "tensorflow/lite/kernels/internal/tensor.h"
+#include "tensorflow/lite/kernels/internal/tensor_ctypes.h"
+#include "tensorflow/lite/kernels/kernel_util.h"
+
+namespace tflite {
+namespace ops {
+namespace builtin {
+namespace bucketize {
+namespace {
+
+constexpr int kInputTensor = 0;  // Index of the node's only input.
+constexpr int kOutputTensor = 0;  // Index of the node's only output.
+
+struct OpData {  // Per-node state: created in Init(), destroyed in Free().
+  // boundaries array is owned by the buffer housing TfLiteBucketizeParams.
+  const float* boundaries;
+  int num_boundaries;  // Number of floats readable through `boundaries`.
+};
+
+// Creates the per-node OpData. `buffer` is interpreted as a
+// TfLiteBucketizeParams; its boundaries pointer and count are copied, the
+// array itself is not duplicated. The result is destroyed by Free().
+void* Init(TfLiteContext* context, const char* buffer, size_t length) {
+  const TfLiteBucketizeParams* const bucketize_params =
+      reinterpret_cast<const TfLiteBucketizeParams*>(buffer);
+
+  OpData* const data = new OpData();
+  data->num_boundaries = bucketize_params->num_boundaries;
+  data->boundaries = bucketize_params->boundaries;
+  return data;
+}
+
+// Destroys the OpData that Init() returned; `buffer` is that pointer.
+void Free(TfLiteContext* context, void* buffer) {
+  OpData* const data = static_cast<OpData*>(buffer);
+  delete data;
+}
+
+// Validates the node and sizes its output.
+//
+// Checks, in this order: exactly one input and one output; the boundaries
+// held in the node's OpData are in non-decreasing order; the input type is
+// int32, float32, int64 or float64. The output is then typed int32 and
+// resized to a copy of the input's dimensions. Failures are logged and
+// reported through the returned status.
+TfLiteStatus Prepare(TfLiteContext* context, TfLiteNode* node) {
+  TF_LITE_ENSURE_EQ(context, NumInputs(node), 1);
+  TF_LITE_ENSURE_EQ(context, NumOutputs(node), 1);
+
+  const OpData* const data = reinterpret_cast<const OpData*>(node->user_data);
+  const float* const boundaries_begin = data->boundaries;
+  const float* const boundaries_end = boundaries_begin + data->num_boundaries;
+  const bool boundaries_sorted =
+      std::is_sorted(boundaries_begin, boundaries_end);
+  if (!boundaries_sorted) {
+    TF_LITE_KERNEL_LOG(context, "Expected sorted boundaries");
+    return kTfLiteError;
+  }
+
+  const TfLiteTensor* input;
+  TF_LITE_ENSURE_OK(context, GetInputSafe(context, node, kInputTensor, &input));
+
+  switch (input->type) {
+    case kTfLiteInt32:
+    case kTfLiteFloat32:
+    case kTfLiteInt64:
+    case kTfLiteFloat64:
+      break;
+    default:
+      TF_LITE_KERNEL_LOG(context, "Type '%s' is not supported by bucketize.",
+                         TfLiteTypeGetName(input->type));
+      return kTfLiteError;
+  }
+
+  TfLiteTensor* output;
+  TF_LITE_ENSURE_OK(context,
+                    GetOutputSafe(context, node, kOutputTensor, &output));
+  output->type = kTfLiteInt32;
+
+  // The output has the same dimensions as the input.
+  return context->ResizeTensor(context, output,
+                               TfLiteIntArrayCopy(input->dims));
+}
+
+// Computes the bucket index of every input element.
+//
+// For each of the flat elements shared by `input_shape` and `output_shape`,
+// stores the index of the first entry of `boundaries` that is strictly
+// greater than the element, or `num_boundaries` when no entry is greater.
+// The search is a binary search, so `boundaries` must be sorted.
+template <typename T>
+inline void Bucketize(const RuntimeShape& input_shape, const T* input_data,
+                      const float* boundaries, int num_boundaries,
+                      const RuntimeShape& output_shape, int32_t* output_data) {
+  const int element_count = MatchingFlatSize(input_shape, output_shape);
+  const float* const boundaries_end = boundaries + num_boundaries;
+
+  for (int idx = 0; idx < element_count; ++idx) {
+    const float* const first_greater =
+        std::upper_bound(boundaries, boundaries_end, input_data[idx]);
+    // Distance from the start of the array is the bucket index.
+    output_data[idx] = static_cast<int32_t>(first_greater - boundaries);
+  }
+}
+
+// Runs Bucketize<T> on the node's input and output tensors using the
+// boundaries stored in the node's OpData. Fails if either tensor cannot be
+// fetched or if the output tensor is not int32.
+template <typename T>
+TfLiteStatus BucketizeImpl(TfLiteContext* context, TfLiteNode* node) {
+  const TfLiteTensor* input;
+  TF_LITE_ENSURE_OK(context, GetInputSafe(context, node, kInputTensor, &input));
+  TfLiteTensor* output;
+  TF_LITE_ENSURE_OK(context,
+                    GetOutputSafe(context, node, kOutputTensor, &output));
+  TF_LITE_ENSURE_TYPES_EQ(context, output->type, kTfLiteInt32);
+
+  const OpData* const data = reinterpret_cast<const OpData*>(node->user_data);
+  const T* const input_values = GetTensorData<T>(input);
+  int32_t* const bucket_indices = GetTensorData<int32_t>(output);
+
+  Bucketize<T>(GetTensorShape(input), input_values, data->boundaries,
+               data->num_boundaries, GetTensorShape(output), bucket_indices);
+  return kTfLiteOk;
+}
+
+// Dispatches to the BucketizeImpl instantiation matching the input tensor's
+// element type (float32, float64, int32 or int64). Any other type is logged
+// and reported as an error.
+TfLiteStatus Eval(TfLiteContext* context, TfLiteNode* node) {
+  const TfLiteTensor* input;
+  TF_LITE_ENSURE_OK(context, GetInputSafe(context, node, kInputTensor, &input));
+
+  const auto input_type = input->type;
+  if (input_type == kTfLiteFloat32) {
+    return BucketizeImpl<float>(context, node);
+  }
+  if (input_type == kTfLiteFloat64) {
+    return BucketizeImpl<double>(context, node);
+  }
+  if (input_type == kTfLiteInt32) {
+    return BucketizeImpl<int32_t>(context, node);
+  }
+  if (input_type == kTfLiteInt64) {
+    return BucketizeImpl<int64_t>(context, node);
+  }
+
+  TF_LITE_KERNEL_LOG(context, "Type '%s' is not supported by bucketize.",
+                     TfLiteTypeGetName(input_type));
+  return kTfLiteError;
+}
+
+}  // namespace
+}  // namespace bucketize
+
+// Returns the registration for the BUCKETIZE builtin: a single function-local
+// static wiring up the kernel's Init, Free, Prepare and Eval callbacks.
+TfLiteRegistration* Register_BUCKETIZE() {
+  static TfLiteRegistration registration = {
+      bucketize::Init,
+      bucketize::Free,
+      bucketize::Prepare,
+      bucketize::Eval,
+  };
+  return &registration;
+}
+
+}  // namespace builtin
+}  // namespace ops
+}  // namespace tflite