MachineLearningPractitioner
diff --git a/tensorflow/core/kernels/non_max_suppression_op.cc b/tensorflow/core/kernels/non_max_suppression_op.cc
Lines changed: 49 additions & 93 deletions
diff --git a/tensorflow/core/kernels/non_max_suppression_op_test.cc b/tensorflow/core/kernels/non_max_suppression_op_test.cc
Lines changed: 4 additions & 161 deletions
@@ -33,7 +33,6 @@ limitations under the License.
 #include "tensorflow/core/platform/logging.h"
 
 namespace tensorflow {
-namespace {
 
 typedef Eigen::ThreadPoolDevice CPUDevice;
 
@@ -90,63 +89,6 @@ static inline float ComputeIOU(typename TTypes<float, 2>::ConstTensor boxes,
   return intersection_area / (area_i + area_j - intersection_area);
 }
 
-void DoNonMaxSuppressionOp(OpKernelContext* context,
-                           const Tensor& boxes,
-                           const Tensor& scores,
-                           const Tensor& max_output_size,
-                           const float iou_threshold) {
-  OP_REQUIRES(context, iou_threshold >= 0 && iou_threshold <= 1,
-      errors::InvalidArgument("iou_threshold must be in [0, 1]"));
-  
-  int num_boxes = 0;
-  ParseAndCheckBoxSizes(context, boxes, scores, &num_boxes);
-  if (!context->status().ok()) {
-    return;
-  }
-
-  const int output_size =
-      std::min(max_output_size.scalar<int>()(), num_boxes);
-  typename TTypes<float, 2>::ConstTensor boxes_data =
-      boxes.tensor<float, 2>();
-
-  std::vector<float> scores_data(num_boxes);
-  std::copy_n(scores.flat<float>().data(), num_boxes, scores_data.begin());
-  std::vector<int> sorted_indices;
-  DecreasingArgSort(scores_data, &sorted_indices);
-
-  std::vector<bool> active(num_boxes, true);
-  std::vector<int> selected;
-  int num_active = active.size();
-  for (int i = 0; i < num_boxes; ++i) {
-    if (num_active == 0 || selected.size() >= output_size) break;
-    if (active[i]) {
-      selected.push_back(sorted_indices[i]);
-    } else {
-      continue;
-    }
-    for (int j = i + 1; j < num_boxes; ++j) {
-      if (active[j]) {
-        float iou =
-          ComputeIOU(boxes_data, sorted_indices[i], sorted_indices[j]);
-        if (iou > iou_threshold) {
-          active[j] = false;
-          num_active--;
-        }
-      }
-    }
-  }
-
-  // Allocate output tensor
-  Tensor* output = nullptr;
-  TensorShape output_shape({static_cast<int>(selected.size())});
-  OP_REQUIRES_OK(context, context->allocate_output(0, output_shape, &output));
-  typename TTypes<int, 1>::Tensor selected_indices_data =
-      output->tensor<int, 1>();
-  std::copy_n(selected.begin(), selected.size(), selected_indices_data.data());
-}
-
-} // namespace
-
 template <typename Device>
 class NonMaxSuppressionOp : public OpKernel {
  public:
@@ -156,6 +98,9 @@ class NonMaxSuppressionOp : public OpKernel {
   }
 
   void Compute(OpKernelContext* context) override {
+    OP_REQUIRES(context, iou_threshold_ >= 0 && iou_threshold_ <= 1,
+                errors::InvalidArgument("iou_threshold must be in [0, 1]"));
+
     // boxes: [num_boxes, 4]
     const Tensor& boxes = context->input(0);
     // scores: [num_boxes]
@@ -167,48 +112,59 @@ class NonMaxSuppressionOp : public OpKernel {
         errors::InvalidArgument("max_output_size must be 0-D, got shape ",
                                 max_output_size.shape().DebugString()));
 
-    DoNonMaxSuppressionOp(context, boxes, scores, max_output_size, iou_threshold_);
-  }
+    int num_boxes = 0;
+    ParseAndCheckBoxSizes(context, boxes, scores, &num_boxes);
+    if (!context->status().ok()) {
+      return;
+    }
 
- private:
-  float iou_threshold_;
-};
+    const int output_size =
+        std::min(max_output_size.scalar<int>()(), num_boxes);
+    typename TTypes<float, 2>::ConstTensor boxes_data =
+        boxes.tensor<float, 2>();
+
+    std::vector<float> scores_data(num_boxes);
+    std::copy_n(scores.flat<float>().data(), num_boxes, scores_data.begin());
+    std::vector<int> sorted_indices;
+    DecreasingArgSort(scores_data, &sorted_indices);
+
+    std::vector<bool> active(num_boxes, true);
+    std::vector<int> selected;
+    int num_active = active.size();
+    for (int i = 0; i < num_boxes; ++i) {
+      if (num_active == 0 || selected.size() >= output_size) break;
+      if (active[i]) {
+        selected.push_back(sorted_indices[i]);
+      } else {
+        continue;
+      }
+      for (int j = i + 1; j < num_boxes; ++j) {
+        if (active[j]) {
+          float iou =
+              ComputeIOU(boxes_data, sorted_indices[i], sorted_indices[j]);
+          if (iou > iou_threshold_) {
+            active[j] = false;
+            num_active--;
+          }
+        }
+      }
+    }
 
-template <typename Device>
-class NonMaxSuppressionV2Op : public OpKernel {
- public:
-  explicit NonMaxSuppressionV2Op(OpKernelConstruction* context)
-      : OpKernel(context) {
+    // Allocate output tensor
+    Tensor* output = nullptr;
+    TensorShape output_shape({static_cast<int>(selected.size())});
+    OP_REQUIRES_OK(context, context->allocate_output(0, output_shape, &output));
+    typename TTypes<int, 1>::Tensor selected_indices_data =
+        output->tensor<int, 1>();
+    std::copy_n(selected.begin(), selected.size(),
+                selected_indices_data.data());
   }
 
-  void Compute(OpKernelContext* context) override {
-    // boxes: [num_boxes, 4]
-    const Tensor& boxes = context->input(0);
-    // scores: [num_boxes]
-    const Tensor& scores = context->input(1);
-    // max_output_size: scalar
-    const Tensor& max_output_size = context->input(2);
-    OP_REQUIRES(
-        context, TensorShapeUtils::IsScalar(max_output_size.shape()),
-        errors::InvalidArgument("max_output_size must be 0-D, got shape ",
-                                max_output_size.shape().DebugString()));
-    // iou_threshold: scalar
-    const Tensor& iou_threshold = context->input(3);
-    OP_REQUIRES(
-        context, TensorShapeUtils::IsScalar(iou_threshold.shape()),
-        errors::InvalidArgument("iou_threshold must be 0-D, got shape ",
-                                iou_threshold.shape().DebugString()));
-
-    const float iou_threshold_val = iou_threshold.scalar<float>()();
-
-    DoNonMaxSuppressionOp(context, boxes, scores, max_output_size, iou_threshold_val);
-  }
+ private:
+  float iou_threshold_;
 };
 
 REGISTER_KERNEL_BUILDER(Name("NonMaxSuppression").Device(DEVICE_CPU),
                         NonMaxSuppressionOp<CPUDevice>);
 
-REGISTER_KERNEL_BUILDER(Name("NonMaxSuppressionV2").Device(DEVICE_CPU),
-                        NonMaxSuppressionV2Op<CPUDevice>);
-
 }  // namespace tensorflow
@@ -141,174 +141,18 @@ TEST_F(NonMaxSuppressionOpTest, TestInconsistentBoxAndScoreShapes) {
   AddInputFromArray<float>(TensorShape({5}), {.9f, .75f, .6f, .95f, .5f});
   AddInputFromArray<int>(TensorShape({}), {30});
   Status s = RunOpKernel();
-  
-  ASSERT_FALSE(s.ok());
-  EXPECT_TRUE(
-              StringPiece(s.ToString()).contains("scores has incompatible shape"))
-    << s;
-}
-
-TEST_F(NonMaxSuppressionOpTest, TestInvalidIOUThreshold) {
-  MakeOp(1.2);
-  AddInputFromArray<float>(TensorShape({1, 4}), {0, 0, 1, 1});
-  AddInputFromArray<float>(TensorShape({1}), {.9f});
-  AddInputFromArray<int>(TensorShape({}), {3});
-  Status s = RunOpKernel();
-
-  ASSERT_FALSE(s.ok());
-  EXPECT_TRUE(
-              StringPiece(s.ToString()).contains("iou_threshold must be in [0, 1]"))
-    << s;
-}
-
-TEST_F(NonMaxSuppressionOpTest, TestEmptyInput) {
-  MakeOp(.5);
-  AddInputFromArray<float>(TensorShape({0, 4}), {});
-  AddInputFromArray<float>(TensorShape({0}), {});
-  AddInputFromArray<int>(TensorShape({}), {30});
-  TF_ASSERT_OK(RunOpKernel());
-
-  Tensor expected(allocator(), DT_INT32, TensorShape({0}));
-  test::FillValues<int>(&expected, {});
-  test::ExpectTensorEqual<int>(expected, *GetOutput(0));
-}
-    
-//
-// NonMaxSuppressionV2Op Tests
-//
-
-class NonMaxSuppressionV2OpTest : public OpsTestBase {
- protected:
-  void MakeOp() {
-    TF_EXPECT_OK(NodeDefBuilder("non_max_suppression_op", "NonMaxSuppressionV2")
-                     .Input(FakeInput(DT_FLOAT))
-                     .Input(FakeInput(DT_FLOAT))
-                     .Input(FakeInput(DT_INT32))
-                     .Input(FakeInput(DT_FLOAT))
-                     .Finalize(node_def()));
-    TF_EXPECT_OK(InitOp());
-  }
-};
-
-TEST_F(NonMaxSuppressionV2OpTest, TestSelectFromThreeClusters) {
-  MakeOp();
-  AddInputFromArray<float>(TensorShape({6, 4}),
-                           {0, 0,  1, 1,  0, 0.1f,  1, 1.1f,  0, -0.1f, 1, 0.9f,
-                            0, 10, 1, 11, 0, 10.1f, 1, 11.1f, 0, 100,  1, 101});
-  AddInputFromArray<float>(TensorShape({6}), {.9f, .75f, .6f, .95f, .5f, .3f});
-  AddInputFromArray<int>(TensorShape({}), {3});
-  AddInputFromArray<float>(TensorShape({}), {.5f});
-  TF_ASSERT_OK(RunOpKernel());
-
-  Tensor expected(allocator(), DT_INT32, TensorShape({3}));
-  test::FillValues<int>(&expected, {3, 0, 5});
-  test::ExpectTensorEqual<int>(expected, *GetOutput(0));
-}
-
-TEST_F(NonMaxSuppressionV2OpTest, TestSelectFromThreeClustersFlippedCoordinates) {
-  MakeOp();
-  AddInputFromArray<float>(TensorShape({6, 4}),
-                           {1, 1,  0, 0,  0, 0.1f,  1, 1.1f,  0, .9f,  1, -0.1f,
-                            0, 10, 1, 11, 1, 10.1f, 0, 11.1f, 1, 101, 0, 100});
-  AddInputFromArray<float>(TensorShape({6}), {.9f, .75f, .6f, .95f, .5f, .3f});
-  AddInputFromArray<int>(TensorShape({}), {3});
-  AddInputFromArray<float>(TensorShape({}), {.5f});
-  TF_ASSERT_OK(RunOpKernel());
-
-  Tensor expected(allocator(), DT_INT32, TensorShape({3}));
-  test::FillValues<int>(&expected, {3, 0, 5});
-  test::ExpectTensorEqual<int>(expected, *GetOutput(0));
-}
-
-TEST_F(NonMaxSuppressionV2OpTest, TestSelectAtMostTwoBoxesFromThreeClusters) {
-  MakeOp();
-  AddInputFromArray<float>(TensorShape({6, 4}),
-                           {0, 0,  1, 1,  0, 0.1f,  1, 1.1f,  0, -0.1f, 1, 0.9f,
-                            0, 10, 1, 11, 0, 10.1f, 1, 11.1f, 0, 100,  1, 101});
-  AddInputFromArray<float>(TensorShape({6}), {.9f, .75f, .6f, .95f, .5f, .3f});
-  AddInputFromArray<int>(TensorShape({}), {2});
-  AddInputFromArray<float>(TensorShape({}), {.5f});
-  TF_ASSERT_OK(RunOpKernel());
-
-  Tensor expected(allocator(), DT_INT32, TensorShape({2}));
-  test::FillValues<int>(&expected, {3, 0});
-  test::ExpectTensorEqual<int>(expected, *GetOutput(0));
-}
-
-TEST_F(NonMaxSuppressionV2OpTest, TestSelectAtMostThirtyBoxesFromThreeClusters) {
-  MakeOp();
-  AddInputFromArray<float>(TensorShape({6, 4}),
-                           {0, 0,  1, 1,  0, 0.1f,  1, 1.1f,  0, -0.1f, 1, 0.9f,
-                            0, 10, 1, 11, 0, 10.1f, 1, 11.1f, 0, 100,  1, 101});
-  AddInputFromArray<float>(TensorShape({6}), {.9f, .75f, .6f, .95f, .5f, .3f});
-  AddInputFromArray<int>(TensorShape({}), {30});
-  AddInputFromArray<float>(TensorShape({}), {.5f});
-  TF_ASSERT_OK(RunOpKernel());
-
-  Tensor expected(allocator(), DT_INT32, TensorShape({3}));
-  test::FillValues<int>(&expected, {3, 0, 5});
-  test::ExpectTensorEqual<int>(expected, *GetOutput(0));
-}
-
-TEST_F(NonMaxSuppressionV2OpTest, TestSelectSingleBox) {
-  MakeOp();
-  AddInputFromArray<float>(TensorShape({1, 4}), {0, 0, 1, 1});
-  AddInputFromArray<float>(TensorShape({1}), {.9f});
-  AddInputFromArray<int>(TensorShape({}), {3});
-  AddInputFromArray<float>(TensorShape({}), {.5f});
-  TF_ASSERT_OK(RunOpKernel());
-
-  Tensor expected(allocator(), DT_INT32, TensorShape({1}));
-  test::FillValues<int>(&expected, {0});
-  test::ExpectTensorEqual<int>(expected, *GetOutput(0));
-}
-
-TEST_F(NonMaxSuppressionV2OpTest, TestSelectFromTenIdenticalBoxes) {
-  MakeOp();
-
-  int num_boxes = 10;
-  std::vector<float> corners(num_boxes * 4);
-  std::vector<float> scores(num_boxes);
-  for (int i = 0; i < num_boxes; ++i) {
-    corners[i * 4 + 0] = 0;
-    corners[i * 4 + 1] = 0;
-    corners[i * 4 + 2] = 1;
-    corners[i * 4 + 3] = 1;
-    scores[i] = .9;
-  }
-  AddInputFromArray<float>(TensorShape({num_boxes, 4}), corners);
-  AddInputFromArray<float>(TensorShape({num_boxes}), scores);
-  AddInputFromArray<int>(TensorShape({}), {3});
-  AddInputFromArray<float>(TensorShape({}), {.5f});
-  TF_ASSERT_OK(RunOpKernel());
-
-  Tensor expected(allocator(), DT_INT32, TensorShape({1}));
-  test::FillValues<int>(&expected, {0});
-  test::ExpectTensorEqual<int>(expected, *GetOutput(0));
-}
-
-TEST_F(NonMaxSuppressionV2OpTest, TestInconsistentBoxAndScoreShapes) {
-  MakeOp();
-  AddInputFromArray<float>(TensorShape({6, 4}),
-                           {0, 0,  1, 1,  0, 0.1f,  1, 1.1f,  0, -0.1f, 1, 0.9f,
-                            0, 10, 1, 11, 0, 10.1f, 1, 11.1f, 0, 100,  1, 101});
-  AddInputFromArray<float>(TensorShape({5}), {.9f, .75f, .6f, .95f, .5f});
-  AddInputFromArray<int>(TensorShape({}), {30});
-  AddInputFromArray<float>(TensorShape({}), {.5f});
-  Status s = RunOpKernel();
 
   ASSERT_FALSE(s.ok());
   EXPECT_TRUE(
       StringPiece(s.ToString()).contains("scores has incompatible shape"))
       << s;
 }
 
-TEST_F(NonMaxSuppressionV2OpTest, TestInvalidIOUThreshold) {
-  MakeOp();
+TEST_F(NonMaxSuppressionOpTest, TestInvalidIOUThreshold) {
+  MakeOp(1.2);
   AddInputFromArray<float>(TensorShape({1, 4}), {0, 0, 1, 1});
   AddInputFromArray<float>(TensorShape({1}), {.9f});
   AddInputFromArray<int>(TensorShape({}), {3});
-  AddInputFromArray<float>(TensorShape({}), {1.2f});
   Status s = RunOpKernel();
 
   ASSERT_FALSE(s.ok());
@@ -317,12 +161,11 @@ TEST_F(NonMaxSuppressionV2OpTest, TestInvalidIOUThreshold) {
       << s;
 }
 
-TEST_F(NonMaxSuppressionV2OpTest, TestEmptyInput) {
-  MakeOp();
+TEST_F(NonMaxSuppressionOpTest, TestEmptyInput) {
+  MakeOp(.5);
   AddInputFromArray<float>(TensorShape({0, 4}), {});
   AddInputFromArray<float>(TensorShape({0}), {});
   AddInputFromArray<int>(TensorShape({}), {30});
-  AddInputFromArray<float>(TensorShape({}), {.5f});
   TF_ASSERT_OK(RunOpKernel());
 
   Tensor expected(allocator(), DT_INT32, TensorShape({0}));