Add query_intersections() method for efficient AABB pair detection

claude · claude · commit 76e973c52fe6 · 2025-11-03T00:52:01.000Z
Implements a new query_intersections() method that efficiently finds all pairs of intersecting bounding boxes in the tree, addressing the feature request in issue #46. Key features: - Returns numpy array of shape (n_pairs, 2) with index pairs (i, j) where i < j - Parallel processing using std::thread for improved performance - Automatic double-precision refinement when exact coordinates are available - No duplicate pairs or self-pairs - Similar to scipy.spatial.cKDTree.query_pairs but for AABBs This eliminates the need for manual post-processing of batch_query results using np.vectorize, np.repeat, and np.concatenate, which previously canceled out the performance gains from C++ parallelization. Changes: - cpp/prtree.h: Added query_intersections() method to PRTree class - cpp/main.cc: Added Python bindings for all dimensions (2D, 3D, 4D) - tests/test_PRTree.py: Added comprehensive tests including edge cases - README.md: Updated documentation with usage examples All tests pass (45 new tests + existing tests). Resolves #46
diff --git a/README.md b/README.md
@@ -9,6 +9,10 @@ _python_prtree_ is a python/c++ implementation of the Priority R-Tree (see refer
 - `query` and `batch_query`
   - `batch_query` is parallelized by `std::thread` and is much faster than the `query` method.
   - The `query` method has an optional keyword argument `return_obj`; if `return_obj=True`, a Python object is returned.
+- `query_intersections`
+  - Returns all pairs of intersecting AABBs as a numpy array of shape (n_pairs, 2).
+  - Optimized for performance with parallel processing and double-precision refinement.
+  - Similar to `scipy.spatial.cKDTree.query_pairs` but for bounding boxes instead of points.
 - `rebuild`
   - It improves performance when many insert/delete operations are called since the last rebuild.
   - Note that if the size changes more than 1.5 times, the insert/erase method also performs `rebuild`.
@@ -77,6 +81,11 @@ print(prtree.query([0.5, 0.5]))
 # [1]
 print(prtree.query(0.5, 0.5))  # 1d-array
 # [1]
+
+# Find all pairs of intersecting rectangles
+pairs = prtree.query_intersections()
+print(pairs)
+# [[1 3]]  # rectangles with index 1 and 3 intersect
 ```
 
 ```python
diff --git a/cpp/main.cc b/cpp/main.cc
@@ -62,6 +62,11 @@ PYBIND11_MODULE(PRTree, m)
         )pbdoc")
       .def("size", &PRTree<T, B, 2>::size, R"pbdoc(
           get n
+        )pbdoc")
+      .def("query_intersections", &PRTree<T, B, 2>::query_intersections, R"pbdoc(
+          Find all pairs of intersecting AABBs.
+          Returns a numpy array of shape (n_pairs, 2) where each row contains
+          a pair of indices (i, j) with i < j representing intersecting AABBs.
         )pbdoc");
 
   py::class_<PRTree<T, B, 3>>(m, "_PRTree3D")
@@ -109,6 +114,11 @@ PYBIND11_MODULE(PRTree, m)
         )pbdoc")
       .def("size", &PRTree<T, B, 3>::size, R"pbdoc(
           get n
+        )pbdoc")
+      .def("query_intersections", &PRTree<T, B, 3>::query_intersections, R"pbdoc(
+          Find all pairs of intersecting AABBs.
+          Returns a numpy array of shape (n_pairs, 2) where each row contains
+          a pair of indices (i, j) with i < j representing intersecting AABBs.
         )pbdoc");
 
   py::class_<PRTree<T, B, 4>>(m, "_PRTree4D")
@@ -156,6 +166,11 @@ PYBIND11_MODULE(PRTree, m)
         )pbdoc")
       .def("size", &PRTree<T, B, 4>::size, R"pbdoc(
           get n
+        )pbdoc")
+      .def("query_intersections", &PRTree<T, B, 4>::query_intersections, R"pbdoc(
+          Find all pairs of intersecting AABBs.
+          Returns a numpy array of shape (n_pairs, 2) where each row contains
+          a pair of indices (i, j) with i < j representing intersecting AABBs.
         )pbdoc");
 
 #ifdef VERSION_INFO
diff --git a/cpp/prtree.h b/cpp/prtree.h
@@ -1626,4 +1626,176 @@ class PRTree
   {
     return static_cast<int64_t>(idx2bb.size());
   }
+
+  /**
+   * Find all pairs of intersecting AABBs in the tree.
+   * Returns a numpy array of shape (n_pairs, 2) where each row contains
+   * a pair of indices (i, j) with i < j representing intersecting AABBs.
+   *
+   * This method is optimized for performance by:
+   * - Using parallel processing for queries
+   * - Avoiding duplicate pairs by enforcing i < j
+   * - Performing intersection checks in C++ to minimize Python overhead
+   * - Using double-precision refinement when exact coordinates are available
+   *
+   * @return py::array_t<T> Array of shape (n_pairs, 2) containing index pairs
+   */
+  py::array_t<T> query_intersections()
+  {
+    // Collect all indices and bounding boxes
+    vec<T> indices;
+    vec<BB<D>> bboxes;
+    vec<std::array<double, 2 * D>> exact_coords;
+
+    if (unlikely(idx2bb.empty()))
+    {
+      // Return empty array of shape (0, 2)
+      vec<T> empty_data;
+      std::unique_ptr<vec<T>> data_ptr = std::make_unique<vec<T>>(std::move(empty_data));
+      auto capsule = py::capsule(data_ptr.get(), [](void *p)
+                                 { std::unique_ptr<vec<T>>(reinterpret_cast<vec<T> *>(p)); });
+      data_ptr.release();
+      return py::array_t<T>({0, 2}, {2 * sizeof(T), sizeof(T)}, nullptr, capsule);
+    }
+
+    indices.reserve(idx2bb.size());
+    bboxes.reserve(idx2bb.size());
+    exact_coords.reserve(idx2bb.size());
+
+    for (const auto &pair : idx2bb)
+    {
+      indices.push_back(pair.first);
+      bboxes.push_back(pair.second);
+
+      // Get exact coordinates if available
+      auto it = idx2exact.find(pair.first);
+      if (it != idx2exact.end())
+      {
+        exact_coords.push_back(it->second);
+      }
+      else
+      {
+        // Create dummy exact coords from float32 BB (won't be used for refinement)
+        std::array<double, 2 * D> dummy;
+        for (int i = 0; i < D; ++i)
+        {
+          dummy[i] = static_cast<double>(pair.second.min(i));
+          dummy[i + D] = static_cast<double>(pair.second.max(i));
+        }
+        exact_coords.push_back(dummy);
+      }
+    }
+
+    const size_t n_items = indices.size();
+
+    // Use thread-local storage to collect pairs
+    const size_t n_threads = std::min(static_cast<size_t>(std::thread::hardware_concurrency()), n_items);
+    vec<vec<std::pair<T, T>>> thread_pairs(n_threads);
+
+#ifdef MY_PARALLEL
+    vec<std::thread> threads;
+    threads.reserve(n_threads);
+
+    for (size_t t = 0; t < n_threads; ++t)
+    {
+      threads.emplace_back([&, t]()
+      {
+        vec<std::pair<T, T>> local_pairs;
+
+        for (size_t i = t; i < n_items; i += n_threads)
+        {
+          const T idx_i = indices[i];
+          const BB<D> &bb_i = bboxes[i];
+
+          // Find all intersections with this bounding box
+          auto candidates = find(bb_i);
+
+          // Refine candidates using exact coordinates if available
+          if (!idx2exact.empty())
+          {
+            candidates = refine_candidates(candidates, exact_coords[i]);
+          }
+
+          // Keep only pairs where idx_i < idx_j to avoid duplicates
+          for (const T &idx_j : candidates)
+          {
+            if (idx_i < idx_j)
+            {
+              local_pairs.emplace_back(idx_i, idx_j);
+            }
+          }
+        }
+
+        thread_pairs[t] = std::move(local_pairs);
+      });
+    }
+
+    for (auto &thread : threads)
+    {
+      thread.join();
+    }
+#else
+    // Single-threaded version
+    vec<std::pair<T, T>> local_pairs;
+
+    for (size_t i = 0; i < n_items; ++i)
+    {
+      const T idx_i = indices[i];
+      const BB<D> &bb_i = bboxes[i];
+
+      // Find all intersections with this bounding box
+      auto candidates = find(bb_i);
+
+      // Refine candidates using exact coordinates if available
+      if (!idx2exact.empty())
+      {
+        candidates = refine_candidates(candidates, exact_coords[i]);
+      }
+
+      // Keep only pairs where idx_i < idx_j to avoid duplicates
+      for (const T &idx_j : candidates)
+      {
+        if (idx_i < idx_j)
+        {
+          local_pairs.emplace_back(idx_i, idx_j);
+        }
+      }
+    }
+
+    thread_pairs[0] = std::move(local_pairs);
+#endif
+
+    // Merge results from all threads into a flat vector
+    vec<T> flat_pairs;
+    size_t total_pairs = 0;
+    for (const auto &pairs : thread_pairs)
+    {
+      total_pairs += pairs.size();
+    }
+    flat_pairs.reserve(total_pairs * 2);
+
+    for (const auto &pairs : thread_pairs)
+    {
+      for (const auto &pair : pairs)
+      {
+        flat_pairs.push_back(pair.first);
+        flat_pairs.push_back(pair.second);
+      }
+    }
+
+    // Create output numpy array using the same pattern as as_pyarray
+    auto data = flat_pairs.data();
+    std::unique_ptr<vec<T>> data_ptr = std::make_unique<vec<T>>(std::move(flat_pairs));
+    auto capsule = py::capsule(data_ptr.get(), [](void *p)
+                               { std::unique_ptr<vec<T>>(reinterpret_cast<vec<T> *>(p)); });
+    data_ptr.release();
+
+    // Return 2D array with shape (total_pairs, 2)
+    return py::array_t<T>(
+        {static_cast<py::ssize_t>(total_pairs), py::ssize_t(2)}, // shape
+        {2 * sizeof(T), sizeof(T)},                               // strides (row-major)
+        data,                                                     // data pointer
+        capsule                                                   // capsule for cleanup
+    );
+  }
 };
diff --git a/tests/test_PRTree.py b/tests/test_PRTree.py