diff --git a/CMakeLists.txt b/CMakeLists.txt index 5fa15b0d93..b3735a2e88 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -1,54 +1,56 @@ -# For Server x86_64 install clang for fp16 support and use the following commands cmake_minimum_required(VERSION 3.14) -project(ndd) - - -#check for the correct clang version -find_program(CLANG_CANDIDATE_C - NAMES clang-21 clang-20 clang-19 clang -) -find_program(CLANG_CANDIDATE_CXX - NAMES clang++-21 clang++-20 clang++-19 clang++ -) +# Select a Clang toolchain before project() so CMake configures the matching +# standard library and platform SDK paths. +if(NOT DEFINED CMAKE_C_COMPILER AND NOT DEFINED ENV{CC}) + if(CMAKE_HOST_SYSTEM_NAME STREQUAL "Darwin") + execute_process( + COMMAND xcrun --find clang + OUTPUT_VARIABLE CLANG_CANDIDATE_C + OUTPUT_STRIP_TRAILING_WHITESPACE + ERROR_QUIET + ) + else() + find_program(CLANG_CANDIDATE_C NAMES clang-21 clang-20 clang-19 clang) + endif() -if (NOT CLANG_CANDIDATE_C OR NOT CLANG_CANDIDATE_CXX) - message(FATAL_ERROR "Clang not found. 
Please install clang >= 19.") + if(CLANG_CANDIDATE_C) + set(CMAKE_C_COMPILER "${CLANG_CANDIDATE_C}" CACHE FILEPATH "C compiler") + endif() endif() -# Query clang version -execute_process( - COMMAND ${CLANG_CANDIDATE_C} --version - OUTPUT_VARIABLE CLANG_VERSION_OUTPUT - ERROR_VARIABLE CLANG_VERSION_ERROR - OUTPUT_STRIP_TRAILING_WHITESPACE -) +if(NOT DEFINED CMAKE_CXX_COMPILER AND NOT DEFINED ENV{CXX}) + if(CMAKE_HOST_SYSTEM_NAME STREQUAL "Darwin") + execute_process( + COMMAND xcrun --find clang++ + OUTPUT_VARIABLE CLANG_CANDIDATE_CXX + OUTPUT_STRIP_TRAILING_WHITESPACE + ERROR_QUIET + ) + else() + find_program(CLANG_CANDIDATE_CXX NAMES clang++-21 clang++-20 clang++-19 clang++) + endif() -if (NOT CLANG_VERSION_OUTPUT) - message(FATAL_ERROR "Failed to query clang version.") + if(CLANG_CANDIDATE_CXX) + set(CMAKE_CXX_COMPILER "${CLANG_CANDIDATE_CXX}" CACHE FILEPATH "C++ compiler") + endif() endif() -# Extract major version -string(REGEX MATCH "clang version ([0-9]+)" _match "${CLANG_VERSION_OUTPUT}") -set(CLANG_VERSION_MAJOR "${CMAKE_MATCH_1}") +project(ndd) -if (NOT CLANG_VERSION_MAJOR) - message(FATAL_ERROR - "Unable to determine clang version from:\n${CLANG_VERSION_OUTPUT}\n" - ) +if(NOT CMAKE_C_COMPILER_ID MATCHES "Clang" OR NOT CMAKE_CXX_COMPILER_ID MATCHES "Clang") + message(FATAL_ERROR "Clang >= 17 is required. 
Set CC/CXX or CMAKE_C_COMPILER/CMAKE_CXX_COMPILER to a Clang toolchain.") endif() -if (CLANG_VERSION_MAJOR LESS 17) - message(FATAL_ERROR - "Clang ${CLANG_VERSION_MAJOR} detected, but clang >= 17 is required " - ) +if(CMAKE_CXX_COMPILER_VERSION VERSION_LESS 17) + message(FATAL_ERROR "Clang ${CMAKE_CXX_COMPILER_VERSION} detected, but Clang >= 17 is required.") endif() -# Lock compilers -set(CMAKE_C_COMPILER "${CLANG_CANDIDATE_C}" CACHE STRING "" FORCE) -set(CMAKE_CXX_COMPILER "${CLANG_CANDIDATE_CXX}" CACHE STRING "" FORCE) +if(APPLE AND (CMAKE_C_COMPILER MATCHES "[/\\\\]Android[/\\\\].*[/\\\\]ndk[/\\\\]" OR CMAKE_CXX_COMPILER MATCHES "[/\\\\]Android[/\\\\].*[/\\\\]ndk[/\\\\]")) + message(FATAL_ERROR "Android NDK Clang was selected for a macOS build. Use Xcode Command Line Tools Clang, for example: CC=$(xcrun --find clang) CXX=$(xcrun --find clang++) cmake ...") +endif() -message(STATUS "Using Clang ${CLANG_VERSION_MAJOR}") +message(STATUS "Using ${CMAKE_CXX_COMPILER_ID} ${CMAKE_CXX_COMPILER_VERSION}") message(STATUS "C compiler : ${CMAKE_C_COMPILER}") message(STATUS "C++ compiler: ${CMAKE_CXX_COMPILER}") @@ -250,6 +252,15 @@ endif() message(STATUS "Binary name: ${NDD_BINARY_NAME}") +# Filter sources are split out so filter headers only expose declarations. +set(NDD_FILTER_SOURCES + src/filter/category_index.cpp + src/filter/filter.cpp + src/filter/numeric_index.cpp +) + +add_library(ndd_filter STATIC ${NDD_FILTER_SOURCES}) + # Add new src/*.cpp files here when they should be compiled into ndd. 
set(NDD_CORE_SOURCES src/sparse/inverted_index.cpp @@ -289,6 +300,15 @@ target_include_directories(ndd_core PRIVATE ${OPENSSL_INCLUDE_DIR} ${CURL_INCLUDE_DIRS} ) +target_include_directories(ndd_filter PRIVATE + ${CMAKE_CURRENT_SOURCE_DIR}/src + ${CMAKE_CURRENT_SOURCE_DIR}/src/core + ${CMAKE_CURRENT_SOURCE_DIR}/src/filter + ${CMAKE_CURRENT_SOURCE_DIR}/src/utils + ${CMAKE_CURRENT_SOURCE_DIR}/third_party + ${CMAKE_CURRENT_SOURCE_DIR}/third_party/json + ${LMDB_INCLUDE_DIR} +) target_include_directories(${NDD_BINARY_NAME} PRIVATE ${CMAKE_CURRENT_SOURCE_DIR}/src ${CMAKE_CURRENT_SOURCE_DIR}/src/server @@ -307,8 +327,9 @@ target_include_directories(${NDD_BINARY_NAME} PRIVATE # Set compiler flags if(NOT DEBUG) - target_compile_options(ndd_core PRIVATE -O3 -ffast-math -fno-finite-math-only) - target_compile_options(${NDD_BINARY_NAME} PRIVATE -O3 -ffast-math -fno-finite-math-only) + target_compile_options(ndd_core PRIVATE -O3 -ffast-math -fno-finite-math-only -falign-functions=64) + target_compile_options(ndd_filter PRIVATE -O3 -ffast-math -fno-finite-math-only -falign-functions=64) + target_compile_options(${NDD_BINARY_NAME} PRIVATE -O3 -ffast-math -fno-finite-math-only -falign-functions=64) endif() # Apply Flags based on selection @@ -355,6 +376,7 @@ target_compile_definitions(ndd_core PRIVATE ASIO_HAS_STD_STRING_VIEW MDB_MAXKEYSIZE=512 ) +target_compile_definitions(ndd_filter PRIVATE MDB_MAXKEYSIZE=512) target_compile_definitions(${NDD_BINARY_NAME} PRIVATE ASIO_STANDALONE ASIO_HAS_STD_CHRONO @@ -364,6 +386,7 @@ target_compile_definitions(${NDD_BINARY_NAME} PRIVATE # Link libraries target_link_libraries(${NDD_BINARY_NAME} PRIVATE + ndd_filter Threads::Threads OpenSSL::SSL OpenSSL::Crypto @@ -382,6 +405,15 @@ option(ENABLE_TESTING "Enable building tests" OFF) if(ENABLE_TESTING) enable_testing() add_subdirectory(tests) + if(TARGET ndd_filter_test) + target_link_libraries(ndd_filter_test ndd_filter) + endif() + if(TARGET ndd_vector_storage_test) + 
target_link_libraries(ndd_vector_storage_test ndd_filter) + endif() + if(TARGET ndd_numeric_index_stress_test) + target_link_libraries(ndd_numeric_index_stress_test ndd_filter) + endif() endif() message(STATUS "Processor: ${CMAKE_SYSTEM_PROCESSOR}") diff --git a/docs/filter.md b/docs/filter.md index 7340840409..b6f401d01f 100644 --- a/docs/filter.md +++ b/docs/filter.md @@ -1,95 +1,594 @@ -# Filter Design & Strategy +# Filters -This document outlines the architectural design for Endee's filtering system, covering component designs for Numeric, Category, and Boolean types, and the overarching execution strategy. +Onboarding guide to the filter subsystem on the `filter_pass` branch. Read this +top-to-bottom. The "Caveats" sections call out behaviours that are +counter-intuitive or that the team has not yet fixed; treat them as load-bearing +context, not nitpicks. -## 1. Global Filtering Strategy +The source files this doc maps to: -The system prioritizes **Pre-Filtering** followed by an adaptive search execution path. +- [src/filter/filter.hpp](../src/filter/filter.hpp), [src/filter/filter.cpp](../src/filter/filter.cpp) — top-level `Filter` class, JSON parsing, schema, query dispatch. +- [src/filter/numeric_index.hpp](../src/filter/numeric_index.hpp), [src/filter/numeric_index.cpp](../src/filter/numeric_index.cpp) — `NumericIndex`, `Bucket`, sortable-key helpers. +- [src/filter/category_index.hpp](../src/filter/category_index.hpp), [src/filter/category_index.cpp](../src/filter/category_index.cpp) — `CategoryIndex`, the bitmap-per-key store used for strings and booleans. +- [src/storage/vector_storage.hpp](../src/storage/vector_storage.hpp) — wires the filter store to vectors and metadata (`store_vectors_batch`, `deleteFilter`, `updateFilter`). +- [src/core/ndd.hpp](../src/core/ndd.hpp) — `searchKNN`, `deleteVectorsByFilter`, `updateFilters`. The adaptive search path lives here. +- [src/core/types.hpp](../src/core/types.hpp) — `FilterParams`. 
+- [src/hnsw/hnswalg.h](../src/hnsw/hnswalg.h) — HNSW fatigue boost when a filter is active. +- [src/main.cpp](../src/main.cpp) — HTTP layer. -### 1.1. Execution Flow -1. **Filter Analysis:** - * Incoming queries (e.g., `Age: [18-25] AND City: "NY"`) are broken into atomic filter operations. - * **Cardinality Estimation:** Each filter estimates its result set size (e.g., "NY" has 500 users, "Age" has 10k). -2. **Optimization (Cheapest First):** - * Filters are executed in order of increasing cardinality (smallest first). - * Results are intersected (`AND`) incrementally. If the intermediate result becomes empty, execution stops early. -3. **Adaptive Search Path:** - * Final `RoaringBitmap` of valid IDs is passed to the Vector Search engine. - * **Small Result (< 1,000 IDs):** **Bypass HNSW.** Fetch vectors for valid IDs directly and perform Brute Force distance calculation. This avoids graph overhead for sparse results. - * **Large Result:** **Filtered HNSW.** Pass the Bitmap to HNSW's `searchKnn` via `BitMapFilterFunctor`. +--- + +## 1. 
Big picture + +``` +HTTP main.cpp parses request, builds filter_array JSON + | +IndexManager ndd.hpp searchKNN / insert / delete / update + | +VectorStorage vector_storage.hpp owns filter_store_ + meta_store_ + vector_store_ + | +Filter filter/filter.cpp schema + JSON-to-index dispatch + | | + | +-- NumericIndex numbers (Number = unified int/float) + | +-- CategoryIndex strings + booleans + | +MDBX one filter env per index, multiple named DBIs +``` + +There is **one MDBX environment per index**, opened from +`/filters`, with four named sub-databases: + +| dbi | what it holds | +|------------------|------------------------------------------------------------| +| `` | filter schema JSON under key `__ndd_schema_v1__` | +| `numeric_forward`| `:` -> 4-byte sortable value (current value) | +| `numeric_inverted`| bucket-key -> serialized `Bucket` (the inverted index) | +| `category_idx` | `:` -> serialized RoaringBitmap of ids | + +Geometry is bounded by `settings::FILTER_MAP_SIZE_BITS` / `_MAX_BITS` +(env-overridable via `NDD_FILTER_MAP_SIZE_BITS` / `_MAX_BITS`). Default min is +16 MiB, default max is 64 GiB. + +--- + +## 2. Error code contract + +Every public filter call returns `ndd::OperationResult` (defined in +[src/utils/types.hpp](../src/utils/types.hpp)). The codes are a stable contract +between the filter layer and `main.cpp`: + +| code | meaning | HTTP | +|-----------|------------------------------------------------------------------|------| +| `0` | success | 2xx | +| `1` | invalid JSON shape (not an array / not an object / bad keys) | 400 | +| `2` | unsupported operator or invalid value for the field type | 400 | +| `3` | field type conflict with the persisted schema | 400 | +| `100-199` | MDBX / storage failure | 500 | +| `200-299` | corruption / invariant violation | 500 | + +`main.cpp::operation_error_is_client_error` returns true for `code < 100`. +Doc-comments on every public method spell out the per-call code range. + +--- + +## 3. 
Filter schema and field types + +Schema lives in the unnamed MDBX dbi under key `__ndd_schema_v1__` as a JSON +object `{ field_name -> FieldType }`. `FieldType` is: + +``` +Unknown = 0, String = 1, Number = 2, Bool = 4 +``` + +Two important rules: + +- **First-write-wins.** The first insert that mentions a field freezes its type. + Later inserts that use a different type return code `3`. See + `Filter::register_field_type` in [filter.cpp](../src/filter/filter.cpp). +- **JSON type drives `FieldType`.** `value.is_boolean()` → Bool, + `value.is_number()` → Number, `value.is_string()` → String. There is no way + to override. + +Schema is loaded once on `Filter` construction and cached in +`schema_cache_` under `schema_mutex_`. Every register touches MDBX (one +read-write txn per new field), so first inserts after restart pay a per-field +cost. + +### Caveats + +- The schema persistence is **not** atomic with numeric/category writes. The + schema commit happens inside `register_field_type` during validation + ([filter.cpp:683](../src/filter/filter.cpp#L683)), before any data is + written. A crash between schema commit and data write leaves a "registered + but empty" field. +- Low-level `add_to_filter()` / `add_to_filter_batch()` / + `remove_from_filter()` write directly to the `CategoryIndex` and bypass + schema registration entirely. They will happily create category entries for + a field that the schema (or a later JSON insert) thinks is `Number`. The + high-level `add_filters_from_json[_batch]` is the only schema-aware entry + point. Treat the low-level methods as legacy. + +--- + +## 4. Numbers: one float32 sortable domain + +Every numeric value — both JSON integers and JSON floats — is funneled through +`Filter::sortable_from_json` ([filter.cpp:57](../src/filter/filter.cpp#L57)) +which: + +1. Rejects non-numeric or non-finite values (`code = 2`). +2. Calls `value.get<float>()` (float32, not double). +3. Normalizes signed zero. +4. 
Passes the float to `float_to_sortable` to get a `uint32_t` that sorts the + same way as the original float. + +`float_to_sortable` is the standard IEEE-754 trick: flip all bits if the sign +bit is set, otherwise flip just the sign bit +([numeric_index.cpp:21](../src/filter/numeric_index.cpp#L21)). It makes the +representation lexicographically ordered, which means we can scan inverted +buckets with a normal MDBX cursor and get range semantics. + +There is also `int_to_sortable` in the same file. **It is no longer used by +inserts or queries.** All numeric paths go through `float_to_sortable`. The +function is left in the source for tests and for a potential future +"true integer" type. + +### Caveats (read this before debugging an off-by-one) + +- **float32 precision.** Above `2^24 = 16,777,216`, not every integer is + representable in float32. `1 vs 1.0` compare equal (good) but + `16_777_217 vs 16_777_216` collapse to the same key (bad). The doc comment + above `sortable_from_json` spells this out. +- **Strict comparisons (`$gt`, `$lt`)** use `std::nextafterf` on the float32 + bound. The "next representable" gap grows with magnitude, so the bound for + `$gt 1e20` is very different from the bound for `$gt 1.0`. See + `Filter::numeric_bound_from_comparison` in + [filter.cpp:117](../src/filter/filter.cpp#L117). +- **Migration.** Older DBs that wrote integers through `int_to_sortable` will + not interoperate with the float32 sortable keys. The numeric index has no + version field; the only currently-supported migration is "rebuild the index." + Both `numeric_index.cpp` and the inline comment in + [filter.cpp:94](../src/filter/filter.cpp#L94) call this out. +- **Bucket density.** The float bit domain is less uniformly dense in the + integer range than `int_to_sortable` was. Integer-heavy fields will create + more buckets and walk more entries on wide range scans. 
+- **Large JSON integers.** `category_value_from_json` calls `value.get<int>()` for integer category values + ([filter.cpp:91](../src/filter/filter.cpp#L91)). Values outside `int` are + unsafe (nlohmann throws on overflow; we do not catch with a code-2 message + yet). + +--- + +## 5. Numeric inverted index + +Owned by `NumericIndex`. The data model is a B+-tree of fixed-width buckets +keyed by `<field>:<base_value>`. + +### 5.1 Bucket layout + +```cpp +struct Bucket { + static constexpr size_t MAX_SIZE = 1024; // soft cap on ids.size() + static constexpr uint32_t MAX_DELTA = 65535; // u16 max + uint32_t base_value = 0; // runtime only + + std::vector<uint16_t> deltas; // sorted ascending + std::vector<idInt> ids; // index-aligned with deltas + ndd::RoaringBitmap summary_bitmap; // union of all ids +}; +``` + +Serialization (see `Bucket::serialize` / +`Bucket::deserialize` in [numeric_index.cpp:162](../src/filter/numeric_index.cpp#L162)): + +``` +[uint32_t bm_size][bitmap bytes][deltas (N * u16)][ids (N * u32)] +``` + +`N` is **derived** from the residual bytes after the bitmap: +`(iov_len - 4 - bm_size) / (sizeof(u16) + sizeof(idInt))`. The branch removed +the explicit count field — this is what the `e9cca02 numeric filters using +only floats` and the bitmap-only-bucket fix commits depend on, because it lets +`ids.size()` transiently exceed `MAX_SIZE` (slide-split fallthrough) without +overflowing a stored count. + +### 5.2 Inserts + +`NumericIndex::put_internal` ([numeric_index.cpp:720](../src/filter/numeric_index.cpp#L720)): + +1. Look up the forward entry `<field>:<id>`. If present with the same value, + no-op. If different, remove the id from its old bucket. +2. Upsert the forward entry to the new value. +3. Call `add_to_buckets` to add the id to the correct inverted bucket. + +`add_to_buckets` ([numeric_index.cpp:448](../src/filter/numeric_index.cpp#L448)) +walks back from `MDBX_SET_RANGE` to find the predecessor bucket whose +`[base, base+MAX_DELTA]` covers the value. 
If no such bucket exists, it +creates one keyed at the exact value. If the matching bucket is at +`MAX_SIZE`, it runs the **slide split**. + +### 5.3 Slide split + +A bucket whose `ids.size()` reaches `MAX_SIZE` (1024) is split at a +**value boundary**, not the median. We scan right (then left) from the median +to find the first index where `deltas[i] != deltas[i-1]`, then split there. +This guarantees the right bucket's key (`base + delta[split]`) differs from +the left bucket's key, so MDBX never sees duplicate keys. + +If the bucket is **all duplicates of `base_value`** (no value boundary +anywhere), the split cannot succeed. We fall through and just append the new +entry, letting the bucket sit momentarily over `MAX_SIZE`: + +- If the new value equals `base_value`, the duplicate run extends and the + fallthrough repeats on the next insert. +- If the new value is greater than `base_value`, the bucket now has a value + boundary; the very next insert into this bucket will slide-split cleanly. + +This is the path that creates **bitmap-only ids** (see next section). + +### 5.4 Saturated-duplicate path / bitmap-only ids + +`Bucket::add` ([numeric_index.cpp:91](../src/filter/numeric_index.cpp#L91)) +has this branch: + +```cpp +if (delta_32 == 0 && ids.size() >= MAX_SIZE) { + return; // id only goes into summary_bitmap +} +``` + +When the bucket is saturated and the incoming value equals `base_value`, the +id is added to `summary_bitmap` only. The arrays don't grow. The bitmap is +the source of truth for membership. + +Three places that depend on this: + +1. **Range scan** ([numeric_index.cpp:1011](../src/filter/numeric_index.cpp#L1011)) + handles `bucket.ids.empty()` but `summary_bitmap` non-empty: include the + bitmap iff `base_value` is in `[min_val, max_val]`. +2. **Partial-overlap scan** + ([numeric_index.cpp:1049](../src/filter/numeric_index.cpp#L1049)) reconstructs + the bitmap-only subset by `summary_bitmap` minus `{ ids[i] : deltas[i] != 0 }`. +3. 
**Slide split** ([numeric_index.cpp:629](../src/filter/numeric_index.cpp#L629)) + computes the left bucket's bitmap as `original_bitmap - right_bucket.ids` + instead of rebuilding it from `ids[]`, which would lose bitmap-only entries. + +### Caveats + +- **`Bucket::is_empty()` looks at both `ids.empty()` and + `summary_bitmap.isEmpty()`** ([numeric_index.cpp:306](../src/filter/numeric_index.cpp#L306)). + This was a fix on this branch. Older versions only looked at `ids`, which + would let a delete operation delete a bucket that still had bitmap-only ids. +- **Bucket size is not page-bounded.** `summary_bitmap` size depends on the + user-space insertion pattern, not the entry count. A high-cardinality + bucket can be much larger than an MDBX page. There is a TODO in the header + to bound buckets by page size; today they are bounded only by + `MAX_SIZE = 1024` on the array side. +- **Bitmap-only partial-overlap is expensive.** The reconstruction at + [numeric_index.cpp:1069](../src/filter/numeric_index.cpp#L1069) copies the + full bitmap then `remove()`s every delta-zero entry. For a bucket dominated + by saturated duplicates this is a real cost. + +### 5.5 Range scan: fast path + +`NumericIndex::range` ([numeric_index.cpp:902](../src/filter/numeric_index.cpp#L902)) +walks buckets forward from the start of the query. For every bucket whose +**entire `[base, base + MAX_DELTA]` extent** lies inside `[min_val, max_val]`, +it skips the full deserialize and reads only the `summary_bitmap` +(`Bucket::read_summary_bitmap`). This fires on every interior bucket of a wide +scan and is the reason wide ranges only pay deltas/ids parsing on the start +and end buckets. + +**Caveat:** the fast path is conservative — it requires the **declared +extent** to be covered, not the actual `[bucket_min, bucket_max]`. A bucket +packed tightly inside its extent still pays the deserialize unless the whole +65 K-wide window is inside the query. 
The TODO is to store actual bucket +min/max in the bucket header. + +### 5.6 Batch writes + +`NumericIndex::put_batch` ([numeric_index.cpp:800](../src/filter/numeric_index.cpp#L800)) +commits in **chunks of `BATCH_TXN_CHUNK_SIZE = 256`**. This caps each +write transaction's dirty-page footprint so MDBX cannot blow past the env +map size on a multi-thousand-entry batch (the `750e5d8` commit). The +trade-off is that the batch is not atomic across chunks. + +--- + +## 6. Category / boolean index + +`CategoryIndex` ([category_index.cpp](../src/filter/category_index.cpp)) +maps a formatted key `:` to a `RoaringBitmap`. Booleans are +treated as a category with values `"0"` / `"1"`. + +``` +add(field, value, id): + 1) txn: read bitmap for key (read-only txn) + 2) bitmap.add(id) + 3) txn: write bitmap (read-write txn) +``` + +Two transactions. `remove` is the same shape with `bitmap.remove(id)`. +`add_batch_by_key` uses `addMany` so the in-memory union is O(N) instead of +N individual `add()`s. + +### Caveats + +- **Read-modify-write across two txns is not atomic.** Two concurrent + `add()` calls to the same key can produce a lost update (writer B's read + predates writer A's commit). High-write workloads on a hot category need + external serialization until this moves into a single txn. +- **The whole bitmap is rewritten on every `add`/`remove`.** For a hot + category with millions of ids this is wasteful. Tracked in the perf TODO + list (see [filter_todo.md](filter_todo.md)). +- **Empty keys are not garbage collected.** Removing the last id from a key + leaves an empty bitmap in MDBX. +- **`$in` with an empty string is silently skipped.** `computeFilterBitmap` + skips category values whose string form is empty + ([filter.cpp:465](../src/filter/filter.cpp#L465)). An empty-string match + cannot be expressed in the current shape. + +--- + +## 7. 
Bitmap deserialization safety + +Both indexes use a hardened deserialization helper: + +- `Bucket::read_bitmap_payload` in + [numeric_index.cpp:46](../src/filter/numeric_index.cpp#L46). +- `CategoryIndex::read_bitmap_payload` in + [category_index.cpp:14](../src/filter/category_index.cpp#L14). + +Both follow the same pattern: + +1. `roaring_bitmap_portable_deserialize_size(bytes, len)` to verify the + payload self-describes a complete bitmap with no trailing junk. +2. `RoaringBitmap::readSafe(bytes, len)` (the bounds-checked deserializer). +3. `roaring_bitmap_internal_validate` to catch malformed run/array + containers. + +Any failure returns `code = 200`. This is the `a46d0b8 safe filter bitmap +deserialization` commit. Before this landed, a corrupt or empty bucket +payload could be silently treated as an empty bitmap; now it surfaces as a +corruption error. + +--- + +## 8. Query API and operators + +Top-level entry points on `Filter`: + +- `computeFilterBitmap(filter_array)` — returns the bitmap of ids matching + the AND of all clauses. +- `getIdsMatchingFilter(filter_array)` — same, materialized as a vector. +- `countIdsMatchingFilter(filter_array)` — same, materialized as a size_t. +- `check_numeric(field, id, op, val)` — fast point check via the forward + index; used by `VectorStorage::matches_filter`. + +`filter_array` is a JSON **array** of single-field objects. Each clause uses +a Mongo-style `$op`: + +```jsonc +[ + { "category": { "$eq": "books" } }, + { "in_stock": { "$eq": true } }, + { "price": { "$range": [10, 50] } }, + { "rating": { "$gte": 4.0 } }, + { "discount": { "$lt": 20 } }, + { "tags": { "$in": ["sale", "new"] } } +] +``` + +Operators supported (`computeFilterBitmap` in +[filter.cpp:372](../src/filter/filter.cpp#L372)): + +| operator | types | notes | +|------------|---------------|-----------------------------------------------------------------------| +| `$eq` | any | numeric → `range(v, v)`; category → bitmap lookup. 
| +| `$in` | any | array; numeric → per-item range; category → per-value bitmap union. | +| `$range` | Number | `[start, end]` inclusive in float32-sortable order. Errors if start > end. | +| `$lt` | Number | uses `nextafterf(x, -inf)` to make the bound exclusive. | +| `$lte` | Number | inclusive. | +| `$gt` | Number | uses `nextafterf(x, +inf)` to make the bound exclusive. | +| `$gte` | Number | inclusive. | + +After all clauses are evaluated, partial bitmaps are sorted by cardinality +ascending and AND-intersected smallest-first. The intersection short-circuits +as soon as the result is empty. + +### Caveats + +- **All clauses materialize before intersecting.** There is no cardinality + estimator and no "cheapest first" lazy evaluation despite what the older + doc claimed. Every clause runs an MDBX read pass on its own + read-only transaction; only **after** all of them complete does the AND + start. See [filter.cpp:521-545](../src/filter/filter.cpp#L521). +- **No clause-level shared snapshot.** Each `$eq`/`$in`/`$range`/`$lt..` + opens its own MDBX read txn. A concurrent writer can produce a result that + mixes pre- and post-write snapshots across clauses. The operation lock in + `searchKNN` is also intentionally disabled + ([ndd.hpp:1633](../src/core/ndd.hpp#L1633)), so reads do not serialize + against writes either. +- **Field name and `$in` value validation:** the field name must not contain + `:` (it is the key delimiter). Same rule for category values. + `validate_filter_key_component` ([filter.cpp:30](../src/filter/filter.cpp#L30)) + rejects on `:` and returns code `1`. Length, NUL bytes, control bytes, and + MDBX max-key are **not** validated. Category values are capped at 255 chars + ([filter.cpp:96](../src/filter/filter.cpp#L96)). +- **The old doc said category values may contain `:`.** They cannot. Code is + authoritative; this version of the doc reflects the code. 
+- **Schema is only consulted via `schema_cache_` during search.** If a query + arrives before any insert has touched the field, `type` defaults to + `Unknown` and the query falls through to the category branch, which will + just return an empty bitmap. --- -## 2. Numeric Filter Design +## 9. Vector storage integration -*Optimized for range queries, high compression, and sequential access.* +`VectorStorage` owns the `Filter` instance (`filter_store_`) and is the only +caller that needs to keep three stores (`vector_store_`, `meta_store_`, +`filter_store_`) in sync. The two pieces worth knowing: -### 2.1. Storage Architecture (Hybrid Bucket) -The database (LMDB) acts as a coarse-grained B+ Tree. -* **Key:** `[FieldID] + [Base_Value_32bit]`. - * Floats are mapped to lexicographically ordered integers to preserve sort order. - * Keys are stored in Big-Endian to support native cursor iteration. -* **Value (Bucket):** Fixed-size block (Max 1024 unique values). - * **Summary Bitmap (Roaring):** Pre-computed union of all IDs in the bucket. Used for $O(1)$ block retrieval during full overlaps. - * **Data Arrays (Structure of Arrays - SoA):** - * **Values:** Compressed as `uint16_t` deltas relative to the Key's `Base_Value`. - * **IDs:** Raw `idInt` array, index-aligned with values. +### 9.1 Upsert cleanup (`store_vectors_batch`) -### 2.2. Query Execution -* **Buckets Fully Inside Selection (Middle):** Use **Summary Bitmap**. Zero array access. -* **Buckets Partially Overlapping (Edges):** Scan `Values` array (SIMD), use indices to fetch specific `IDs`. +Implemented in +[vector_storage.hpp:781](../src/storage/vector_storage.hpp#L781). Four phases: -### 2.3. Constraints & Splitting -* **Split Triggers:** Count > 1024 OR Delta > 65,535. -* **Sliding Split:** To ensure Key Uniqueness in LMDB, splits do not strictly occur at the median. The split point "slides" right to find the first value divergence, ensuring `Key(RightBucket) != Key(LeftBucket)`. +1. 
**Cleanup** — for every entry whose `is_new_to_db[i] == false` (i.e. the + id-mapper says this id was already live), read its prior `meta.filter` + and call `filter_store_->remove_filters_from_json(...)` to drop the old + filter index entries. Without this, a "rename" upsert leaves the old + filter still matchable. +2. **Vectors** — `vector_store_->store_vectors_batch`. +3. **Meta** — `meta_store_->store_meta_batch` (this is the moment + `meta.filter` becomes the new value; cleanup HAD to happen before this). +4. **Filters** — `filter_store_->add_filters_from_json_batch`. + +The `is_new_to_db` vector is the id-mapper's signal: + +- `true` → fresh slot, or reuse of a deleted slot. Nothing to clean. +- `false` → existing live id, an upsert. Cleanup required. +- empty → legacy caller; cleanup is silently skipped to preserve old + semantics. New callers always pass the signal. + +### 9.2 `deleteFilter` + +[vector_storage.hpp:1049](../src/storage/vector_storage.hpp#L1049). Removes +filter index entries AND clears `meta.filter` (only when it exactly matches +the input). This is the `b0e8425` commit — before it, `deleteFilter` only +touched the index, leaving `meta.filter` populated and drifted. + +### Caveats + +- **Cross-store atomicity is by design absent.** Vector, meta, filter, and + schema writes each commit in their own MDBX txn. A crash between phases + leaves torn state: e.g. the cleanup phase committed but phase 4 never ran, + so the index entries are gone for a vector that still claims (via + `meta.filter`) to have them. The operator-visible remedy is rebuild. +- **`store_vectors_batch` issues one extra MDBX read per upserted id** to + fetch the prior `meta.filter`. Fresh inserts skip this. Heavy upsert + workloads should expect that overhead. +- **The cleanup pass only protects new writes.** Drift accumulated before + this branch landed will not be fixed automatically. A targeted rebuild is + required to clean it up. 
+- **`meta.filter` is the source of truth for cleanup.** If `meta` is + unreadable for a live id (torn earlier write), `store_vectors_batch` + returns code `103` instead of silently overwriting — better to surface the + inconsistency than to make it worse. --- -## 3. Category Filter Design +## 10. Search: filter-aware path + +`IndexManager::searchKNN` in +[ndd.hpp:1614](../src/core/ndd.hpp#L1614). When `filter_array` is non-empty: -*Optimized for exact match lookups and faceting.* +1. Compute the filter bitmap. +2. If sparse search is enabled, run the sparse query in another thread, with + the filter bitmap passed in. +3. For the dense path, branch on the bitmap's cardinality (`card`): + - `card == 0` → no dense results. + - `card < params.prefilter_threshold` → **brute force on the small set**. + Iterate the bitmap into `valid_ids`, visit those vectors via + `visit_vectors_by_ids`, compute distances directly, keep a top-`k` heap. + This bypasses HNSW. + - Otherwise → **filtered HNSW**. Pass a `BitMapFilterFunctor` and + `params.boost_percentage` to `HierarchicalNSW::searchKnn`. -### 3.1. Interface (MongoDB-Style) -* **Single Value:** `{"City": "NY"}` -* **List Membership ($in):** `{"City": {"$in": ["NY", "London", "Tokyo"]}}` +`FilterParams` ([core/types.hpp](../src/core/types.hpp)): -### 3.2. Storage Architecture -Utilizes Inverted Indices with **Text-Based Keys** to enable prefix scanning and faceting. -* **Key:** `[FieldName] + ":" + [Value]`. - * **Parsing Logic:** The system strictly splits on the **first** occurrence of `:`. - * **Format:** `City:New:York` is parsed as Field=`City`, Value=`New:York`. - * **Constraints:** `FieldName` must **not** contain the `:` character (alphanumeric + underscore recommended). `Value` can contain any character including `:`. -* **Value:** `RoaringBitmap` (Serialized). Contains all IDs that have this attribute value. 
+```cpp +struct FilterParams { + size_t prefilter_threshold = settings::PREFILTER_CARDINALITY_THRESHOLD; // default 10_000 + size_t boost_percentage = settings::FILTER_BOOST_PERCENTAGE; // default 0 +}; +``` -### 3.3. Query Execution -* **Exact Match:** Direct Key lookup. -* **$in Query:** - 1. Parse the list `["NY", "London"]`. - 2. Perform multiple Key lookups. - 3. Compute the **Union** of the resulting Bitmaps efficiently. +Both are accepted from the HTTP body under `filter_params` (see +[main.cpp:839](../src/main.cpp#L839)). + +### HNSW fatigue boost + +When `filter_boost_percentage > 0` and a filter is active, +`HierarchicalNSW::searchKnn` ([hnswalg.h:1490](../src/hnsw/hnswalg.h#L1490)) +inflates the early-exit budget by `(100 + boost) / 100`. The intuition: with +a filter the graph is rejecting more candidates, so it pays to explore more +before giving up. Set `boost_percentage > 0` if recall drops on filtered +queries. + +### Caveats + +- **The operation lock is intentionally disabled in search** + ([ndd.hpp:1632-1637](../src/core/ndd.hpp#L1632)). The comment is explicit: + "We aren't using reader's lock here to enable reads while writing. + TODO: check correctness when stressing the system." Filter results can be + inconsistent under concurrent writes. +- **The brute-force branch reads vectors one-by-one via a visitor.** This is + fast for sparse filters (small `card`) but degrades sharply if you raise + `prefilter_threshold` past a few tens of thousands. +- **HNSW filter functors are called inside the inner search loop** — keep + `bitmap.contains(id)` cheap. `BitMapFilterFunctor` wraps `RoaringBitmap` + which is already fast, but custom functors should not allocate. +- **`matches_filter`** in + [vector_storage.hpp:622](../src/storage/vector_storage.hpp#L622) is a + separate point-check API for callers that already have a vector in hand + (e.g. recovery). It tries the index for numeric clauses and parses + `meta.filter` JSON for string/bool clauses. 
It is NOT used by the main + search path. --- -## 4. Boolean Filter Design +## 11. Limits and validation summary + +What the public surface will reject (code `1` or `2`): -*Optimized for extreme density ops.* +- `filter_array` not a JSON array. +- Any clause that is not a single-field object. +- Field name empty or containing `:`. +- `$op` value's JSON type mismatching the operator (`$range` not a 2-array, + `$in` not an array, comparison value not a number). +- Non-finite numbers. +- Category values that are not string/integer/boolean, or that exceed 255 + bytes, or that contain `:`. +- `$range` with `start > end`. +- `$lt`/`$lte`/`$gt`/`$gte` on a non-Number field. -### 4.1. Storage Architecture -Treated as a specialized Category filter with strictly two possible keys per field. -* **Keys:** `[FieldName]:0` (False) and `[FieldName]:1` (True). - * Consistent with the text-based key design (uses `:` separator). -* **Value:** `RoaringBitmap`. +What it will **not** reject yet: -### 4.2. Strategy -Boolean filters are typically low-selectivity (often matching ~50% of the DB). They are processed **Last** in the intersection chain unless statistics indicate high skew (e.g., `Is_Active` is true for 99% of data, so filtering for `False` is fast). +- Overly long field names. +- NUL or control bytes in field name or value. +- Keys that exceed MDBX max-key-size (manifests as code 100 from MDBX, not + code 1). +- Two distinct large integers that collapse to the same float32 key (silent; + see §4 caveats). --- -## 5. Schema & Type Enforcement +## 12. Open work / where the bodies are buried + +Treat [docs/filter_todo.md](filter_todo.md) and +[docs/filter_issue_drafts.md](filter_issue_drafts.md) as the authoritative +TODO list. Highlights: -To ensure index integrity without a strict schema registry, the system adheres to **First-Write Wins** typing. +- **Atomicity.** Schema, numeric, category, and meta writes are independent + txns. 
Crash recovery needs a journal or single-txn execution; meanwhile + rebuild is the only safe recovery. +- **Concurrent category writes.** Read-modify-write across two txns can + drop concurrent updates to the same key. +- **Search snapshot consistency.** Filter clauses each open their own read + txn, and `searchKNN` skips the operation lock. Multi-clause results may + mix snapshots. +- **Schema bypass by low-level category APIs.** `add_to_filter()` does not + consult the schema. +- **Numeric bucket format is unversioned.** Old DBs need rebuild; tests + explicitly reject the legacy count-prefixed payload. +- **Fast path is coarse.** Tight buckets inside their extent still + deserialize. +- **`$in` issues one MDBX read txn per value.** Batch under one txn. +- **Cardinality estimator does not exist.** All partial bitmaps materialize + before intersection. -* **Immutable Types:** Once a `FieldName` is indexed with a specific type (Numeric, Category, or Boolean), that type is bound to the field. -* **Validation Logic:** - * If `is_active` is first seen as **Boolean**, subsequent attempts to insert `is_active: "yes"` (Category) or `is_active: 1` (Numeric bucket) must be rejected. - * This prevents storage corruption and ambiguous query parsing. +If you are about to land filter changes, scan §3-9 caveats first and check +whether your change closes any of them. diff --git a/src/core/ndd.hpp b/src/core/ndd.hpp index 55f6e5bc57..5c7c7de21d 100644 --- a/src/core/ndd.hpp +++ b/src/core/ndd.hpp @@ -26,6 +26,7 @@ #include #include #include +#include #include #include #include @@ -988,8 +989,18 @@ class IndexManager { entry->alg = std::move(new_alg); } + /** + * Adds or updates a batch of vectors and their associated filter documents. 
+ * + * Return codes: + * 0 = success; value is true when vectors were inserted and false for an empty batch + * 1-99 = propagated filter validation failure from vector storage + * 100-199 = storage, sparse, or propagated filter storage failure; caller should return HTTP 500 + * 200-299 = propagated filter corruption/invariant failure; caller should return HTTP 500 + */ template - bool addVectors(const std::string& index_id, const std::vector& vectors) { + ndd::OperationResult addVectors(const std::string& index_id, + const std::vector& vectors) { try { // Get the index entry (loads if needed, handles all locking) auto entry_ptr = getIndexEntry(index_id); @@ -1002,7 +1013,7 @@ class IndexManager { LOG_DEBUG("Adding " << vectors.size() << " vectors to index " << index_id); if(vectors.empty()) { LOG_DEBUG("No vectors to add"); - return false; + return {SUCCESS, "No vectors to add", false}; } // CRITICAL FIX: Pass WAL to create_ids_batch for atomic logging @@ -1068,7 +1079,7 @@ class IndexManager { index_id, "Failed to update sparse storage for batch size " << sparse_batch.size()); - return false; + return {100, "Failed to update sparse storage"}; } } } @@ -1093,14 +1104,50 @@ class IndexManager { } LOG_DEBUG("QuantVectorObject conversion completed with move semantics"); - // Store quantized vectors using optimized batch function (no double conversion!) + /* + * Store quantized vectors using optimized batch function (no double + * conversion). Two parallel vectors flow into store_vectors_batch: + * + * storage_vectors : (numeric_id, QuantVectorObject) pairs — the data. + * is_new_to_db : per-entry "did the id_mapper already know this + * str_id?" signal, carried in numeric_ids[i].second + * (see id_mapper::create_ids_batch). + * + * The flag matters because store_vectors_batch uses it to decide whether + * to run the upsert-cleanup pass for each entry: + * - true => fresh slot or reuse of a deleted slot. 
The filter index + * has nothing to clean for this numeric_id (a reuse only + * happens after deleteFilter / deletePoint scrubbed it). + * - false => the str_id was already mapped to this numeric_id, so it + * is a live-point upsert. store_vectors_batch reads the + * prior meta.filter and removes its filter index entries + * before the new ones are written. Without this signal + * the old category / numeric entries would survive and + * keep matching queries against the old filter value. + * + * Skipping this wiring (passing an empty is_new_to_db) silently disables + * the cleanup pass — that fallback exists for back-compat, but inside + * the upsert flow we always have the signal, so we always pass it. + */ std::vector> storage_vectors; + std::vector is_new_to_db; storage_vectors.reserve(quantized_vectors.size()); + is_new_to_db.reserve(quantized_vectors.size()); for(size_t i = 0; i < quantized_vectors.size(); i++) { // Copy QuantVectorObject for storage (we need to keep original for HNSW) storage_vectors.emplace_back(numeric_ids[i].first, quantized_vectors[i]); + is_new_to_db.push_back(numeric_ids[i].second); + } + auto storage_result = + entry.vector_storage->store_vectors_batch(storage_vectors, is_new_to_db); + if(!storage_result.ok()) { + if(storage_result.code < 100) { + LOG_WARN(1212, index_id, "Insert filters rejected: " << storage_result.message); + } else { + LOG_ERROR(1219, index_id, "Insert filters failed: " << storage_result.message); + } + return {storage_result.code, storage_result.message}; } - entry.vector_storage->store_vectors_batch(storage_vectors); LOG_DEBUG("Stored " << storage_vectors.size() << " pre-quantized vectors in vector storage"); @@ -1160,7 +1207,7 @@ class IndexManager { } PRINT_LOG_TIME(); - return true; + return {SUCCESS, "", true}; } catch(const std::runtime_error& e) { // Re-throw runtime_error (includes backup-in-progress check) // so it can be caught by API layer and returned as proper JSON error @@ -1330,9 +1377,19 @@ class 
IndexManager { } } - // Delete vectors from id mapper, delete filter and mark as deleted in HNSW. Does not delete - // meta, vector data Meta and vector data will be overwritten when the id is reused - bool deleteVectorsByIds(CacheEntry& entry, const std::vector& numeric_ids) { + /** + * Deletes vectors from id mapper, filter indexes, sparse storage, and HNSW live set. + * XXX: Does not delete meta, vector data Meta and vector data will be overwritten when + * the id is reused. + * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from vector storage + * 100-199 = storage or propagated filter storage failure; caller should return HTTP 500 + * 200-299 = propagated filter corruption/invariant failure; caller should return HTTP 500 + */ + ndd::OperationResult + deleteVectorsByIds(CacheEntry& entry, const std::vector& numeric_ids) { try { for(ndd::idInt numeric_id : numeric_ids) { auto meta = entry.vector_storage->get_meta(numeric_id); @@ -1344,9 +1401,23 @@ class IndexManager { continue; } // Remove the filter - entry.vector_storage->deleteFilter(numeric_id, meta.filter); - // Mark as deleted in HNSW index + auto filter_result = entry.vector_storage->deleteFilter(numeric_id, meta.filter); + if(!filter_result.ok()) { + if(filter_result.code < 100) { + LOG_WARN(1216, + entry.index_id, + "Delete-vector filter removal rejected: " + << filter_result.message); + } else { + LOG_ERROR(1217, + entry.index_id, + "Delete-vector filter removal failed: " + << filter_result.message); + } + return {filter_result.code, filter_result.message}; + } + // Mark as deleted in HNSW index entry.alg->markDelete(numeric_id); // Delete from sparse storage if hybrid index @@ -1360,14 +1431,24 @@ class IndexManager { // Mark the index as dirty entry.markDirty(); - return true; + return {SUCCESS, "", true}; } catch(const std::exception& e) { LOG_ERROR(2035, entry.index_id, "Failed to delete vectors: " << e.what()); - return false; + return {100, std::string("Failed 
to delete vectors: ") + e.what()}; } } - size_t deleteVectorsByFilter(const std::string& index_id, const nlohmann::json& filter_array) { + /** + * Deletes all vectors matching a filter query. + * + * Return codes: + * 0 = success; value is the number of deleted vectors + * 1-99 = propagated filter validation failure; caller should return HTTP 400 + * 100-199 = storage or propagated filter storage failure; caller should return HTTP 500 + * 200-299 = propagated filter corruption/invariant failure; caller should return HTTP 500 + */ + ndd::OperationResult + deleteVectorsByFilter(const std::string& index_id, const nlohmann::json& filter_array) { try { auto entry_ptr = getIndexEntry(index_id); auto& entry = *entry_ptr; @@ -1375,11 +1456,27 @@ class IndexManager { // Use per-index operation mutex to prevent concurrent operations std::unique_lock operation_lock(entry.operation_mutex); - auto numeric_ids = + auto numeric_ids_result = entry.vector_storage->filter_store_->getIdsMatchingFilter(filter_array); + if(!numeric_ids_result.ok()) { + if(numeric_ids_result.code < 100) { + LOG_WARN(1213, + index_id, + "Delete-by-filter rejected: " << numeric_ids_result.message); + } else { + LOG_ERROR(1214, + index_id, + "Delete-by-filter failed while computing filter: " + << numeric_ids_result.message); + } + return {numeric_ids_result.code, numeric_ids_result.message}; + } + + auto& numeric_ids = numeric_ids_result.value_or_throw(); LOG_DEBUG("Filter matched " << numeric_ids.size() << " vectors"); - if(deleteVectorsByIds(entry, numeric_ids)) { + auto delete_result = deleteVectorsByIds(entry, numeric_ids); + if(delete_result.ok() && delete_result.value_or_throw()) { // Check if we need to save based on WAL entry count after logging WriteAheadLog* wal = getOrCreateWAL(entry); if(wal->getEntryCount() >= persistence_config_.save_every_n_updates) { @@ -1387,22 +1484,34 @@ class IndexManager { << " updates"); saveIndexInternal(entry); } - return numeric_ids.size(); + return {SUCCESS, "", 
numeric_ids.size()}; } else { - return 0; + if(!delete_result.ok()) { + return {delete_result.code, delete_result.message}; + } + return {SUCCESS, "", static_cast(0)}; } } catch(const std::runtime_error& e) { // Re-throw runtime_error (includes backup-in-progress check) throw; } catch(const std::exception& e) { LOG_ERROR(2036, index_id, "Failed to delete vectors by filter: " << e.what()); - return 0; + return {100, std::string("Failed to delete vectors by filter: ") + e.what()}; } } - // Update filters for a batch of vectors - size_t updateFilters(const std::string& index_id, - const std::vector>& updates) { + /** + * Replaces filter documents for a batch of vectors. + * + * Return codes: + * 0 = success; value is the number of updated filters + * 1-99 = propagated filter validation failure; caller should return HTTP 400 + * 100-199 = storage or propagated filter storage failure; caller should return HTTP 500 + * 200-299 = propagated filter corruption/invariant failure; caller should return HTTP 500 + */ + ndd::OperationResult + updateFilters(const std::string& index_id, + const std::vector>& updates) { try { auto entry_ptr = getIndexEntry(index_id); auto& entry = *entry_ptr; @@ -1417,7 +1526,19 @@ class IndexManager { continue; } - entry.vector_storage->updateFilter(numeric_id, new_filter); + auto filter_result = entry.vector_storage->updateFilter(numeric_id, new_filter); + if(!filter_result.ok()) { + if(filter_result.code < 100) { + LOG_WARN(1215, + index_id, + "Update-filters rejected: " << filter_result.message); + } else { + LOG_ERROR(1218, + index_id, + "Update-filters failed: " << filter_result.message); + } + return {filter_result.code, filter_result.message}; + } updated_count++; } @@ -1425,20 +1546,29 @@ class IndexManager { entry.markDirty(); } - return updated_count; + return {SUCCESS, "", updated_count}; } catch(const std::runtime_error& e) { // Re-throw runtime_error (includes backup-in-progress check) throw; } catch(const std::exception& e) { 
LOG_ERROR(2037, index_id, "Failed to update filters: " << e.what()); - return 0; + return {100, std::string("Failed to update filters: ") + e.what()}; } } - // Delete a single vector by string ID - vector data will not be deleted. The meta and filter - // will be deleted and the vector will be marked as deleted in HNSW. The id will be put in the - // deleted_ids in id mapper and will be reused for new vectors - bool deleteVector(const std::string& index_id, const std::string& str_id) { + /** + * Deletes one vector by string id and removes its filter index entries. + * The meta and filter will be deleted and the vector will be marked as + * deleted in HNSW. The id will be put in the deleted_ids in id mapper and will be reused for new vectors. + * + * Return codes: + * 0 = success; value is false when the vector id does not exist + * 1-99 = propagated filter validation failure; caller should return HTTP 400 + * 100-199 = storage or propagated filter storage failure; caller should return HTTP 500 + * 200-299 = propagated filter corruption/invariant failure; caller should return HTTP 500 + */ + ndd::OperationResult deleteVector(const std::string& index_id, + const std::string& str_id) { try { auto entry_ptr = getIndexEntry(index_id); auto& entry = *entry_ptr; @@ -1448,12 +1578,12 @@ class IndexManager { size_t numeric_id = entry.id_mapper->get_id(str_id); if(numeric_id == 0) { - return false; + return {SUCCESS, "", false}; } - bool result = deleteVectorsByIds(entry, {static_cast(numeric_id)}); + auto result = deleteVectorsByIds(entry, {static_cast(numeric_id)}); // Check if we need to save based on WAL entry count after logging - if(result) { + if(result.ok() && result.value_or_throw()) { WriteAheadLog* wal = getOrCreateWAL(entry); if(wal->getEntryCount() >= persistence_config_.save_every_n_updates) { LOG_DEBUG("Saving index " << index_id << " after " << wal->getEntryCount() @@ -1468,21 +1598,20 @@ class IndexManager { throw; } catch(const std::exception& e) { 
LOG_ERROR(2038, index_id, "Failed to delete vector: " << e.what()); - return false; + return {100, std::string("Failed to delete vector: ") + e.what()}; } } - std::optional> searchKNN(const std::string& index_id, - const std::vector& query, - size_t k, - const nlohmann::json& filter_array, - ndd::FilterParams params = {}, - bool include_vectors = false, - size_t ef = 0) { - return searchKNN(index_id, query, {}, {}, k, filter_array, params, include_vectors, ef); - } - - std::optional> + /** + * Searches an index with optional filter bitmap computation. + * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure; caller should return HTTP 400 + * 100-199 = search or propagated filter storage failure; caller should return HTTP 500 + * 200-299 = propagated filter corruption/invariant failure; caller should return HTTP 500 + */ + ndd::OperationResult> searchKNN(const std::string& index_id, const std::vector& query, const std::vector& sparse_indices, @@ -1516,13 +1645,25 @@ class IndexManager { // Zero-weight sources cannot influence the final ranking, so skip their retrieval // work entirely. if(!run_dense_search && !run_sparse_search) { - return std::vector(); + return {SUCCESS, "", std::vector()}; } // 0. Compute Filter Bitmap (Shared) std::optional active_filter_bitmap; if (!filter_array.empty()) { - active_filter_bitmap = entry.vector_storage->filter_store_->computeFilterBitmap(filter_array); + auto filter_result = + entry.vector_storage->filter_store_->computeFilterBitmap(filter_array); + if(!filter_result.ok()) { + if(filter_result.code < 100) { + LOG_WARN(1220, index_id, "Search filter rejected: " << filter_result.message); + } else { + LOG_ERROR(1221, + index_id, + "Search filter computation failed: " << filter_result.message); + } + return {filter_result.code, filter_result.message}; + } + active_filter_bitmap = std::move(filter_result.value_or_throw()); } const ndd::RoaringBitmap* filter_ptr = active_filter_bitmap ? 
&(*active_filter_bitmap) : nullptr; @@ -1579,26 +1720,47 @@ class IndexManager { if (card == 0) { // No results match filter } else if (card < params.prefilter_threshold) { - // Strategy A: Brute Force on Small Subset + // Strategy A: Brute Force on Small Subset std::vector valid_ids; - valid_ids.reserve(card); - bitmap.iterate([](ndd::idInt id, void* ptr){ - static_cast*>(ptr)->push_back(id); - return true; - }, &valid_ids); - - // Fetch vectors - auto vector_batch = entry.vector_storage->get_vectors_batch(valid_ids); - - // Prepare subset for bruteforce search - std::vector>> vector_subset; - vector_subset.reserve(vector_batch.size()); - for(auto& [nid, vbytes] : vector_batch) { - vector_subset.emplace_back(nid, std::move(vbytes)); + { + valid_ids.reserve(card); + bitmap.iterate( + [](ndd::idInt id, void* ptr) { + static_cast*>(ptr)->push_back(id); + return true; + }, + &valid_ids); } - dense_results = hnswlib::searchKnnSubset( - query_bytes.data(), vector_subset, k, space); + { + auto distance_func = space->get_dist_func(); + void* dist_func_param = space->get_dist_func_param(); + std::priority_queue> top_results; + + if(k > 0) { + entry.vector_storage->visit_vectors_by_ids( + valid_ids, + [&](ndd::idInt numeric_id, const void* vector_data) { + float distance = distance_func(query_bytes.data(), + vector_data, + dist_func_param); + + if(top_results.size() < k) { + top_results.emplace(distance, numeric_id); + } else if(distance < top_results.top().first) { + top_results.pop(); + top_results.emplace(distance, numeric_id); + } + }); + } + + dense_results.reserve(top_results.size()); + while(!top_results.empty()) { + dense_results.push_back(top_results.top()); + top_results.pop(); + } + std::reverse(dense_results.begin(), dense_results.end()); + } } else { // Strategy B: Filtered HNSW Search @@ -1634,7 +1796,7 @@ class IndexManager { std::vector> final_candidates; if(dense_results.empty() && sparse_results.empty()) { - return std::vector(); + return {SUCCESS, "", 
std::vector()}; } else if(sparse_results.empty()) { // Only dense results final_candidates.reserve(dense_results.size()); @@ -1687,17 +1849,27 @@ class IndexManager { results.reserve(final_candidates.size()); LOG_DEBUG("Search results size: " << final_candidates.size()); - // Process and filter results + // Postfilter strategy: + // Every code path that feeds final_candidates already enforces filter_ptr: + // - Filtered HNSW search drops ids via BitMapFilterFunctor (filter.hpp). + // - Prefilter brute-force only iterates ids drawn from the bitmap. + // - Sparse search drops non-matching ids inside its scoring phase + // (inverted_index.cpp). + // So on the dense-only path the per-result contains() check is dead and + // we skip it. On the hybrid path we keep it as defense-in-depth in case + // sparse search ever stops honoring the filter; either way the check now + // runs before get_meta() so a (defensive) reject does not pay an MDBX read. + const bool postfilter_active = filter_ptr != nullptr && run_sparse_search; + size_t postfilter_drops = 0; size_t filtered_count = 0; for(const auto& p : final_candidates) { - // Get metadata - ndd::VectorMeta meta = entry.vector_storage->get_meta(p.second); - - // Apply filter - if(filter_ptr && !filter_ptr->contains(p.second)) { + if(postfilter_active && !filter_ptr->contains(p.second)) { + ++postfilter_drops; continue; } + ndd::VectorMeta meta = entry.vector_storage->get_meta(p.second); + ndd::VectorResult result; result.id = meta.id; result.filter = meta.filter; @@ -1730,10 +1902,19 @@ class IndexManager { if(results.size() > k) { results.resize(k); } - return results; + + // A drop here means an upstream filter step failed to honor filter_ptr. + // Log once per request rather than per-result to respect the hot-loop rule. 
+ if(postfilter_drops > 0) { + LOG_WARN(1222, + index_id, + "Postfilter dropped " << postfilter_drops + << " ids that bypassed upstream filter checks"); + } + return {SUCCESS, "", std::move(results)}; } catch(const std::exception& e) { LOG_ERROR(2039, index_id, "Search failed: " << e.what()); - return std::nullopt; + return {100, std::string("Search failed: ") + e.what()}; } } @@ -2280,4 +2461,4 @@ inline std::pair IndexManager::uploadBackup(const std::string backup_store_.writeBackupJson(username, backup_db); return {true, "Backup uploaded successfully"}; -} \ No newline at end of file +} diff --git a/src/filter/category_index.cpp b/src/filter/category_index.cpp new file mode 100644 index 0000000000..35cb881926 --- /dev/null +++ b/src/filter/category_index.cpp @@ -0,0 +1,341 @@ +#include "category_index.hpp" + +#include +#include + +namespace ndd { + namespace filter { + + std::string CategoryIndex::format_filter_key(const std::string& field, + const std::string& value) { + return field + ":" + value; + } + + ndd::OperationResult + CategoryIndex::read_bitmap_payload(const void* data, size_t len) { + if(data == nullptr || len == 0) { + return {200, "empty bitmap payload"}; + } + + const char* bytes = static_cast(data); + const size_t consumed = + roaring::api::roaring_bitmap_portable_deserialize_size(bytes, len); + if(consumed == 0) { + return {200, "invalid or truncated bitmap payload"}; + } + if(consumed != len) { + return {200, + "bitmap payload length mismatch: consumed " + + std::to_string(consumed) + " of " + + std::to_string(len) + " bytes"}; + } + + ndd::RoaringBitmap bitmap; + try { + bitmap = ndd::RoaringBitmap::readSafe(bytes, len); + } catch(const std::exception& e) { + return {200, + "failed to deserialize bitmap payload: " + std::string(e.what())}; + } + + const char* reason = nullptr; + if(!roaring::api::roaring_bitmap_internal_validate(&bitmap.roaring, &reason)) { + return {200, + std::string("invalid bitmap internals") + + (reason != nullptr ? 
": " + std::string(reason) : "")}; + } + return {SUCCESS, "", std::move(bitmap)}; + } + + /* + * Loads the bitmap stored for a formatted category filter key. + * + * Return codes: + * 0 = success + * 100 = MDBX transaction or read failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt stored bitmap payload; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult + CategoryIndex::get_bitmap_internal(const std::string& filter_key) const { + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn); + if(rc != MDBX_SUCCESS) { + return {100, + "Failed to begin category bitmap read transaction: " + + std::string(mdbx_strerror(rc))}; + } + + MDBX_val key{const_cast(filter_key.c_str()), filter_key.size()}; + MDBX_val data; + + rc = mdbx_get(txn, dbi_, &key, &data); + if(rc == MDBX_NOTFOUND || (rc == MDBX_SUCCESS && data.iov_len == 0)) { + mdbx_txn_abort(txn); + return {SUCCESS, "", ndd::RoaringBitmap()}; + } + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + return {100, + "Failed to read category bitmap key '" + filter_key + + "': " + std::string(mdbx_strerror(rc))}; + } + + auto bitmap_result = read_bitmap_payload(data.iov_base, data.iov_len); + if(!bitmap_result.ok()) { + mdbx_txn_abort(txn); + return {bitmap_result.code, + "Corrupt category bitmap payload for key '" + filter_key + + "': " + bitmap_result.message}; + } + if(!bitmap_result.value.has_value()) { + mdbx_txn_abort(txn); + return {200, "Category bitmap reader succeeded without a bitmap for key '" + + filter_key + "'"}; + } + mdbx_txn_abort(txn); + return {SUCCESS, "", std::move(*bitmap_result.value)}; + } + + /* + * Stores the bitmap for a formatted category filter key. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX transaction or write failure; caller should log ERROR and return HTTP 500 + * 200 = invalid bitmap serialization; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult<> CategoryIndex::store_bitmap_internal( + const std::string& filter_key, + const ndd::RoaringBitmap& bitmap) { + size_t required_size = bitmap.getSizeInBytes(); + if(required_size == 0) { + return {200, "Invalid category bitmap serialization size for key '" + + filter_key + "'"}; + } + + std::vector buffer(required_size); + bitmap.write(buffer.data(), true); + + MDBX_val key{const_cast(filter_key.c_str()), filter_key.size()}; + MDBX_val data{const_cast(buffer.data()), buffer.size()}; + + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); + if(rc != MDBX_SUCCESS) { + return {100, + "Failed to begin category bitmap write transaction: " + + std::string(mdbx_strerror(rc))}; + } + + rc = mdbx_put(txn, dbi_, &key, &data, MDBX_UPSERT); + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + return {100, "Failed to store category bitmap key '" + filter_key + + "': " + std::string(mdbx_strerror(rc))}; + } + + rc = mdbx_txn_commit(txn); + if(rc != MDBX_SUCCESS) { + return {100, + "Failed to commit category bitmap write transaction: " + + std::string(mdbx_strerror(rc))}; + } + return {SUCCESS, ""}; + } + + CategoryIndex::CategoryIndex(MDBX_env* env) : + env_(env) { + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); + if(rc != MDBX_SUCCESS) { + throw std::runtime_error( + std::string("Failed to begin txn for CategoryIndex init: ") + + mdbx_strerror(rc)); + } + + // Open named DB for category/boolean + rc = mdbx_dbi_open(txn, "category_idx", MDBX_CREATE, &dbi_); + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + throw std::runtime_error(std::string("Failed to open category_idx dbi: ") + + mdbx_strerror(rc)); + } + + rc = mdbx_txn_commit(txn); + if(rc != 
MDBX_SUCCESS) { + throw std::runtime_error(std::string("Failed to commit CategoryIndex init: ") + + mdbx_strerror(rc)); + } + } + + /* + * Lists all unique category values stored for one field. + * + * Return codes: + * 0 = success + * 100 = MDBX transaction, cursor, or scan failure; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult> + CategoryIndex::scan_values(const std::string& field) const { + std::vector values; + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn); + if(rc != MDBX_SUCCESS) { + return {100, + "Failed to begin category value scan transaction: " + + std::string(mdbx_strerror(rc))}; + } + + MDBX_cursor* cursor = nullptr; + rc = mdbx_cursor_open(txn, dbi_, &cursor); + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + return {100, + "Failed to open category value scan cursor: " + + std::string(mdbx_strerror(rc))}; + } + + std::string prefix = field + ":"; + MDBX_val key{const_cast(prefix.c_str()), prefix.size()}; + MDBX_val data; + + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_SET_RANGE); + while(rc == MDBX_SUCCESS) { + std::string found_key(static_cast(key.iov_base), key.iov_len); + if(found_key.rfind(prefix, 0) != 0) { + break; + } + + values.push_back(found_key.substr(prefix.size())); + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_NEXT); + } + + mdbx_cursor_close(cursor); + mdbx_txn_abort(txn); + + if(rc != MDBX_SUCCESS && rc != MDBX_NOTFOUND) { + return {100, "Failed during category value scan: " + + std::string(mdbx_strerror(rc))}; + } + return {SUCCESS, "", std::move(values)}; + } + + /* + * Loads the bitmap for one category field/value pair. 
+ * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from the bitmap read helper + * 200-299 = propagated corruption/invariant failure from the bitmap read helper + */ + ndd::OperationResult + CategoryIndex::get_bitmap(const std::string& field, const std::string& value) const { + return get_bitmap_internal(format_filter_key(field, value)); + } + + /* + * Loads the bitmap for an already formatted category key. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from the bitmap read helper + * 200-299 = propagated corruption/invariant failure from the bitmap read helper + */ + ndd::OperationResult + CategoryIndex::get_bitmap_by_key(const std::string& key) const { + return get_bitmap_internal(key); + } + + /* + * Adds one id to a category field/value bitmap. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from bitmap read/write helpers + * 200-299 = propagated corruption/invariant failure from bitmap read/write helpers + */ + ndd::OperationResult<> + CategoryIndex::add(const std::string& field, const std::string& value, ndd::idInt id) { + std::string filter_key = format_filter_key(field, value); + auto bitmap_result = get_bitmap_internal(filter_key); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + + bitmap_result.value_or_throw().add(id); + return store_bitmap_internal(filter_key, bitmap_result.value_or_throw()); + } + + /* + * Removes one id from a category field/value bitmap. 
+ * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from bitmap read/write helpers + * 200-299 = propagated corruption/invariant failure from bitmap read/write helpers + */ + ndd::OperationResult<> + CategoryIndex::remove(const std::string& field, const std::string& value, ndd::idInt id) { + std::string filter_key = format_filter_key(field, value); + auto bitmap_result = get_bitmap_internal(filter_key); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + + bitmap_result.value_or_throw().remove(id); + return store_bitmap_internal(filter_key, bitmap_result.value_or_throw()); + } + + /* + * Checks whether one id is present in a category field/value bitmap. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from the bitmap read helper + * 200-299 = propagated corruption/invariant failure from the bitmap read helper + */ + ndd::OperationResult + CategoryIndex::contains(const std::string& field, + const std::string& value, + ndd::idInt id) const { + auto bitmap_result = get_bitmap_internal(format_filter_key(field, value)); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + return {SUCCESS, "", bitmap_result.value_or_throw().contains(id)}; + } + + /* + * Adds a batch of ids to an already formatted category key. 
+ * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from bitmap read/write helpers + * 200-299 = propagated corruption/invariant failure from bitmap read/write helpers + */ + ndd::OperationResult<> + CategoryIndex::add_batch_by_key(const std::string& key, + const std::vector& ids) { + if(ids.empty()) { + return {SUCCESS, ""}; + } + auto bitmap_result = get_bitmap_internal(key); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + + bitmap_result.value_or_throw().addMany(ids.size(), ids.data()); + return store_bitmap_internal(key, bitmap_result.value_or_throw()); + } + + // Expose key formatting for external batching logic + std::string CategoryIndex::make_key(const std::string& field, const std::string& value) { + return format_filter_key(field, value); + } + + MDBX_dbi CategoryIndex::get_dbi() const { + return dbi_; + } + + } // namespace filter +} // namespace ndd diff --git a/src/filter/category_index.hpp b/src/filter/category_index.hpp index 58ffa62c69..20ca6fae24 100644 --- a/src/filter/category_index.hpp +++ b/src/filter/category_index.hpp @@ -1,12 +1,12 @@ #pragma once +#include #include #include -#include -#include + #include "mdbx/mdbx.h" -#include "../utils/log.hpp" #include "../core/types.hpp" +#include "../utils/types.hpp" namespace ndd { namespace filter { @@ -17,196 +17,116 @@ namespace ndd { MDBX_dbi dbi_; static std::string format_filter_key(const std::string& field, - const std::string& value) { - return field + ":" + value; - } - - // Load bitmap from LMDB - ndd::RoaringBitmap get_bitmap_internal(const std::string& filter_key) const { - MDBX_txn* txn; - int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn); - if(rc != MDBX_SUCCESS) { - throw std::runtime_error("Failed to begin read transaction: " - + std::string(mdbx_strerror(rc))); - } - - try { - MDBX_val key{const_cast(filter_key.c_str()), filter_key.size()}; - MDBX_val data; - - rc = mdbx_get(txn, dbi_, &key, &data); - 
if(rc == MDBX_NOTFOUND) { - mdbx_txn_abort(txn); - // LOG_DEBUG("Filter key not found: " << filter_key); - return ndd::RoaringBitmap(); // Return empty bitmap - } - if(rc != MDBX_SUCCESS) { - mdbx_txn_abort(txn); - throw std::runtime_error("Failed to read filter key '" + filter_key - + "': " + std::string(mdbx_strerror(rc))); - } - - if(data.iov_len == 0) { - mdbx_txn_abort(txn); - // LOG_DEBUG("Empty data for filter key: " << filter_key); - return ndd::RoaringBitmap(); - } - - ndd::RoaringBitmap bitmap = - ndd::RoaringBitmap::read(static_cast(data.iov_base)); - mdbx_txn_abort(txn); - return bitmap; - } catch(...) { - mdbx_txn_abort(txn); - throw; - } - } - - void store_bitmap_internal(const std::string& filter_key, - const ndd::RoaringBitmap& bitmap) { - if(bitmap.cardinality() == 0) { - // LOG_DEBUG("Storing empty bitmap for key: " << filter_key); - } - - size_t required_size = bitmap.getSizeInBytes(); - if(required_size == 0) { - throw std::runtime_error("Invalid bitmap serialization: size is 0"); - } - - std::vector buffer(required_size); - bitmap.write(buffer.data(), true); - - MDBX_val key{const_cast(filter_key.c_str()), filter_key.size()}; - MDBX_val data{const_cast(buffer.data()), buffer.size()}; - - MDBX_txn* txn; - int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); - if(rc != MDBX_SUCCESS) { - throw std::runtime_error("Failed to begin write transaction: " - + std::string(mdbx_strerror(rc))); - } - - rc = mdbx_put(txn, dbi_, &key, &data, MDBX_UPSERT); - if(rc != MDBX_SUCCESS) { - mdbx_txn_abort(txn); - throw std::runtime_error("Failed to store bitmap: " - + std::string(mdbx_strerror(rc))); - } - - rc = mdbx_txn_commit(txn); - if(rc != MDBX_SUCCESS) { - throw std::runtime_error("Failed to commit transaction: " - + std::string(mdbx_strerror(rc))); - } - } + const std::string& value); + + static ndd::OperationResult + read_bitmap_payload(const void* data, size_t len); + + /* + * Loads the bitmap stored for a formatted category filter key. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX transaction or read failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt stored bitmap payload; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult + get_bitmap_internal(const std::string& filter_key) const; + + /* + * Stores the bitmap for a formatted category filter key. + * + * Return codes: + * 0 = success + * 100 = MDBX transaction or write failure; caller should log ERROR and return HTTP 500 + * 200 = invalid bitmap serialization; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult<> store_bitmap_internal(const std::string& filter_key, + const ndd::RoaringBitmap& bitmap); public: - CategoryIndex(MDBX_env* env) : - env_(env) { - MDBX_txn* txn; - int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); - if(rc != MDBX_SUCCESS) { - throw std::runtime_error(std::string("Failed to begin txn for CategoryIndex init: ") + mdbx_strerror(rc)); - } - - // Open named DB for category/boolean - rc = mdbx_dbi_open(txn, "category_idx", MDBX_CREATE, &dbi_); - if(rc != MDBX_SUCCESS) { - mdbx_txn_abort(txn); - throw std::runtime_error(std::string("Failed to open category_idx dbi: ") + mdbx_strerror(rc)); - } - - mdbx_txn_commit(txn); - } - - // Faceting: List all unique values for a field - std::vector scan_values(const std::string& field) const { - std::vector values; - MDBX_txn* txn; - if (mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn) != MDBX_SUCCESS) return values; - - MDBX_cursor* cursor; - mdbx_cursor_open(txn, dbi_, &cursor); - - std::string prefix = field + ":"; - MDBX_val key{const_cast(prefix.c_str()), prefix.size()}; - MDBX_val data; - - int rc = mdbx_cursor_get(cursor, &key, &data, MDBX_SET_RANGE); - while(rc == MDBX_SUCCESS) { - std::string found_key((char*)key.iov_base, key.iov_len); - if(found_key.rfind(prefix, 0) != 0) break; - - values.push_back(found_key.substr(prefix.size())); - rc = mdbx_cursor_get(cursor, &key, &data, MDBX_NEXT); - } 
- mdbx_cursor_close(cursor); - mdbx_txn_abort(txn); - return values; - } - - ndd::RoaringBitmap get_bitmap(const std::string& field, - const std::string& value) const { - return get_bitmap_internal(format_filter_key(field, value)); - } - - // Direct key access for internal use if needed, or expose format_filter_key - ndd::RoaringBitmap get_bitmap_by_key(const std::string& key) const { - return get_bitmap_internal(key); - } - - void add(const std::string& field, const std::string& value, ndd::idInt id) { - std::string filter_key = format_filter_key(field, value); - ndd::RoaringBitmap bitmap = get_bitmap_internal(filter_key); - bitmap.add(id); - store_bitmap_internal(filter_key, bitmap); - } - - void remove(const std::string& field, const std::string& value, ndd::idInt id) { - std::string filter_key = format_filter_key(field, value); - ndd::RoaringBitmap bitmap = get_bitmap_internal(filter_key); - bitmap.remove(id); - store_bitmap_internal(filter_key, bitmap); - } - - bool contains(const std::string& field, const std::string& value, ndd::idInt id) const { - std::string filter_key = format_filter_key(field, value); - ndd::RoaringBitmap bitmap = get_bitmap_internal(filter_key); - return bitmap.contains(id); - } - - void add_batch(const std::string& field, - const std::string& value, - const std::vector& ids) { - if(ids.empty()) { - return; - } - std::string filter_key = format_filter_key(field, value); - ndd::RoaringBitmap bitmap = get_bitmap_internal(filter_key); - for(const auto& id : ids) { - bitmap.add(id); - } - store_bitmap_internal(filter_key, bitmap); - } - - // Helper for batch operations where key is already formatted - void add_batch_by_key(const std::string& key, const std::vector& ids) { - if(ids.empty()) { - return; - } - ndd::RoaringBitmap bitmap = get_bitmap_internal(key); - for(const auto& id : ids) { - bitmap.add(id); - } - store_bitmap_internal(key, bitmap); - } + CategoryIndex(MDBX_env* env); + + /* + * Lists all unique category values stored for 
one field. + * + * Return codes: + * 0 = success + * 100 = MDBX transaction, cursor, or scan failure; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult> + scan_values(const std::string& field) const; + + /* + * Loads the bitmap for one category field/value pair. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from the bitmap read helper + * 200-299 = propagated corruption/invariant failure from the bitmap read helper + */ + ndd::OperationResult + get_bitmap(const std::string& field, const std::string& value) const; + + /* + * Loads the bitmap for an already formatted category key. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from the bitmap read helper + * 200-299 = propagated corruption/invariant failure from the bitmap read helper + */ + ndd::OperationResult + get_bitmap_by_key(const std::string& key) const; + + /* + * Adds one id to a category field/value bitmap. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from bitmap read/write helpers + * 200-299 = propagated corruption/invariant failure from bitmap read/write helpers + */ + ndd::OperationResult<> + add(const std::string& field, const std::string& value, ndd::idInt id); + + /* + * Removes one id from a category field/value bitmap. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from bitmap read/write helpers + * 200-299 = propagated corruption/invariant failure from bitmap read/write helpers + */ + ndd::OperationResult<> + remove(const std::string& field, const std::string& value, ndd::idInt id); + + /* + * Checks whether one id is present in a category field/value bitmap. 
+ * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from the bitmap read helper + * 200-299 = propagated corruption/invariant failure from the bitmap read helper + */ + ndd::OperationResult + contains(const std::string& field, const std::string& value, ndd::idInt id) const; + + /* + * Adds a batch of ids to an already formatted category key. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from bitmap read/write helpers + * 200-299 = propagated corruption/invariant failure from bitmap read/write helpers + */ + ndd::OperationResult<> + add_batch_by_key(const std::string& key, const std::vector& ids); // Expose key formatting for external batching logic - static std::string make_key(const std::string& field, const std::string& value) { - return format_filter_key(field, value); - } + static std::string make_key(const std::string& field, const std::string& value); - MDBX_dbi get_dbi() const { return dbi_; } + MDBX_dbi get_dbi() const; }; } // namespace filter diff --git a/src/filter/filter.cpp b/src/filter/filter.cpp new file mode 100644 index 0000000000..646e8d3bcd --- /dev/null +++ b/src/filter/filter.cpp @@ -0,0 +1,991 @@ +#include "filter.hpp" + +#include +#include +#include +#include +#include +#include +#include + +#include "../utils/log.hpp" +#include "../utils/settings.hpp" + +BitMapFilterFunctor::BitMapFilterFunctor(const ndd::RoaringBitmap& bitmap) : + bitmap_(bitmap) {} + +bool BitMapFilterFunctor::operator()(ndd::idInt id) { + return bitmap_.contains(id); +} + +std::string Filter::format_filter_key(const std::string& field, const std::string& value) { + return field + ":" + value; +} + +// Rejects ':' because it is the MDBX key delimiter for category and numeric +// indexes (see format_filter_key, NumericIndex::make_*_key). Allowing ':' in +// user input causes byte-level key collisions across distinct (field, value) +// pairs. 
+ndd::OperationResult<> +Filter::validate_filter_key_component(const std::string& component, + const std::string& context) { + if(component.find(':') != std::string::npos) { + return {1, context + " must not contain ':'"}; + } + return {SUCCESS, ""}; +} + +/** + * Converts a JSON number into the current sortable numeric filter encoding. + * All numeric filter values use one float32 sortable domain, including JSON + * integers, so 2 and 2.0 compare equal. Limitations: values are rounded to + * float precision before indexing/querying, distinct large integers can + * collapse to the same key, and strict comparisons use the next float32 + * representable value around the rounded query bound. float32 has 24 bits of + * integer precision (23 stored mantissa bits plus the hidden bit), so it + * represents every integer only up to 2^24 = 16,777,216; above that, not all + * consecutive integers are representable. Consecutive integers are also less + * dense in the float sortable bit domain than under int_to_sortable, so + * integer-heavy fields can create more numeric buckets and make wide range + * scans walk more bucket entries. Existing filter DBs that indexed integers + * with int_to_sortable must be rebuilt. + * + * Return codes: + * 0 = success + * 2 = value is not numeric or not finite in float32; caller should return HTTP 400 + */ +ndd::OperationResult Filter::sortable_from_json(const nlohmann::json& value, + const std::string& context) { + if(!value.is_number()) { + return {2, context + " must be a finite float32 number"}; + } + + float numeric_value = value.get(); + if(!std::isfinite(numeric_value)) { + LOG_WARN(1202, "Rejected numeric filter value outside finite float32 domain"); + return {2, context + " must be a finite float32 number"}; + } + if(numeric_value == 0.0f) { + numeric_value = 0.0f; + } + + return {SUCCESS, "", ndd::filter::float_to_sortable(numeric_value)}; +} + +/* + * Converts a JSON scalar into the category key value representation. 
+ * + * Return codes: + * 0 = success + * 2 = value is not a supported category scalar or is too long; caller should return HTTP 400 + */ +ndd::OperationResult Filter::category_value_from_json( + const nlohmann::json& value, + const std::string& context) { + std::string str_val; + if(value.is_string()) { + str_val = value.get(); + } else if(value.is_boolean()) { + str_val = value.get() ? "1" : "0"; + } else if(value.is_number_integer()) { + str_val = std::to_string(value.get()); + } else { + return {2, context + " must be string, integer, or boolean"}; + } + + if(str_val.size() > 255) { + return {2, context + " is too long"}; + } + auto delim_check = validate_filter_key_component(str_val, context); + if(!delim_check.ok()) { + return {delim_check.code, delim_check.message}; + } + return {SUCCESS, "", std::move(str_val)}; +} + +/* + * Resolves [$lt | $lte | $gt | $gte] on a JSON numeric value into a + * sortable [min, max] range usable against NumericIndex::range / check_range. + * A returned pair with min > max signals a provably-empty range + * (e.g. $gt the largest finite float32); callers must skip the lookup. 
+ * + * Return codes: + * 0 = success + * 2 = value is not a finite number, or operator is not a numeric comparison; + * caller should return HTTP 400 + */ +ndd::OperationResult> +Filter::numeric_bound_from_comparison(const std::string& op, const nlohmann::json& val) { + using Bound = std::pair; + constexpr uint32_t SORTABLE_MIN = 0x00000000u; + constexpr uint32_t SORTABLE_MAX = 0xFFFFFFFFu; + const Bound EMPTY{SORTABLE_MAX, SORTABLE_MIN}; + + if(!val.is_number()) { + return {2, op + " value must be a finite number"}; + } + float x = val.get(); + if(!std::isfinite(x)) { + LOG_WARN(1203, "Rejected numeric comparison bound outside finite float32 domain"); + return {2, op + " value must be a finite number"}; + } + if(x == 0.0f) { + x = 0.0f; + } + + if(op == "$gte") { + auto sortable_result = sortable_from_json(val, op + " value"); + if(!sortable_result.ok()) { + return {sortable_result.code, sortable_result.message}; + } + return {SUCCESS, "", Bound{sortable_result.value_or_throw(), SORTABLE_MAX}}; + } + if(op == "$lte") { + auto sortable_result = sortable_from_json(val, op + " value"); + if(!sortable_result.ok()) { + return {sortable_result.code, sortable_result.message}; + } + return {SUCCESS, "", Bound{SORTABLE_MIN, sortable_result.value_or_throw()}}; + } + if(op == "$gt") { + float next = std::nextafterf(x, std::numeric_limits::infinity()); + if(!std::isfinite(next)) { + return {SUCCESS, "", EMPTY}; + } + return {SUCCESS, "", Bound{ndd::filter::float_to_sortable(next), SORTABLE_MAX}}; + } + if(op == "$lt") { + float next = std::nextafterf(x, -std::numeric_limits::infinity()); + if(!std::isfinite(next)) { + return {SUCCESS, "", EMPTY}; + } + return {SUCCESS, "", Bound{SORTABLE_MIN, ndd::filter::float_to_sortable(next)}}; + } + + return {2, "Unsupported numeric comparison operator: " + op}; +} + +/* + * Persists the current in-memory filter schema cache. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX transaction, write, or commit failure; caller should log ERROR and return HTTP 500 + */ +ndd::OperationResult<> Filter::save_schema_internal() { + nlohmann::json schema_json; + for(const auto& [field, type] : schema_cache_) { + schema_json[field] = static_cast(type); + } + std::string json_str = schema_json.dump(); + + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to begin schema write transaction: " + + std::string(mdbx_strerror(rc))}; + } + + MDBX_val key{const_cast(SCHEMA_KEY), std::strlen(SCHEMA_KEY)}; + MDBX_val data{const_cast(json_str.c_str()), json_str.size()}; + + rc = mdbx_put(txn, dbi_, &key, &data, MDBX_UPSERT); + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + return {100, "Failed to persist filter schema: " + + std::string(mdbx_strerror(rc))}; + } + + rc = mdbx_txn_commit(txn); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to commit filter schema update: " + + std::string(mdbx_strerror(rc))}; + } + return {SUCCESS, ""}; +} + +/* + * Loads the persisted filter schema into the in-memory schema cache. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX transaction or read failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt schema JSON payload; caller should log ERROR and return HTTP 500 + */ +ndd::OperationResult<> Filter::load_schema() { + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to begin schema read transaction: " + + std::string(mdbx_strerror(rc))}; + } + + MDBX_val key{const_cast(SCHEMA_KEY), std::strlen(SCHEMA_KEY)}; + MDBX_val data; + rc = mdbx_get(txn, dbi_, &key, &data); + + if(rc == MDBX_NOTFOUND || (rc == MDBX_SUCCESS && data.iov_len == 0)) { + mdbx_txn_abort(txn); + return {SUCCESS, ""}; + } + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + return {100, "Failed to read filter schema: " + std::string(mdbx_strerror(rc))}; + } + + try { + std::string json_str(static_cast(data.iov_base), data.iov_len); + auto parsed = nlohmann::json::parse(json_str); + std::lock_guard lock(schema_mutex_); + schema_cache_.clear(); + for(auto& [field, stored_type] : parsed.items()) { + schema_cache_[field] = static_cast(stored_type.get()); + } + } catch(const std::exception& e) { + mdbx_txn_abort(txn); + return {200, "Failed to parse filter schema: " + std::string(e.what())}; + } + + mdbx_txn_abort(txn); + return {SUCCESS, ""}; +} + +/* + * Registers a field type in the filter schema if it is not already present. 
+ * + * Return codes: + * 0 = success + * 3 = field type mismatch with existing schema; caller should return HTTP 400 + * 100-199 = propagated MDBX/storage failure from schema persistence + */ +ndd::OperationResult<> Filter::register_field_type(const std::string& field, FieldType type) { + std::lock_guard lock(schema_mutex_); + auto it = schema_cache_.find(field); + if(it != schema_cache_.end()) { + if(it->second == type) { + return {SUCCESS, ""}; + } + return {3, "Filter field '" + field + "' has a different existing type"}; + } + + schema_cache_[field] = type; + auto save_result = save_schema_internal(); + if(!save_result.ok()) { + schema_cache_.erase(field); + return save_result; + } + return {SUCCESS, ""}; +} + +void Filter::init_environment() { + int rc = mdbx_env_create(&env_); + if(rc != MDBX_SUCCESS) { + throw std::runtime_error(std::string("Failed to create LMDB env for filters: ") + + mdbx_strerror(rc)); + } + + // max DBs to allow multiple databases (main + schema + numeric_forward + numeric_inverted) + rc = mdbx_env_set_maxdbs(env_, 10); + if(rc != MDBX_SUCCESS) { + throw std::runtime_error(std::string("Failed to configure max DBs for filters: ") + + mdbx_strerror(rc)); + } + + // Set geometry for auto-grow using the filter map size settings + rc = mdbx_env_set_geometry(env_, + -1, + 1ULL << settings::FILTER_MAP_SIZE_BITS, + 1ULL << settings::FILTER_MAP_SIZE_MAX_BITS, + 1ULL << settings::FILTER_MAP_SIZE_BITS, + -1, + -1); + if(rc != MDBX_SUCCESS) { + throw std::runtime_error(std::string("Failed to set geometry for filters: ") + + mdbx_strerror(rc)); + } + + rc = mdbx_env_open(env_, + path_.c_str(), + MDBX_WRITEMAP | MDBX_MAPASYNC | MDBX_NORDAHEAD, + 0664); + if(rc != MDBX_SUCCESS) { + throw std::runtime_error(std::string("Failed to open filter environment: ") + + mdbx_strerror(rc)); + } + + MDBX_txn* txn = nullptr; + rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); + if(rc != MDBX_SUCCESS) { + throw std::runtime_error(std::string("Failed to 
begin filter transaction: ") + + mdbx_strerror(rc)); + } + + rc = mdbx_dbi_open(txn, nullptr, MDBX_CREATE, &dbi_); + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + throw std::runtime_error(std::string("Failed to open filter database: ") + + mdbx_strerror(rc)); + } + + rc = mdbx_txn_commit(txn); + if(rc != MDBX_SUCCESS) { + throw std::runtime_error(std::string("Failed to commit filter transaction: ") + + mdbx_strerror(rc)); + } + + // Initialize Indices + numeric_index_ = std::make_unique(env_); + category_index_ = std::make_unique(env_); + + auto schema_result = load_schema(); + if(!schema_result.ok()) { + LOG_ERROR(1201, index_id_, schema_result.message); + throw std::runtime_error(schema_result.message); + } +} + +Filter::Filter(const std::string& path, const std::string& index_id) : + index_id_(index_id), + path_(path) { + std::filesystem::create_directories(path); + init_environment(); +} + +Filter::Filter(const std::string& path) : + Filter(path, "-/-") {} + +Filter::~Filter() { + mdbx_dbi_close(env_, dbi_); + mdbx_env_close(env_); +} + +/* + * Computes the bitmap for an AND filter query. 
+ * + * Return codes: + * 0 = success + * 1 = invalid filter query shape; caller should return HTTP 400 + * 2 = invalid operator or value for field type; caller should return HTTP 400 + * 100-199 = propagated MDBX/storage failure from category or numeric index + * 200-299 = propagated corruption/invariant failure from category or numeric index + */ +ndd::OperationResult +Filter::computeFilterBitmap(const nlohmann::json& filter_array) const { + if(!filter_array.is_array()) { + return {1, "Filter must be an array"}; + } + + if(filter_array.empty()) { + return {SUCCESS, "", ndd::RoaringBitmap()}; + } + + std::vector partial_results; + partial_results.reserve(filter_array.size()); + + for(const auto& condition : filter_array) { + if(!condition.is_object() || condition.size() != 1) { + return {1, "Each filter condition must be a single-field object"}; + } + + const auto& field = condition.begin().key(); + const auto& expr = condition.begin().value(); + if(field.empty()) { + return {1, "Filter field name cannot be empty"}; + } + auto field_check = validate_filter_key_component(field, "Filter field name"); + if(!field_check.ok()) { + return {field_check.code, field_check.message}; + } + if(!expr.is_object() || expr.size() != 1) { + return {1, "Filter operator must be a single-field object"}; + } + + // Check schema for field type + FieldType type = FieldType::Unknown; + { + std::lock_guard lock(schema_mutex_); + auto it = schema_cache_.find(field); + if(it != schema_cache_.end()) { + type = it->second; + } + } + + const std::string op = expr.begin().key(); + const auto& val = expr.begin().value(); + ndd::RoaringBitmap or_result; + + if(op == "$eq") { + if(type == FieldType::Number) { + auto sortable_result = sortable_from_json(val, "$eq value for numeric field"); + if(!sortable_result.ok()) { + return {sortable_result.code, sortable_result.message}; + } + auto range_result = + numeric_index_->range(field, sortable_result.value_or_throw(), 
sortable_result.value_or_throw()); + if(!range_result.ok()) { + return {range_result.code, range_result.message}; + } + or_result = std::move(range_result.value_or_throw()); + } else { + auto value_result = category_value_from_json(val, "$eq value"); + if(!value_result.ok()) { + return {value_result.code, value_result.message}; + } + auto bitmap_result = category_index_->get_bitmap_by_key( + format_filter_key(field, value_result.value_or_throw())); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + or_result = std::move(bitmap_result.value_or_throw()); + } + } else if(op == "$in") { + if(!val.is_array()) { + return {2, "$in must be an array"}; + } + + for(const auto& item : val) { + if(type == FieldType::Number) { + auto sortable_result = + sortable_from_json(item, "$in value for numeric field"); + if(!sortable_result.ok()) { + return {sortable_result.code, sortable_result.message}; + } + auto range_result = numeric_index_->range(field, + sortable_result.value_or_throw(), + sortable_result.value_or_throw()); + if(!range_result.ok()) { + return {range_result.code, range_result.message}; + } + or_result |= range_result.value_or_throw(); + } else { + auto value_result = category_value_from_json(item, "$in value"); + if(!value_result.ok()) { + return {value_result.code, value_result.message}; + } + if(!value_result.value_or_throw().empty()) { + auto bitmap_result = category_index_->get_bitmap_by_key( + format_filter_key(field, value_result.value_or_throw())); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + or_result |= bitmap_result.value_or_throw(); + } + } + } + } else if(op == "$range") { + if(!val.is_array() || val.size() != 2) { + return {2, "$range must be [start, end] with exactly 2 values"}; + } + if(type != FieldType::Number) { + return {2, "$range operator is only supported for numeric fields"}; + } + + auto start_result = sortable_from_json(val[0], "Range start"); + 
if(!start_result.ok()) { + return {start_result.code, start_result.message}; + } + auto end_result = sortable_from_json(val[1], "Range end"); + if(!end_result.ok()) { + return {end_result.code, end_result.message}; + } + if(start_result.value_or_throw() > end_result.value_or_throw()) { + return {2, "Invalid range: start > end"}; + } + + auto range_result = + numeric_index_->range(field, start_result.value_or_throw(), end_result.value_or_throw()); + if(!range_result.ok()) { + return {range_result.code, range_result.message}; + } + or_result = std::move(range_result.value_or_throw()); + } else if(op == "$lt" || op == "$lte" || op == "$gt" || op == "$gte") { + if(type != FieldType::Number) { + return {2, op + " operator is only supported for numeric fields"}; + } + auto bound_result = numeric_bound_from_comparison(op, val); + if(!bound_result.ok()) { + return {bound_result.code, bound_result.message}; + } + auto [min_val, max_val] = bound_result.value_or_throw(); + if(min_val <= max_val) { + auto range_result = numeric_index_->range(field, min_val, max_val); + if(!range_result.ok()) { + return {range_result.code, range_result.message}; + } + or_result = std::move(range_result.value_or_throw()); + } + } else { + return {2, "Unsupported filter operator: " + op}; + } + + partial_results.push_back(std::move(or_result)); + } + + // Optimization: Sort by cardinality (smallest first) + std::sort(partial_results.begin(), + partial_results.end(), + [](const ndd::RoaringBitmap& left, const ndd::RoaringBitmap& right) { + return left.cardinality() < right.cardinality(); + }); + + if(partial_results.empty()) { + return {SUCCESS, "", ndd::RoaringBitmap()}; + } + + ndd::RoaringBitmap final_result = partial_results[0]; + for(size_t i = 1; i < partial_results.size(); ++i) { + final_result &= partial_results[i]; + + // If result becomes empty, stop early + if(final_result.isEmpty()) { + return {SUCCESS, "", std::move(final_result)}; + } + } + + return {SUCCESS, "", 
std::move(final_result)}; +} + +/** + * Returns numeric ids matching a filter query based on the provided JSON filter array + * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from bitmap computation + * 100-199 = propagated MDBX/storage failure from bitmap computation + * 200-299 = propagated corruption/invariant failure from bitmap computation + */ +ndd::OperationResult> +Filter::getIdsMatchingFilter(const nlohmann::json& filter_array) const { + auto bitmap_result = computeFilterBitmap(filter_array); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + + std::vector ids; + ids.reserve(bitmap_result.value_or_throw().cardinality()); + bitmap_result.value_or_throw().iterate( + [](ndd::idInt val, void* ptr) { + static_cast*>(ptr)->push_back(val); + return true; + }, + &ids); + return {SUCCESS, "", std::move(ids)}; +} + +/* + * Counts numeric ids matching a filter query. + * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from bitmap computation + * 100-199 = propagated MDBX/storage failure from bitmap computation + * 200-299 = propagated corruption/invariant failure from bitmap computation + */ +ndd::OperationResult Filter::countIdsMatchingFilter( + const nlohmann::json& filter_array) const { + auto bitmap_result = computeFilterBitmap(filter_array); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + return {SUCCESS, "", bitmap_result.value_or_throw().cardinality()}; +} + +/* + * Adds one id to a category filter. 
+ * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ +ndd::OperationResult<> +Filter::add_to_filter(const std::string& field, + const std::string& value, + ndd::idInt numeric_id) { + auto field_check = validate_filter_key_component(field, "Filter field name"); + if(!field_check.ok()) { + return field_check; + } + auto value_check = validate_filter_key_component(value, "Filter value"); + if(!value_check.ok()) { + return value_check; + } + return category_index_->add(field, value, numeric_id); +} + +/* + * Adds a batch of ids to one already formatted category filter key. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ +ndd::OperationResult<> Filter::add_to_filter_batch( + const std::string& filter_key, + const std::vector& numeric_ids) { + if(numeric_ids.empty()) { + return {SUCCESS, ""}; + } + return category_index_->add_batch_by_key(filter_key, numeric_ids); +} + +/* + * Adds one batch of filter JSON documents into the numeric and category indexes. 
+ * + * Return codes: + * 0 = success + * 1 = invalid filter JSON or field shape; caller should return HTTP 400 + * 2 = unsupported filter field type or category value too long; caller should return HTTP 400 + * 3 = field type mismatch with existing schema; caller should return HTTP 400 + * 100-199 = propagated MDBX/storage failure from schema, numeric, or category writes + * 200-299 = propagated corruption/invariant failure from numeric or category writes + */ +ndd::OperationResult<> Filter::add_filters_from_json_batch( + const std::vector>& id_filter_pairs) { + if(id_filter_pairs.empty()) { + return {SUCCESS, ""}; + } + + // Create a map to collect IDs for each label filter + std::unordered_map> label_filter_to_ids; + label_filter_to_ids.reserve(id_filter_pairs.size()); + std::vector numeric_filter_entries; + numeric_filter_entries.reserve(id_filter_pairs.size()); + + // Group IDs by filter + for(const auto& [numeric_id, filter_json] : id_filter_pairs) { + nlohmann::json parsed; + try { + parsed = nlohmann::json::parse(filter_json); + } catch(const std::exception& e) { + return {1, "Invalid filter JSON: " + std::string(e.what())}; + } + + if(!parsed.is_object()) { + return {1, "Filter JSON document must be an object"}; + } + + for(const auto& [field, value] : parsed.items()) { + if(field.empty()) { + return {1, "Filter field name cannot be empty"}; + } + auto field_check = validate_filter_key_component(field, "Filter field name"); + if(!field_check.ok()) { + return {field_check.code, field_check.message}; + } + + FieldType type = FieldType::Unknown; + if(value.is_boolean()) { + type = FieldType::Bool; + } else if(value.is_number()) { + type = FieldType::Number; + } else if(value.is_string()) { + type = FieldType::String; + } + + if(type == FieldType::Unknown) { + return {2, "Unsupported filter type for field '" + field + "'"}; + } + + auto register_result = register_field_type(field, type); + if(!register_result.ok()) { + return register_result; + } + + if(type 
== FieldType::String) { + auto category_result = category_value_from_json(value, "Filter value"); + if(!category_result.ok()) { + return {category_result.code, + category_result.message + " for field '" + field + "'"}; + } + label_filter_to_ids[format_filter_key(field, category_result.value_or_throw())] + .emplace_back(numeric_id); + } else if(type == FieldType::Bool) { + label_filter_to_ids[format_filter_key(field, value.get() ? "1" : "0")] + .emplace_back(numeric_id); + } else if(type == FieldType::Number) { + auto sortable_result = sortable_from_json(value, "Numeric filter value"); + if(!sortable_result.ok()) { + return {sortable_result.code, + sortable_result.message + " for field '" + field + "'"}; + } + numeric_filter_entries.emplace_back(field, numeric_id, sortable_result.value_or_throw()); + } + } + } + + /** + * XXX: For transactional correctness of filter adds, all the filters + * should be added in a single transaction. + * For now, they are being added in two different transactions. + * one for numeric_index and other for labels. + */ + + if(!numeric_filter_entries.empty()) { + auto numeric_result = numeric_index_->put_batch(numeric_filter_entries); + if(!numeric_result.ok()) { + return numeric_result; + } + } + + // Process each filter with its batch of IDs + for(const auto& [filter_key, ids] : label_filter_to_ids) { + auto add_result = add_to_filter_batch(filter_key, ids); + if(!add_result.ok()) { + return add_result; + } + } + + return {SUCCESS, ""}; +} + +/* + * Removes one id from a category filter. 
+ * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ +ndd::OperationResult<> +Filter::remove_from_filter(const std::string& field, + const std::string& value, + ndd::idInt numeric_id) { + auto field_check = validate_filter_key_component(field, "Filter field name"); + if(!field_check.ok()) { + return field_check; + } + auto value_check = validate_filter_key_component(value, "Filter value"); + if(!value_check.ok()) { + return value_check; + } + return category_index_->remove(field, value, numeric_id); +} + +/* + * Checks whether one id is present in a category filter. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ +ndd::OperationResult +Filter::contains(const std::string& field, + const std::string& value, + ndd::idInt numeric_id) const { + auto field_check = validate_filter_key_component(field, "Filter field name"); + if(!field_check.ok()) { + return {field_check.code, field_check.message}; + } + auto value_check = validate_filter_key_component(value, "Filter value"); + if(!value_check.ok()) { + return {value_check.code, value_check.message}; + } + return category_index_->contains(field, value, numeric_id); +} + +/* + * Adds one filter JSON document into the numeric and category indexes. + * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from batch add + * 100-199 = propagated MDBX/storage failure from batch add + * 200-299 = propagated corruption/invariant failure from batch add + */ +ndd::OperationResult<> Filter::add_filters_from_json(ndd::idInt numeric_id, + const std::string& filter_json) { + return add_filters_from_json_batch({{numeric_id, filter_json}}); +} + +/* + * Removes one filter JSON document from the numeric and category indexes. 
+ * + * Return codes: + * 0 = success + * 1 = invalid filter JSON or field shape; caller should return HTTP 400 + * 2 = unsupported filter field type; caller should return HTTP 400 + * 100-199 = propagated MDBX/storage failure from numeric or category index + * 200-299 = propagated corruption/invariant failure from numeric or category index + */ +ndd::OperationResult<> Filter::remove_filters_from_json(ndd::idInt numeric_id, + const std::string& filter_json) { + nlohmann::json parsed; + try { + parsed = nlohmann::json::parse(filter_json); + } catch(const std::exception& e) { + return {1, "Invalid filter JSON while removing filters: " + std::string(e.what())}; + } + + if(!parsed.is_object()) { + return {1, "Filter JSON document must be an object"}; + } + + for(const auto& [field, value] : parsed.items()) { + if(field.empty()) { + return {1, "Filter field name cannot be empty"}; + } + auto field_check = validate_filter_key_component(field, "Filter field name"); + if(!field_check.ok()) { + return {field_check.code, field_check.message}; + } + + ndd::OperationResult<> remove_result{SUCCESS, ""}; + if(value.is_string()) { + auto category_result = category_value_from_json(value, "Filter value"); + if(!category_result.ok()) { + return {category_result.code, + category_result.message + " for field '" + field + "'"}; + } + remove_result = remove_from_filter(field, category_result.value_or_throw(), numeric_id); + } else if(value.is_number()) { + // Remove from Numeric Index + remove_result = numeric_index_->remove(field, numeric_id); + } else if(value.is_boolean()) { + remove_result = remove_from_filter(field, + value.get() ? "1" : "0", + numeric_id); + } else { + return {2, "Unsupported filter type for field '" + field + "'"}; + } + + if(!remove_result.ok()) { + return remove_result; + } + } + + return {SUCCESS, ""}; +} + +/* + * Combines category filters with AND semantics. 
+ * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ +ndd::OperationResult Filter::combine_filters_and( + const std::vector>& filters) const { + ndd::RoaringBitmap result; + bool first = true; + for(const auto& [field, value] : filters) { + auto bitmap_result = category_index_->get_bitmap(field, value); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + if(first) { + result = std::move(bitmap_result.value_or_throw()); + first = false; + } else { + result &= bitmap_result.value_or_throw(); + } + } + return {SUCCESS, "", std::move(result)}; +} + +/* + * Combines category filters with OR semantics. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ +ndd::OperationResult Filter::combine_filters_or( + const std::vector>& filters) const { + ndd::RoaringBitmap result; + for(const auto& [field, value] : filters) { + auto bitmap_result = category_index_->get_bitmap(field, value); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + result |= bitmap_result.value_or_throw(); + } + return {SUCCESS, "", std::move(result)}; +} + +/* + * Checks whether one id satisfies one numeric filter expression. 
+ * + * Return codes: + * 0 = success + * 2 = invalid numeric operator or value; caller should return HTTP 400 + * 100-199 = propagated MDBX/storage failure from numeric index + * 200-299 = propagated corruption/invariant failure from numeric index + */ +ndd::OperationResult Filter::check_numeric(const std::string& field, + ndd::idInt id, + const std::string& op, + const nlohmann::json& val) const { + if(op == "$eq") { + auto sortable_result = sortable_from_json(val, "$eq value for numeric field"); + if(!sortable_result.ok()) { + return {sortable_result.code, sortable_result.message}; + } + return numeric_index_->check_range(field, + id, + sortable_result.value_or_throw(), + sortable_result.value_or_throw()); + } + + if(op == "$in") { + if(!val.is_array()) { + return {2, "$in must be an array"}; + } + for(const auto& item : val) { + auto sortable_result = sortable_from_json(item, "$in value for numeric field"); + if(!sortable_result.ok()) { + return {sortable_result.code, sortable_result.message}; + } + + auto check_result = numeric_index_->check_range(field, + id, + sortable_result.value_or_throw(), + sortable_result.value_or_throw()); + if(!check_result.ok()) { + return check_result; + } + if(check_result.value_or_throw()) { + return {SUCCESS, "", true}; + } + } + return {SUCCESS, "", false}; + } + + if(op == "$range") { + if(!val.is_array() || val.size() != 2) { + return {2, "$range must be [start, end] with exactly 2 values"}; + } + + auto start_result = sortable_from_json(val[0], "Range start"); + if(!start_result.ok()) { + return {start_result.code, start_result.message}; + } + auto end_result = sortable_from_json(val[1], "Range end"); + if(!end_result.ok()) { + return {end_result.code, end_result.message}; + } + if(start_result.value_or_throw() > end_result.value_or_throw()) { + return {2, "Invalid range: start > end"}; + } + + return numeric_index_->check_range(field, id, start_result.value_or_throw(), end_result.value_or_throw()); + } + + if(op == "$lt" || 
op == "$lte" || op == "$gt" || op == "$gte") { + auto bound_result = numeric_bound_from_comparison(op, val); + if(!bound_result.ok()) { + return {bound_result.code, bound_result.message}; + } + auto [min_val, max_val] = bound_result.value_or_throw(); + if(min_val > max_val) { + return {SUCCESS, "", false}; + } + return numeric_index_->check_range(field, id, min_val, max_val); + } + + return {2, "Unsupported numeric operator: " + op}; +} diff --git a/src/filter/filter.hpp b/src/filter/filter.hpp index 392fe2b404..f834b6cdb2 100644 --- a/src/filter/filter.hpp +++ b/src/filter/filter.hpp @@ -1,47 +1,45 @@ #pragma once // System includes -#include +#include #include -#include -#include -#include -#include -#include +#include +#include #include +#include #include #include "json/nlohmann_json.hpp" -#include "../utils/settings.hpp" #include "mdbx/mdbx.h" -#include "../utils/log.hpp" #include "../core/types.hpp" -#include "../hnsw/hnswlib.h" // For BaseFilterFunctor +#include "../hnsw/hnswlib.h" +#include "../utils/types.hpp" -#include "numeric_index.hpp" #include "category_index.hpp" +#include "numeric_index.hpp" enum class FieldType : uint8_t { Unknown = 0, String = 1, - Number = 2, // Unified Integer and Float + Number = 2, // Unified Integer and Float Bool = 4 }; // Filter Functor for HNSW class BitMapFilterFunctor : public hnswlib::BaseFilterFunctor { const ndd::RoaringBitmap& bitmap_; + public: - BitMapFilterFunctor(const ndd::RoaringBitmap& bitmap) : bitmap_(bitmap) {} - bool operator()(ndd::idInt id) override { - return bitmap_.contains(id); - } + BitMapFilterFunctor(const ndd::RoaringBitmap& bitmap); + + bool operator()(ndd::idInt id) override; }; class Filter { private: MDBX_env* env_; - MDBX_dbi dbi_; // Used for schema storage + // Used for schema storage + MDBX_dbi dbi_; std::string index_id_; std::string path_; std::unique_ptr numeric_index_; @@ -51,569 +49,256 @@ class Filter { std::unordered_map schema_cache_; mutable std::mutex schema_mutex_; - void 
load_schema() { - MDBX_txn* txn; - int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn); - if(rc != MDBX_SUCCESS) { - LOG_ERROR( - 1210, index_id_, "Failed to begin schema read transaction: " << mdbx_strerror(rc)); - return; - } - - MDBX_val key{const_cast(SCHEMA_KEY), strlen(SCHEMA_KEY)}; - MDBX_val data; - rc = mdbx_get(txn, dbi_, &key, &data); - - if(rc == MDBX_SUCCESS && data.iov_len > 0) { - try { - std::string json_str(static_cast(data.iov_base), data.iov_len); - auto j = nlohmann::json::parse(json_str); - std::lock_guard lock(schema_mutex_); - for(auto& [k, v] : j.items()) { - schema_cache_[k] = static_cast(v.get()); - } - } catch(...) { - LOG_ERROR(1201, index_id_, "Failed to load filter schema"); - } - } - mdbx_txn_abort(txn); - } - - void save_schema_internal() { - nlohmann::json j; - for(const auto& [k, v] : schema_cache_) { - j[k] = static_cast(v); - } - std::string json_str = j.dump(); - - MDBX_txn* txn; - int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); - if(rc != MDBX_SUCCESS) { - LOG_ERROR( - 1208, index_id_, "Failed to begin schema write transaction: " << mdbx_strerror(rc)); - return; - } - - MDBX_val key{const_cast(SCHEMA_KEY), strlen(SCHEMA_KEY)}; - MDBX_val data{const_cast(json_str.c_str()), json_str.size()}; - - rc = mdbx_put(txn, dbi_, &key, &data, MDBX_UPSERT); - if(rc == MDBX_SUCCESS) { - rc = mdbx_txn_commit(txn); - if(rc != MDBX_SUCCESS) { - LOG_ERROR( - 1209, index_id_, "Failed to commit filter schema update: " << mdbx_strerror(rc)); - } - } else { - mdbx_txn_abort(txn); - LOG_ERROR(1211, index_id_, "Failed to persist filter schema: " << mdbx_strerror(rc)); - } - } - - bool register_field_type(const std::string& field, FieldType type) { - std::lock_guard lock(schema_mutex_); - auto it = schema_cache_.find(field); - if(it != schema_cache_.end()) { - return it->second == type; - } - - schema_cache_[field] = type; - save_schema_internal(); - return true; - } - - void init_environment() { - int rc = 
mdbx_env_create(&env_); - if(rc != 0) { - throw std::runtime_error(std::string("Failed to create LMDB env for filters: ") + mdbx_strerror(rc)); - } - // max DBs to allow multiple databases (main + schema + numeric_forward + numeric_inverted) - mdbx_env_set_maxdbs(env_, 10); - - // Set geometry for auto-grow using the filter map size settings - rc = mdbx_env_set_geometry( - env_, - -1, // lower size bound (use default) - 1ULL << settings::FILTER_MAP_SIZE_BITS, // current/now size - 1ULL << settings::FILTER_MAP_SIZE_MAX_BITS, // upper size bound - 1ULL << settings::FILTER_MAP_SIZE_BITS, // growth step - -1, // shrink threshold (use default) - -1); // pagesize (use default) - if(rc != MDBX_SUCCESS) { - throw std::runtime_error(std::string("Failed to set geometry for filters: ") + mdbx_strerror(rc)); - } - - rc = mdbx_env_open( - env_, path_.c_str(), MDBX_WRITEMAP | MDBX_MAPASYNC | MDBX_NORDAHEAD, 0664); - if(rc != 0) { - throw std::runtime_error(std::string("Failed to open filter environment: ") + mdbx_strerror(rc)); - } - - MDBX_txn* txn; - rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); - if(rc != 0) { - throw std::runtime_error(std::string("Failed to begin filter transaction: ") + mdbx_strerror(rc)); - } - - rc = mdbx_dbi_open(txn, nullptr, MDBX_CREATE, &dbi_); - if(rc != 0) { - mdbx_txn_abort(txn); - throw std::runtime_error(std::string("Failed to open filter database: ") + mdbx_strerror(rc)); - } - rc = mdbx_txn_commit(txn); - if(rc != 0) { - throw std::runtime_error(std::string("Failed to commit filter transaction: ") + mdbx_strerror(rc)); - } - - // Initialize Indices - numeric_index_ = std::make_unique(env_); - category_index_ = std::make_unique(env_); - - load_schema(); - } - - static std::string format_filter_key(const std::string& field, const std::string& value) { - return field + ":" + value; - } + /* + * Loads the persisted filter schema into the in-memory schema cache. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX transaction or read failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt schema JSON payload; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult<> load_schema(); + + /* + * Persists the current in-memory filter schema cache. + * + * Return codes: + * 0 = success + * 100 = MDBX transaction, write, or commit failure; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult<> save_schema_internal(); + + /* + * Registers a field type in the filter schema if it is not already present. + * + * Return codes: + * 0 = success + * 3 = field type mismatch with existing schema; caller should return HTTP 400 + * 100-199 = propagated MDBX/storage failure from schema persistence + */ + ndd::OperationResult<> register_field_type(const std::string& field, FieldType type); + + /** + * Converts a JSON number into the current sortable numeric filter encoding. + * All numeric filter values use one float32 sortable domain, including JSON + * integers, so 2 and 2.0 compare equal. Limitations: values are rounded to + * float precision before indexing/querying, distinct large integers can + * collapse to the same key, and strict comparisons use the next float32 + * representable value around the rounded query bound. float32 has 24 bits + * of integer precision (23 stored mantissa bits plus the hidden bit), so it + * represents every integer only up to 2^24 = 16,777,216; above that, not all + * consecutive integers are representable. Consecutive integers are also less + * dense in the float sortable bit domain than under int_to_sortable, so + * integer-heavy fields can create more numeric buckets and make wide range + * scans walk more bucket entries. Existing filter DBs that indexed integers + * with int_to_sortable must be rebuilt. 
+ * + * Return codes: + * 0 = success + * 2 = value is not numeric or not finite in float32; caller should return HTTP 400 + */ + static ndd::OperationResult sortable_from_json(const nlohmann::json& value, + const std::string& context); + + /* + * Converts a JSON scalar into the category key value representation. + * + * Return codes: + * 0 = success + * 2 = value is not a supported category scalar or is too long; caller should return HTTP 400 + */ + static ndd::OperationResult category_value_from_json( + const nlohmann::json& value, + const std::string& context); + + // Rejects ':' because it is the MDBX key delimiter for category and numeric + // indexes (see format_filter_key, NumericIndex::make_*_key). Allowing ':' in + // user input causes byte-level key collisions across distinct (field, value) + // pairs. + static ndd::OperationResult<> + validate_filter_key_component(const std::string& component, + const std::string& context); + + static std::string format_filter_key(const std::string& field, const std::string& value); + + /* + * Resolves [$lt | $lte | $gt | $gte] on a JSON numeric value into a + * sortable [min, max] range usable against NumericIndex::range / check_range. + * A returned pair with min > max signals a provably-empty range + * (e.g. $gt the largest finite float32); callers must skip the lookup. 
+ * + * Return codes: + * 0 = success + * 2 = value is not a finite number, or operator is not a numeric comparison; + * caller should return HTTP 400 + */ + static ndd::OperationResult> + numeric_bound_from_comparison(const std::string& op, const nlohmann::json& val); + + void init_environment(); public: - Filter(const std::string& path, const std::string& index_id) : - index_id_(index_id), - path_(path) { - std::filesystem::create_directories(path); - init_environment(); - } - - ~Filter() { - mdbx_dbi_close(env_, dbi_); - mdbx_env_close(env_); - } - - // Compute the filter bitmap based on the provided JSON filter array - ndd::RoaringBitmap computeFilterBitmap(const nlohmann::json& filter_array) const { - if(!filter_array.is_array()) { - throw std::runtime_error("Filter must be an array"); - } - - if(filter_array.empty()) { - LOG_DEBUG("Empty filter array, returning empty bitmap"); - return ndd::RoaringBitmap(); - } - - std::vector partial_results; - partial_results.reserve(filter_array.size()); - - for(const auto& condition : filter_array) { - if(!condition.is_object() || condition.size() != 1) { - throw std::runtime_error("Each condition must be a single-field object"); - } - - const auto& field = condition.begin().key(); - const auto& expr = condition.begin().value(); - - if(field.empty()) { - throw std::runtime_error("Filter field name cannot be empty"); - } - - // Check schema for field type - FieldType type = FieldType::Unknown; - { - std::lock_guard lock(schema_mutex_); - auto it = schema_cache_.find(field); - if(it != schema_cache_.end()) { - type = it->second; - } - } - - ndd::RoaringBitmap or_result; - - if(!expr.is_object() || expr.size() != 1) { - throw std::runtime_error("Operator must be a single-field object"); - } - - const std::string op = expr.begin().key(); - const auto& val = expr.begin().value(); - - if(op == "$eq") { - if(type == FieldType::Number) { - uint32_t sortable_val; - if(val.is_number_integer()) { - sortable_val = 
ndd::filter::int_to_sortable(val.get()); - } else if(val.is_number()) { - sortable_val = ndd::filter::float_to_sortable(val.get()); - } else { - throw std::runtime_error("$eq value for numeric field must be a number"); - } - or_result = numeric_index_->range(field, sortable_val, sortable_val); - } else { - if(!val.is_string() && !val.is_number_integer() && !val.is_boolean()) { - throw std::runtime_error("$eq value must be string, integer or boolean"); - } - std::string str_val; - if(val.is_string()) { - str_val = val.get(); - } else if(val.is_boolean()) { - str_val = val.get() ? "1" : "0"; - } else { - str_val = std::to_string(val.get()); - if (str_val.size() > 255) throw std::runtime_error("Category value too long"); - } - std::string key = format_filter_key(field, str_val); - or_result = category_index_->get_bitmap_by_key(key); - } - } else if(op == "$in") { - if(!val.is_array()) { - throw std::runtime_error("$in must be array"); - } - if(val.empty()) { - LOG_DEBUG("Empty $in array for field: " << field); - } else { - for(const auto& v : val) { - if(type == FieldType::Number) { - uint32_t sortable_val; - if(v.is_number_integer()) { - sortable_val = ndd::filter::int_to_sortable(v.get()); - } else if(v.is_number()) { - sortable_val = ndd::filter::float_to_sortable(v.get()); - } else { - throw std::runtime_error( - "$in value for numeric field must be a number"); - } - or_result |= numeric_index_->range(field, sortable_val, sortable_val); - } else { - if(!v.is_string() && !v.is_number_integer() && !v.is_boolean()) { - throw std::runtime_error( - "$in values must be string, integer or boolean"); - } - std::string str_val; - if(v.is_string()) { - str_val = v.get(); - } else if(v.is_boolean()) { - str_val = v.get() ? 
"1" : "0"; - } else { - str_val = std::to_string(v.get()); - } - if(!str_val.empty()) { - if (str_val.size() > 255) throw std::runtime_error("Category value too long"); - std::string key = format_filter_key(field, str_val); - or_result |= category_index_->get_bitmap_by_key(key); - } - } - } - } - } else if(op == "$range") { - if(!val.is_array() || val.size() != 2) { - throw std::runtime_error( - "$range must be [start, end] array with exactly 2 elements"); - } - - if(type == FieldType::Number) { - uint32_t start_val, end_val; - - if(val[0].is_number_integer()) { - start_val = ndd::filter::int_to_sortable(val[0].get()); - } else if(val[0].is_number()) { - start_val = ndd::filter::float_to_sortable(val[0].get()); - } else { - throw std::runtime_error("Range start must be a number"); - } - - if(val[1].is_number_integer()) { - end_val = ndd::filter::int_to_sortable(val[1].get()); - } else if(val[1].is_number()) { - end_val = ndd::filter::float_to_sortable(val[1].get()); - } else { - throw std::runtime_error("Range end must be a number"); - } - - if(start_val > end_val) { - throw std::runtime_error("Invalid range: start > end"); - } - - or_result = numeric_index_->range(field, start_val, end_val); - } else { - throw std::runtime_error( - "$range operator is only supported for numeric fields"); - } - } else { - throw std::runtime_error("Unsupported operator: " + op); - } - - partial_results.push_back(std::move(or_result)); - } - - // Optimization: Sort by cardinality (smallest first) - std::sort(partial_results.begin(), partial_results.end(), - [](const ndd::RoaringBitmap& a, const ndd::RoaringBitmap& b) { - return a.cardinality() < b.cardinality(); - }); - - if (partial_results.empty()) return ndd::RoaringBitmap(); - - ndd::RoaringBitmap final_result = partial_results[0]; - for(size_t i = 1; i < partial_results.size(); ++i) { - final_result &= partial_results[i]; - // If result becomes empty, stop early - if(final_result.isEmpty()) return final_result; - } - - return 
final_result; - } - - // Get IDs matching the filter using the provided JSON filter array - std::vector getIdsMatchingFilter(const nlohmann::json& filter_array) const { - auto result = computeFilterBitmap(filter_array); - std::vector ids; - ids.reserve(result.cardinality()); - result.iterate( - [](ndd::idInt val, void* ptr) { - static_cast*>(ptr)->push_back(val); - return true; - }, - &ids); - return ids; - } - - // Count the number of IDs matching the filter using the provided JSON filter array - size_t countIdsMatchingFilter(const nlohmann::json& filter_array) const { - return computeFilterBitmap(filter_array).cardinality(); - } - - void add_to_filter(const std::string& field, const std::string& value, ndd::idInt numeric_id) { - category_index_->add(field, value, numeric_id); - } - - // Batch add operation for filters - void add_to_filter_batch(const std::string& filter_key, - const std::vector& numeric_ids) { - if(numeric_ids.empty()) { - return; - } - category_index_->add_batch_by_key(filter_key, numeric_ids); - } - - // Optimized version to process filter JSON in batch - void add_filters_from_json_batch( - const std::vector>& id_filter_pairs) { - if(id_filter_pairs.empty()) { - return; - } - - // Create a map to collect IDs for each filter - std::unordered_map> filter_to_ids; - - // Group IDs by filter - for(const auto& [numeric_id, filter_json] : id_filter_pairs) { - try { - auto j = nlohmann::json::parse(filter_json); - for(const auto& [field, value] : j.items()) { - FieldType type = FieldType::Unknown; - if(value.is_boolean()) { - type = FieldType::Bool; - } else if(value.is_number()) { - type = FieldType::Number; // Unified check - } else if(value.is_string()) { - type = FieldType::String; - } - - if(type == FieldType::Unknown) { - LOG_DEBUG("Unsupported filter type for field '" << field << "'"); - continue; - } - - if(!register_field_type(field, type)) { - LOG_ERROR(1202, index_id_, "Type mismatch for field '" << field << "'"); - continue; - } - - 
if(value.is_string()) { - std::string filter_key = format_filter_key(field, value.get()); - filter_to_ids[filter_key].push_back(numeric_id); - } else if(value.is_number()) { - // Use Numeric Index for numbers - uint32_t sortable_val; - if(value.is_number_integer()) { - sortable_val = ndd::filter::int_to_sortable(value.get()); - } else { - sortable_val = ndd::filter::float_to_sortable(value.get()); - } - numeric_index_->put(field, numeric_id, sortable_val); - } else if(value.is_boolean()) { - std::string filter_key = - format_filter_key(field, value.get() ? "1" : "0"); - filter_to_ids[filter_key].push_back(numeric_id); - } else { - LOG_WARN(1203, - index_id_, - "Unsupported filter type for field '" << field - << "' in filter: " - << value.dump()); - } - } - } catch(const std::exception& e) { - LOG_ERROR(1204, index_id_, "Error parsing filter JSON: " << e.what()); - } - } - - // Process each filter with its batch of IDs - for(const auto& [filter_key, ids] : filter_to_ids) { - add_to_filter_batch(filter_key, ids); - } - } - - void - remove_from_filter(const std::string& field, const std::string& value, ndd::idInt numeric_id) { - category_index_->remove(field, value, numeric_id); - } - - bool contains(const std::string& field, const std::string& value, ndd::idInt numeric_id) const { - return category_index_->contains(field, value, numeric_id); - } - - void add_filters_from_json(ndd::idInt numeric_id, const std::string& filter_json) { - try { - auto j = nlohmann::json::parse(filter_json); - for(const auto& [field, value] : j.items()) { - FieldType type = FieldType::Unknown; - if(value.is_boolean()) { - type = FieldType::Bool; - } else if(value.is_number()) { - type = FieldType::Number; - } else if(value.is_string()) { - type = FieldType::String; - } - - if(type == FieldType::Unknown) { - LOG_DEBUG("Unsupported filter type for field '" << field << "'"); - continue; - } - - if(!register_field_type(field, type)) { - LOG_ERROR(1205, index_id_, "Type mismatch for field '" << 
field << "'"); - continue; - } - - if(value.is_string()) { - add_to_filter(field, value.get(), numeric_id); - } else if(value.is_number()) { - uint32_t sortable_val; - if(value.is_number_integer()) { - sortable_val = ndd::filter::int_to_sortable(value.get()); - } else { - sortable_val = ndd::filter::float_to_sortable(value.get()); - } - numeric_index_->put(field, numeric_id, sortable_val); - } else if(value.is_boolean()) { - add_to_filter(field, value.get() ? "1" : "0", numeric_id); - } - } - } catch(const std::exception& e) { - LOG_ERROR(1206, index_id_, "Error adding filters: " << e.what()); - } - } - - void remove_filters_from_json(ndd::idInt numeric_id, const std::string& filter_json) { - try { - auto j = nlohmann::json::parse(filter_json); - for(const auto& [field, value] : j.items()) { - if(value.is_string()) { - remove_from_filter(field, value.get(), numeric_id); - } else if(value.is_number()) { - // Remove from Numeric Index - numeric_index_->remove(field, numeric_id); - } else if(value.is_boolean()) { - remove_from_filter(field, value.get() ? 
"1" : "0", numeric_id); - } - } - } catch(const std::exception& e) { - LOG_ERROR(1207, index_id_, "Error removing filters: " << e.what()); - } - } - - // Combine multiple filters using AND operation - ndd::RoaringBitmap - combine_filters_and(const std::vector>& filters) const { - ndd::RoaringBitmap result; - bool first = true; - for(const auto& [field, value] : filters) { - if(first) { - result = category_index_->get_bitmap(field, value); - first = false; - } else { - result &= category_index_->get_bitmap(field, value); - } - } - return result; - } - - // Combine multiple filters using OR operation - ndd::RoaringBitmap - combine_filters_or(const std::vector>& filters) const { - ndd::RoaringBitmap result; - for(const auto& [field, value] : filters) { - result |= category_index_->get_bitmap(field, value); - } - return result; - } - - // Check if ID satisfies a numeric condition using Forward Index - bool check_numeric(const std::string& field, - ndd::idInt id, - const std::string& op, - const nlohmann::json& val) const { - if(op == "$eq") { - uint32_t sortable_val; - if(val.is_number_integer()) { - sortable_val = ndd::filter::int_to_sortable(val.get()); - } else if(val.is_number()) { - sortable_val = ndd::filter::float_to_sortable(val.get()); - } else { - return false; - } - return numeric_index_->check_range(field, id, sortable_val, sortable_val); - } else if(op == "$in") { - if(!val.is_array()) { - return false; - } - for(const auto& v : val) { - uint32_t sortable_val; - if(v.is_number_integer()) { - sortable_val = ndd::filter::int_to_sortable(v.get()); - } else if(v.is_number()) { - sortable_val = ndd::filter::float_to_sortable(v.get()); - } else { - continue; - } - - if(numeric_index_->check_range(field, id, sortable_val, sortable_val)) { - return true; - } - } - return false; - } else if(op == "$range") { - if(!val.is_array() || val.size() != 2) { - return false; - } - uint32_t start_val, end_val; - - if(val[0].is_number_integer()) { - start_val = 
ndd::filter::int_to_sortable(val[0].get()); - } else if(val[0].is_number()) { - start_val = ndd::filter::float_to_sortable(val[0].get()); - } else { - return false; - } - - if(val[1].is_number_integer()) { - end_val = ndd::filter::int_to_sortable(val[1].get()); - } else if(val[1].is_number()) { - end_val = ndd::filter::float_to_sortable(val[1].get()); - } else { - return false; - } - - return numeric_index_->check_range(field, id, start_val, end_val); - } - return false; - } + Filter(const std::string& path, const std::string& index_id); + + Filter(const std::string& path); + + ~Filter(); + + /* + * Computes the bitmap for an AND filter query. + * + * Return codes: + * 0 = success + * 1 = invalid filter query shape; caller should return HTTP 400 + * 2 = invalid operator or value for field type; caller should return HTTP 400 + * 100-199 = propagated MDBX/storage failure from category or numeric index + * 200-299 = propagated corruption/invariant failure from category or numeric index + */ + ndd::OperationResult + computeFilterBitmap(const nlohmann::json& filter_array) const; + + /** + * Returns numeric ids matching a filter query based on the provided JSON filter array + * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from bitmap computation + * 100-199 = propagated MDBX/storage failure from bitmap computation + * 200-299 = propagated corruption/invariant failure from bitmap computation + */ + ndd::OperationResult> + getIdsMatchingFilter(const nlohmann::json& filter_array) const; + + /* + * Counts numeric ids matching a filter query. + * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from bitmap computation + * 100-199 = propagated MDBX/storage failure from bitmap computation + * 200-299 = propagated corruption/invariant failure from bitmap computation + */ + ndd::OperationResult countIdsMatchingFilter( + const nlohmann::json& filter_array) const; + + /* + * Adds one id to a category filter. 
+ * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ + ndd::OperationResult<> + add_to_filter(const std::string& field, const std::string& value, ndd::idInt numeric_id); + + /* + * Adds a batch of ids to one already formatted category filter key. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ + ndd::OperationResult<> add_to_filter_batch(const std::string& filter_key, + const std::vector& numeric_ids); + + /* + * Adds one batch of filter JSON documents into the numeric and category indexes. + * + * Return codes: + * 0 = success + * 1 = invalid filter JSON or field shape; caller should return HTTP 400 + * 2 = unsupported filter field type or category value too long; caller should return HTTP 400 + * 3 = field type mismatch with existing schema; caller should return HTTP 400 + * 100-199 = propagated MDBX/storage failure from schema, numeric, or category writes + * 200-299 = propagated corruption/invariant failure from numeric or category writes + */ + ndd::OperationResult<> add_filters_from_json_batch( + const std::vector>& id_filter_pairs); + + /* + * Removes one id from a category filter. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ + ndd::OperationResult<> + remove_from_filter(const std::string& field, + const std::string& value, + ndd::idInt numeric_id); + + /* + * Checks whether one id is present in a category filter. 
+ * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ + ndd::OperationResult + contains(const std::string& field, const std::string& value, ndd::idInt numeric_id) const; + + /* + * Adds one filter JSON document into the numeric and category indexes. + * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from batch add + * 100-199 = propagated MDBX/storage failure from batch add + * 200-299 = propagated corruption/invariant failure from batch add + */ + ndd::OperationResult<> add_filters_from_json(ndd::idInt numeric_id, + const std::string& filter_json); + + /* + * Removes one filter JSON document from the numeric and category indexes. + * + * Return codes: + * 0 = success + * 1 = invalid filter JSON or field shape; caller should return HTTP 400 + * 2 = unsupported filter field type; caller should return HTTP 400 + * 100-199 = propagated MDBX/storage failure from numeric or category index + * 200-299 = propagated corruption/invariant failure from numeric or category index + */ + ndd::OperationResult<> remove_filters_from_json(ndd::idInt numeric_id, + const std::string& filter_json); + + /* + * Combines category filters with AND semantics. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ + ndd::OperationResult combine_filters_and( + const std::vector>& filters) const; + + /* + * Combines category filters with OR semantics. + * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from category index + * 200-299 = propagated corruption/invariant failure from category index + */ + ndd::OperationResult combine_filters_or( + const std::vector>& filters) const; + + /* + * Checks whether one id satisfies one numeric filter expression. 
+ * + * Return codes: + * 0 = success + * 2 = invalid numeric operator or value; caller should return HTTP 400 + * 100-199 = propagated MDBX/storage failure from numeric index + * 200-299 = propagated corruption/invariant failure from numeric index + */ + ndd::OperationResult check_numeric(const std::string& field, + ndd::idInt id, + const std::string& op, + const nlohmann::json& val) const; }; diff --git a/src/filter/numeric_index.cpp b/src/filter/numeric_index.cpp new file mode 100644 index 0000000000..5b23d40b74 --- /dev/null +++ b/src/filter/numeric_index.cpp @@ -0,0 +1,1144 @@ +#include "numeric_index.hpp" + +#include +#include +#include +#include + +#include "../utils/log.hpp" + +namespace ndd { + namespace filter { + + NumericBatchEntry::NumericBatchEntry(std::string field_in, + ndd::idInt id_in, + uint32_t value_in) : + field(std::move(field_in)), + id(id_in), + value(value_in) {} + + // --- Sortable Key Utilities --- + uint32_t float_to_sortable(float f) { + uint32_t i; + std::memcpy(&i, &f, sizeof(float)); + // IEEE 754: if sign bit set, flip all bits. Else flip just sign. + // This makes negatives < positives order correctly. 
+ uint32_t mask = (int32_t(i) >> 31) | 0x80000000; + return i ^ mask; + } + + float sortable_to_float(uint32_t i) { + uint32_t mask = ((i >> 31) - 1) | 0x80000000; + uint32_t result = i ^ mask; + float f; + std::memcpy(&f, &result, sizeof(float)); + return f; + } + + uint32_t int_to_sortable(int32_t i) { + return static_cast(i) ^ 0x80000000; + } + + int32_t sortable_to_int(uint32_t i) { + return static_cast(i ^ 0x80000000); + } + + ndd::OperationResult + Bucket::read_bitmap_payload(const uint8_t* data, size_t len) { + if(len == 0) { + return {SUCCESS, "", ndd::RoaringBitmap()}; + } + if(data == nullptr) { + return {200, "empty bitmap payload"}; + } + + const char* bytes = reinterpret_cast(data); + const size_t consumed = + roaring::api::roaring_bitmap_portable_deserialize_size(bytes, len); + if(consumed == 0) { + return {200, "invalid or truncated bitmap payload"}; + } + if(consumed != len) { + return {200, + "bitmap payload length mismatch: consumed " + + std::to_string(consumed) + " of " + + std::to_string(len) + " bytes"}; + } + + ndd::RoaringBitmap bitmap; + try { + bitmap = ndd::RoaringBitmap::readSafe(bytes, len); + } catch(const std::exception& e) { + return {200, + "failed to deserialize bitmap payload: " + std::string(e.what())}; + } + + const char* reason = nullptr; + if(!roaring::api::roaring_bitmap_internal_validate(&bitmap.roaring, + &reason)) { + return {200, + std::string("invalid bitmap internals") + + (reason != nullptr ? 
": " + std::string(reason) : "")}; + } + return {SUCCESS, "", std::move(bitmap)}; + } + + // Helper to get actual value + uint32_t Bucket::get_value(size_t index) const { + return base_value + deltas[index]; + } + + void Bucket::add(uint32_t val, ndd::idInt id) { + if (val < base_value) { + // Should not happen if Key logic is correct + throw std::runtime_error("Insert value < Base Value"); + } + uint32_t delta_32 = val - base_value; + if (delta_32 > MAX_DELTA) { + throw std::runtime_error("Delta overflow"); + } + + summary_bitmap.add(id); + is_dirty = true; + + /** + * If the bucket is already at MAX_SIZE in the parallel + * arrays AND the new value equals base_value, route the + * id into summary_bitmap only. Every id in the bitmap + * with no matching delta is implicitly value-tagged by + * base_value, so range queries can recover its value + * without a per-id delta entry. This caps the on-disk + * deltas/ids growth for duplicate-heavy values. + * + * Non-duplicate inserts (delta_32 != 0) still go into + * the sorted arrays even when the bucket is "full" -- + * the slide-split fallthrough then pushes the bucket + * one over MAX_SIZE momentarily and the next insert's + * slide-split finds the new value boundary and splits. + */ + if (delta_32 == 0 && ids.size() >= MAX_SIZE) { + return; + } + + uint16_t delta = static_cast(delta_32); + auto it = std::lower_bound(deltas.begin(), deltas.end(), delta); + size_t index = std::distance(deltas.begin(), it); + deltas.insert(it, delta); + ids.insert(ids.begin() + index, id); + } + + bool Bucket::remove(ndd::idInt id) { + if (!summary_bitmap.contains(id)) { + return false; + } + /** + * The id might live only in the bitmap (added past MAX_SIZE). + * The linear scan is best effort to also clear the ordered + * arrays; the bitmap is the source of truth. 
+ */ + for (size_t i = 0; i < ids.size(); ++i) { + if (ids[i] == id) { + ids.erase(ids.begin() + i); + deltas.erase(deltas.begin() + i); + break; + } + } + summary_bitmap.remove(id); + is_dirty = true; + return true; + } + + /** + * Serialization Format: + * [BitmapSize (uint32_t)] + * [Bitmap Bytes] + * [Deltas (nr_array_entries * sizeof(uint16_t))] + * [IDs (nr_array_entries * sizeof(idInt))] + * + * nr_array_entries is recovered on read from + * (iov_len - sizeof(uint32_t) - bm_size) + * / (sizeof(uint16_t) + sizeof(idInt)) + */ + std::vector Bucket::serialize() const { + const_cast(summary_bitmap).runOptimize(); + + /** + * Note: ids.size() can transiently exceed MAX_SIZE when + * the slide-split fallthrough in add_to_buckets has just + * pushed a non-duplicate into a saturated bucket. The + * very next insert into that bucket will trigger a + * standard slide-split that splits on the new boundary, + * so the on-disk over-MAX_SIZE state is short-lived. + * Saturated-with-duplicate inserts go bitmap-only via + * Bucket::add and do not grow ids/deltas. 
+ */ + size_t bm_size = summary_bitmap.getSizeInBytes(); + size_t nr_array_entries = ids.size(); + size_t total_size = sizeof(uint32_t) + bm_size + + (nr_array_entries * sizeof(uint16_t)) + + (nr_array_entries * sizeof(ndd::idInt)); + std::vector buffer(total_size); + uint8_t* ptr = buffer.data(); + + uint32_t bm_size_32 = static_cast(bm_size); + std::memcpy(ptr, &bm_size_32, sizeof(uint32_t)); + ptr += sizeof(uint32_t); + + if (bm_size > 0) { + summary_bitmap.write(reinterpret_cast(ptr)); + ptr += bm_size; + } + + if (nr_array_entries > 0) { + std::memcpy(ptr, deltas.data(), + nr_array_entries * sizeof(uint16_t)); + ptr += nr_array_entries * sizeof(uint16_t); + std::memcpy(ptr, ids.data(), + nr_array_entries * sizeof(ndd::idInt)); + } + + return buffer; + } + + Bucket Bucket::deserialize(const void* data, size_t len, uint32_t base_val) { + Bucket b; + b.base_value = base_val; + + if (len < sizeof(uint32_t)) return b; // Just the bm_size header + + const uint8_t* ptr = static_cast(data); + const uint8_t* end = ptr + len; + + // 1. Bitmap size + uint32_t bm_size; + std::memcpy(&bm_size, ptr, sizeof(uint32_t)); + ptr += sizeof(uint32_t); + if (bm_size > static_cast(end - ptr)) { + throw std::runtime_error("Bucket corrupt: invalid bitmap size"); + } + + // 2. Bitmap + if (bm_size > 0) { + auto bitmap_result = read_bitmap_payload(ptr, bm_size); + if(!bitmap_result.ok()) { + throw std::runtime_error("Bucket corrupt: " + + bitmap_result.message); + } + if(!bitmap_result.value.has_value()) { + throw std::runtime_error( + "Bucket corrupt: bitmap reader succeeded without a bitmap"); + } + b.summary_bitmap = std::move(*bitmap_result.value); + ptr += bm_size; + } + + // 3. Derive nr_array_entries from the residual. 
+ size_t remaining = static_cast(end - ptr); + constexpr size_t per_entry = + sizeof(uint16_t) + sizeof(ndd::idInt); + if (remaining % per_entry != 0) { + throw std::runtime_error( + "Bucket corrupt: residual bytes not aligned"); + } + size_t nr_array_entries = remaining / per_entry; + + if (nr_array_entries > 0) { + size_t delta_size = nr_array_entries * sizeof(uint16_t); + size_t id_size = nr_array_entries * sizeof(ndd::idInt); + if (ptr + delta_size + id_size > end) { + throw std::runtime_error("Bucket corrupt: truncated arrays"); + } + b.deltas.resize(nr_array_entries); + std::memcpy(b.deltas.data(), ptr, delta_size); + ptr += delta_size; + b.ids.resize(nr_array_entries); + std::memcpy(b.ids.data(), ptr, id_size); + } + + return b; + } + + /** + * Fast access to just the bitmap. + * + * Used by range() when a bucket is fully covered by the query + * extent and we don't need the deltas/ids arrays. Skips the + * memcpy + vector allocations that full deserialize would do + * for those arrays. 
+ */ + ndd::RoaringBitmap Bucket::read_summary_bitmap(const void* data, + size_t len) { + if (len < sizeof(uint32_t)) { + throw std::runtime_error("Bucket corrupt: missing bitmap size"); + } + const uint8_t* ptr = static_cast(data); + const uint8_t* end = ptr + len; + uint32_t bm_size; + std::memcpy(&bm_size, ptr, sizeof(uint32_t)); + ptr += sizeof(uint32_t); + if (bm_size > static_cast(end - ptr)) { + throw std::runtime_error("Bucket corrupt: invalid bitmap size"); + } + constexpr size_t per_entry = + sizeof(uint16_t) + sizeof(ndd::idInt); + const size_t remaining = + static_cast(end - ptr - bm_size); + if (remaining % per_entry != 0) { + throw std::runtime_error( + "Bucket corrupt: residual bytes not aligned"); + } + auto bitmap_result = read_bitmap_payload(ptr, bm_size); + if(!bitmap_result.ok()) { + throw std::runtime_error("Bucket corrupt: " + + bitmap_result.message); + } + if(!bitmap_result.value.has_value()) { + throw std::runtime_error( + "Bucket corrupt: bitmap reader succeeded without a bitmap"); + } + return std::move(*bitmap_result.value); + } + + bool Bucket::is_full() const { + return ids.size() >= MAX_SIZE; + } + + bool Bucket::is_empty() const { + return ids.empty() && summary_bitmap.isEmpty(); + } + + std::string NumericIndex::make_forward_key(const std::string& field, ndd::idInt id) { + return field + ":" + std::to_string(id); + } + + // Key Format: [Field]:[BigEndian_BaseValue] + std::string NumericIndex::make_bucket_key(const std::string& field, uint32_t start_val) { + uint32_t be_val = 0; +#if defined(__GNUC__) || defined(__clang__) + be_val = __builtin_bswap32(start_val); +#else + be_val = ((start_val >> 24) & 0xff) | ((start_val << 8) & 0xff0000) + | ((start_val >> 8) & 0xff00) | ((start_val << 24) & 0xff000000); +#endif + std::string key = field + ":"; + key.append(reinterpret_cast(&be_val), 4); + return key; + } + + uint32_t NumericIndex::parse_bucket_key_val(const std::string& key) { + if(key.size() < 4) { + return 0; + } + uint32_t 
be_val; + std::memcpy(&be_val, key.data() + key.size() - 4, 4); +#if defined(__GNUC__) || defined(__clang__) + return __builtin_bswap32(be_val); +#else + return ((be_val >> 24) & 0xff) | ((be_val << 8) & 0xff0000) + | ((be_val >> 8) & 0xff00) | ((be_val << 24) & 0xff000000); +#endif + } + + /* + * Removes one id from the numeric inverted bucket that currently owns its old value. + * + * Return codes: + * 0 = success + * 100 = MDBX cursor, read, delete, or write failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt numeric bucket payload; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult<> NumericIndex::remove_from_buckets(MDBX_txn* txn, + const std::string& field, + uint32_t value, + ndd::idInt id) { + // Find bucket + std::string bkey_str = make_bucket_key(field, value); + MDBX_val key{const_cast(bkey_str.data()), bkey_str.size()}; + MDBX_val data; + MDBX_cursor* cursor = nullptr; + int rc = mdbx_cursor_open(txn, inverted_dbi_, &cursor); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to open numeric bucket remove cursor: " + + std::string(mdbx_strerror(rc))}; + } + + /** + * Scan backward to find bucket covering 'value'. + * Logic to find correct bucket: + */ + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_SET_RANGE); + if(rc == MDBX_SUCCESS) { + // Check if we are in right field & range + std::string found_key(static_cast(key.iov_base), key.iov_len); + if(found_key.rfind(field + ":", 0) != 0 + || parse_bucket_key_val(found_key) > value) { + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_PREV); + } + } else if(rc == MDBX_NOTFOUND) { + /** + * The only possible bucket that could still contain + * value is the very last bucket in the database. + * Hence jumping there. 
+ */ + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_LAST); + } + + // Should be at correct bucket now + if(rc != MDBX_SUCCESS) { + mdbx_cursor_close(cursor); + if(rc == MDBX_NOTFOUND) { + return {SUCCESS, ""}; + } + return {100, "Failed to locate numeric bucket for remove: " + + std::string(mdbx_strerror(rc))}; + } + + std::string found_key(static_cast(key.iov_base), key.iov_len); + if(found_key.rfind(field + ":", 0) != 0) { + mdbx_cursor_close(cursor); + return {SUCCESS, ""}; + } + + uint32_t bucket_base = parse_bucket_key_val(found_key); + if(value < bucket_base) { + mdbx_cursor_close(cursor); + return {SUCCESS, ""}; + } + + try { + Bucket bucket = Bucket::deserialize(data.iov_base, data.iov_len, bucket_base); + if(bucket.remove(id)) { + // Save back or Delete if empty + if(bucket.is_empty()) { + rc = mdbx_cursor_del(cursor, static_cast(0)); + if(rc != MDBX_SUCCESS) { + mdbx_cursor_close(cursor); + return {100, "Failed to delete empty numeric bucket: " + + std::string(mdbx_strerror(rc))}; + } + } else { + auto bytes = bucket.serialize(); + MDBX_val new_data{bytes.data(), bytes.size()}; + rc = mdbx_cursor_put(cursor, &key, &new_data, MDBX_CURRENT); + if(rc != MDBX_SUCCESS) { + mdbx_cursor_close(cursor); + return {100, "Failed to update numeric bucket after remove: " + + std::string(mdbx_strerror(rc))}; + } + } + } + } catch(const std::exception& e) { + mdbx_cursor_close(cursor); + return {200, "Corrupt numeric bucket while removing id: " + + std::string(e.what())}; + } + + mdbx_cursor_close(cursor); + return {SUCCESS, ""}; + } + + /* + * Adds one id/value pair into the numeric inverted bucket index. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX cursor, read, or write failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt numeric bucket payload or invalid bucket invariant; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult<> NumericIndex::add_to_buckets(MDBX_txn* txn, + const std::string& field, + uint32_t value, + ndd::idInt id) { + MDBX_cursor* cursor = nullptr; + int rc = mdbx_cursor_open(txn, inverted_dbi_, &cursor); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to open numeric bucket add cursor: " + + std::string(mdbx_strerror(rc))}; + } + + // Find candidate bucket + std::string search_key = make_bucket_key(field, value); + MDBX_val key{const_cast(search_key.data()), search_key.size()}; + MDBX_val data; + + // Move logic to find predecessor + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_SET_RANGE); + if(rc == MDBX_SUCCESS) { + std::string found_key(static_cast(key.iov_base), key.iov_len); + if(found_key.rfind(field + ":", 0) != 0 + || parse_bucket_key_val(found_key) > value) { + int prev_rc = mdbx_cursor_get(cursor, &key, &data, MDBX_PREV); + if(prev_rc == MDBX_SUCCESS) { + rc = prev_rc; + } else if(prev_rc != MDBX_NOTFOUND) { + mdbx_cursor_close(cursor); + return {100, "Failed to seek previous numeric bucket: " + + std::string(mdbx_strerror(prev_rc))}; + } else { + rc = MDBX_NOTFOUND; + } + } + } else if(rc == MDBX_NOTFOUND) { + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_LAST); + if(rc != MDBX_SUCCESS && rc != MDBX_NOTFOUND) { + mdbx_cursor_close(cursor); + return {100, "Failed to seek last numeric bucket: " + + std::string(mdbx_strerror(rc))}; + } + } else { + mdbx_cursor_close(cursor); + return {100, "Failed to seek numeric bucket: " + + std::string(mdbx_strerror(rc))}; + } + + bool create_new = true; + std::string target_key_str; + uint32_t target_base = 0; + if(rc == MDBX_SUCCESS) { + std::string found_key(static_cast(key.iov_base), key.iov_len); + if(found_key.rfind(field + ":", 0) == 0) { + 
target_base = parse_bucket_key_val(found_key); + + // Check range condition + if(value >= target_base + && (static_cast(value) - target_base) + <= Bucket::MAX_DELTA) { + target_key_str = found_key; + create_new = false; + } + } + } + + try { + if(create_new) { + // Create new bucket at exact value + Bucket bucket; + bucket.base_value = value; + bucket.add(value, id); + auto bytes = bucket.serialize(); + + target_key_str = make_bucket_key(field, value); + MDBX_val k{const_cast(target_key_str.data()), + target_key_str.size()}; + MDBX_val v{bytes.data(), bytes.size()}; + rc = mdbx_put(txn, inverted_dbi_, &k, &v, MDBX_UPSERT); + if(rc != MDBX_SUCCESS) { + mdbx_cursor_close(cursor); + return {100, "Failed to create numeric bucket: " + + std::string(mdbx_strerror(rc))}; + } + } else { + /** + * Update existing. + * We must re-fetch current key/data because cursor move might have updated key/data. + */ + MDBX_val k{const_cast(target_key_str.data()), + target_key_str.size()}; + MDBX_val v; + rc = mdbx_cursor_get(cursor, &k, &v, MDBX_SET); + if(rc != MDBX_SUCCESS) { + // Should not happen if logic is correct + mdbx_cursor_close(cursor); + return {200, "Failed to resync numeric bucket cursor: " + + std::string(mdbx_strerror(rc))}; + } + + Bucket bucket = Bucket::deserialize(v.iov_base, v.iov_len, target_base); + // Capacity Check + if(bucket.ids.size() >= Bucket::MAX_SIZE) { + /** + * SPLIT LOGIC + * Sort is maintained by arrays. + * "Slide Split": Scan right from median. + * Ensure we don't split a group of identical values. 
+ */ + size_t mid_idx = bucket.ids.size() / 2; + size_t probe_right = mid_idx; + while(probe_right < bucket.deltas.size() && probe_right > 0 + && bucket.deltas[probe_right] + == bucket.deltas[probe_right - 1]) { + probe_right++; + } + + if(probe_right < bucket.deltas.size()) { + mid_idx = probe_right; + } else { + // Fallback: Try scanning left + size_t probe_left = mid_idx; + while(probe_left > 0 + && bucket.deltas[probe_left] + == bucket.deltas[probe_left - 1]) { + probe_left--; + } + // All identical + mid_idx = probe_left > 0 ? probe_left : bucket.deltas.size(); + } + + /** + * Slide-split could not find a value boundary + * -- the bucket is all duplicates of + * base_value, so there is no clean place to + * cut. Just append the new entry; the bucket + * goes momentarily past MAX_SIZE. + * + * If the new value equals base_value, it + * extends the duplicate run; the next insert + * of any value will fall into the same + * fallthrough. + * + * If the new value is greater than base_value, + * it introduces the boundary that was missing, + * and the very next insert hitting this + * bucket will split cleanly via the standard + * slide-split path below. + * + * The on-disk count field has been removed + * from the bucket payload, so this transient + * over-MAX_SIZE state can no longer cause the + * uint16_t cliff at 65,536 entries -- the + * deserializer derives N from the residual + * bytes after the bitmap. 
+ */ + if(mid_idx == bucket.deltas.size()) { + bucket.add(value, id); + auto bytes = bucket.serialize(); + MDBX_val k2{const_cast(target_key_str.data()), + target_key_str.size()}; + MDBX_val v2{bytes.data(), bytes.size()}; + rc = mdbx_cursor_put(cursor, &k2, &v2, MDBX_CURRENT); + mdbx_cursor_close(cursor); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to update overfull numeric bucket: " + + std::string(mdbx_strerror(rc))}; + } + return {SUCCESS, ""}; + } + + // Standard Slide Split + Bucket right_bucket; + right_bucket.base_value = bucket.base_value + bucket.deltas[mid_idx]; + // Move entries + for(size_t i = mid_idx; i < bucket.deltas.size(); ++i) { + right_bucket.add(bucket.base_value + bucket.deltas[i], + bucket.ids[i]); + } + + // Truncate left + bucket.deltas.resize(mid_idx); + bucket.ids.resize(mid_idx); + /** + * Left bitmap = original bitmap minus the ids + * that moved to right_bucket. This preserves + * any delta-0 bitmap-only entries on the left + * (their value == base_value and the left + * bucket's base_value is unchanged), where + * rebuilding from bucket.ids alone would drop + * them. + */ + for(size_t i = 0; i < right_bucket.ids.size(); ++i) { + bucket.summary_bitmap.remove(right_bucket.ids[i]); + } + + // Now add new value to correct bucket + if(value >= right_bucket.base_value) { + right_bucket.add(value, id); + } else { + /** + * If value < right, goes to left. + * But wait, split point was determined by existing items. + * If new value is >= base+split_delta, it goes right. + * BUT we just cleared right from b. + * Correct logic: + * Oh wait, if we added to left, we might overflow again or break order? + * Simply: Check which bucket covers it. + * Left covers [Base, RightBase-1]. + * Right covers [RightBase, ...]. 
+ */ + bucket.add(value, id); + } + + // Save Left + auto left_bytes = bucket.serialize(); + MDBX_val left_v{left_bytes.data(), left_bytes.size()}; + MDBX_val left_k{const_cast(target_key_str.data()), + target_key_str.size()}; + rc = mdbx_cursor_put(cursor, &left_k, &left_v, MDBX_CURRENT); + if(rc != MDBX_SUCCESS) { + mdbx_cursor_close(cursor); + return {100, "Failed to update split numeric bucket: " + + std::string(mdbx_strerror(rc))}; + } + + // Save Right + auto right_bytes = right_bucket.serialize(); + std::string right_k_str = + make_bucket_key(field, right_bucket.base_value); + MDBX_val right_k{const_cast(right_k_str.data()), + right_k_str.size()}; + MDBX_val right_v{right_bytes.data(), right_bytes.size()}; + // Use put for new key + rc = mdbx_put(txn, inverted_dbi_, &right_k, &right_v, MDBX_UPSERT); + if(rc != MDBX_SUCCESS) { + mdbx_cursor_close(cursor); + return {100, "Failed to write split numeric bucket: " + + std::string(mdbx_strerror(rc))}; + } + } else { + // Normal Insert + bucket.add(value, id); + auto bytes = bucket.serialize(); + MDBX_val new_data{bytes.data(), bytes.size()}; + // Use cursor put to update current + rc = mdbx_cursor_put(cursor, &k, &new_data, MDBX_CURRENT); + if(rc != MDBX_SUCCESS) { + mdbx_cursor_close(cursor); + return {100, "Failed to update numeric bucket: " + + std::string(mdbx_strerror(rc))}; + } + } + } + } catch(const std::exception& e) { + mdbx_cursor_close(cursor); + return {200, "Corrupt numeric bucket while adding id: " + + std::string(e.what())}; + } + + mdbx_cursor_close(cursor); + return {SUCCESS, ""}; + } + + /* + * Writes one numeric forward entry and updates the inverted buckets inside a caller transaction. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX read or write failure; caller should log ERROR and return HTTP 500 + * 100-199 = propagated MDBX/storage failure from bucket helpers + * 200 = corrupt numeric forward value; caller should log ERROR and return HTTP 500 + * 200-299 = propagated corruption/invariant failure from bucket helpers + */ + ndd::OperationResult<> NumericIndex::put_internal(MDBX_txn* txn, + const std::string& field, + ndd::idInt id, + uint32_t value) { + + // 1. Check Forward Index + std::string fwd_key_str = make_forward_key(field, id); + MDBX_val fwd_key{const_cast(fwd_key_str.data()), fwd_key_str.size()}; + MDBX_val fwd_val; + + int rc = mdbx_get(txn, forward_dbi_, &fwd_key, &fwd_val); + if(rc == MDBX_SUCCESS) { + if(fwd_val.iov_len != sizeof(uint32_t)) { + return {200, "Corrupt numeric forward value for field '" + field + "'"}; + } + uint32_t old_val; + std::memcpy(&old_val, fwd_val.iov_base, sizeof(uint32_t)); + if(old_val == value) { + return {SUCCESS, ""}; + } + auto remove_result = remove_from_buckets(txn, field, old_val, id); + if(!remove_result.ok()) { + return remove_result; + } + } else if(rc != MDBX_NOTFOUND) { + return {100, "Failed to read numeric forward value: " + + std::string(mdbx_strerror(rc))}; + } + + // 2. Update Forward + MDBX_val new_val_data{&value, sizeof(uint32_t)}; + rc = mdbx_put(txn, forward_dbi_, &fwd_key, &new_val_data, MDBX_UPSERT); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to write numeric forward value: " + + std::string(mdbx_strerror(rc))}; + } + + // 3. 
Add to Inverted Buckets + return add_to_buckets(txn, field, value, id); + } + + NumericIndex::NumericIndex(MDBX_env* env) : + env_(env) { + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); + if(rc != MDBX_SUCCESS) { + throw std::runtime_error(std::string("Failed to begin NumericIndex init: ") + + mdbx_strerror(rc)); + } + + rc = mdbx_dbi_open(txn, "numeric_forward", MDBX_CREATE, &forward_dbi_); + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + throw std::runtime_error(std::string("Failed to open numeric_forward dbi: ") + + mdbx_strerror(rc)); + } + + rc = mdbx_dbi_open(txn, "numeric_inverted", MDBX_CREATE, &inverted_dbi_); + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + throw std::runtime_error(std::string("Failed to open numeric_inverted dbi: ") + + mdbx_strerror(rc)); + } + + rc = mdbx_txn_commit(txn); + if(rc != MDBX_SUCCESS) { + throw std::runtime_error(std::string("Failed to commit NumericIndex init: ") + + mdbx_strerror(rc)); + } + } + + /* + * Writes a batch of numeric filter entries in bounded MDBX write transaction chunks. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX transaction or commit failure; caller should log ERROR and return HTTP 500 + * 100-199 = propagated MDBX/storage failure from per-entry writes + * 200-299 = propagated corruption/invariant failure from per-entry writes + */ + ndd::OperationResult<> NumericIndex::put_batch( + const std::vector& entries) { + if(entries.empty()) { + return {SUCCESS, ""}; + } + + for(size_t start = 0; start < entries.size(); start += BATCH_TXN_CHUNK_SIZE) { + size_t end = std::min(start + BATCH_TXN_CHUNK_SIZE, entries.size()); + + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to begin numeric batch write transaction: " + + std::string(mdbx_strerror(rc))}; + } + + for(size_t i = start; i < end; ++i) { + const auto& entry = entries[i]; + auto put_result = put_internal(txn, entry.field, entry.id, entry.value); + if(!put_result.ok()) { + mdbx_txn_abort(txn); + return put_result; + } + } + + rc = mdbx_txn_commit(txn); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to commit numeric batch write transaction: " + + std::string(mdbx_strerror(rc))}; + } + } + return {SUCCESS, ""}; + } + + /* + * Removes one id from the numeric forward and inverted indexes for a field. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX transaction, read, delete, or commit failure; caller should log ERROR and return HTTP 500 + * 100-199 = propagated MDBX/storage failure from bucket helpers + * 200 = corrupt numeric forward value; caller should log ERROR and return HTTP 500 + * 200-299 = propagated corruption/invariant failure from bucket helpers + */ + ndd::OperationResult<> NumericIndex::remove(const std::string& field, ndd::idInt id) { + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to begin numeric remove transaction: " + + std::string(mdbx_strerror(rc))}; + } + + std::string fwd_key_str = make_forward_key(field, id); + MDBX_val fwd_key{const_cast(fwd_key_str.data()), fwd_key_str.size()}; + MDBX_val fwd_val; + + rc = mdbx_get(txn, forward_dbi_, &fwd_key, &fwd_val); + if(rc == MDBX_NOTFOUND) { + mdbx_txn_abort(txn); + return {SUCCESS, ""}; + } + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + return {100, "Failed to read numeric forward value for remove: " + + std::string(mdbx_strerror(rc))}; + } + if(fwd_val.iov_len != sizeof(uint32_t)) { + mdbx_txn_abort(txn); + return {200, "Corrupt numeric forward value for field '" + field + "'"}; + } + + uint32_t old_val; + std::memcpy(&old_val, fwd_val.iov_base, sizeof(uint32_t)); + auto remove_result = remove_from_buckets(txn, field, old_val, id); + if(!remove_result.ok()) { + mdbx_txn_abort(txn); + return remove_result; + } + + rc = mdbx_del(txn, forward_dbi_, &fwd_key, nullptr); + if(rc != MDBX_SUCCESS && rc != MDBX_NOTFOUND) { + mdbx_txn_abort(txn); + return {100, "Failed to delete numeric forward value: " + + std::string(mdbx_strerror(rc))}; + } + + rc = mdbx_txn_commit(txn); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to commit numeric remove transaction: " + + std::string(mdbx_strerror(rc))}; + } + return {SUCCESS, ""}; + } + + /* + * Computes a bitmap of ids whose numeric field value falls 
within an inclusive sortable range. + * + * Return codes: + * 0 = success + * 100 = MDBX transaction, cursor, or scan failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt numeric bucket payload; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult + NumericIndex::range(const std::string& field, uint32_t min_val, uint32_t max_val) { + ndd::RoaringBitmap result; + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to begin numeric range transaction: " + + std::string(mdbx_strerror(rc))}; + } + + MDBX_cursor* cursor = nullptr; + rc = mdbx_cursor_open(txn, inverted_dbi_, &cursor); + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + return {100, "Failed to open numeric range cursor: " + + std::string(mdbx_strerror(rc))}; + } + + // 1. Find Start Bucket + std::string start_k = make_bucket_key(field, min_val); + MDBX_val key{const_cast(start_k.data()), start_k.size()}; + MDBX_val data; + + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_SET_RANGE); + if(rc == MDBX_SUCCESS) { + std::string fkey(static_cast(key.iov_base), key.iov_len); + if(fkey.rfind(field + ":", 0) != 0 || parse_bucket_key_val(fkey) > min_val) { + // Check if we need to back up + MDBX_val prev_key = key; + MDBX_val prev_data; + // Check prev + int prev_rc = mdbx_cursor_get(cursor, &prev_key, &prev_data, MDBX_PREV); + if(prev_rc == MDBX_SUCCESS) { + std::string prev_key_str(static_cast(prev_key.iov_base), + prev_key.iov_len); + if(prev_key_str.rfind(field + ":", 0) == 0) { + // Prev is valid start + key = prev_key; + data = prev_data; + } + } else if(prev_rc != MDBX_NOTFOUND) { + mdbx_cursor_close(cursor); + mdbx_txn_abort(txn); + return {100, "Failed to seek previous numeric range bucket: " + + std::string(mdbx_strerror(prev_rc))}; + } + } + } else if(rc == MDBX_NOTFOUND) { + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_LAST); + if(rc == MDBX_SUCCESS) { + std::string 
fkey(static_cast(key.iov_base), key.iov_len); + if(fkey.rfind(field + ":", 0) != 0) { + rc = MDBX_NOTFOUND; + } + } else if(rc != MDBX_NOTFOUND) { + mdbx_cursor_close(cursor); + mdbx_txn_abort(txn); + return {100, "Failed to seek last numeric range bucket: " + + std::string(mdbx_strerror(rc))}; + } + } else { + mdbx_cursor_close(cursor); + mdbx_txn_abort(txn); + return {100, "Failed to seek numeric range bucket: " + + std::string(mdbx_strerror(rc))}; + } + + try { + // Iterate forward + while(rc == MDBX_SUCCESS) { + std::string cur_key(static_cast(key.iov_base), key.iov_len); + if(cur_key.rfind(field + ":", 0) != 0) { + break; + } + + uint32_t bucket_base = parse_bucket_key_val(cur_key); + if(bucket_base > max_val) { + break; + } + + /** + * Coarse full-coverage fast path. + * + * A bucket can hold values in [base, base+MAX_DELTA] + * by construction. If that whole extent is inside + * [min_val, max_val], we don't need to look at the + * deltas/ids arrays -- the bucket's summary_bitmap + * already enumerates every id that belongs in the + * result. Skip the full deserialize and read just + * the bitmap header. + * + * This fires on every interior bucket of a wide + * range scan, so for "score >= a AND score <= b" + * with a wide [a,b] only the start and end buckets + * pay the deltas/ids parsing cost. + */ + if(bucket_base >= min_val + && static_cast(bucket_base) + Bucket::MAX_DELTA + <= max_val) { + result |= Bucket::read_summary_bitmap(data.iov_base, + data.iov_len); + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_NEXT); + continue; + } + + Bucket bucket = Bucket::deserialize(data.iov_base, + data.iov_len, + bucket_base); + + if(bucket.ids.empty()) { + /** + * ids[] empty but the bucket survived means the + * bitmap still carries delta-0 (bitmap-only) + * entries that were absorbed past MAX_SIZE by + * the saturated-duplicate path in Bucket::add. + * All such ids have value == base_value, so + * include them iff base_value is in range. 
+ */ + if(!bucket.summary_bitmap.isEmpty() + && bucket_base >= min_val && bucket_base <= max_val) { + result |= bucket.summary_bitmap; + } + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_NEXT); + continue; + } + + uint32_t bucket_min = bucket.get_value(0); + uint32_t bucket_max = bucket.get_value(bucket.ids.size() - 1); + + if(bucket_min >= min_val && bucket_max <= max_val) { + /** + * Full overlap. summary_bitmap is a superset + * of bucket.ids (it also carries any bitmap- + * only entries from the saturated-duplicate + * path, all of which have value == base_value + * and therefore lie inside the query since + * bucket_min == base_value is inside). + */ + result |= bucket.summary_bitmap; + } else { + // Partial overlap on the parallel arrays. + for(size_t i = 0; i < bucket.ids.size(); ++i) { + uint32_t value = bucket.get_value(i); + if(value >= min_val && value <= max_val) { + result.add(bucket.ids[i]); + } + } + /** + * Bitmap-only entries (cardinality > ids.size()) + * exist when Bucket::add saturated and absorbed + * duplicates of base_value into summary_bitmap + * only. Every such entry has value == base_value + * by construction. Include them iff base_value + * lies in [min_val, max_val]. + * + * "bitmap-only" set = + * summary_bitmap minus { ids[i] : deltas[i] != 0 } + * because the delta-zero ids in ids[] are also + * in the bitmap and would be redundantly added, + * but Roaring set union is idempotent so + * removing only the delta>0 entries is enough + * to leave us with all delta-zero ids (whether + * they live in ids[] or only in the bitmap). 
+ */ + if(bucket_base >= min_val && bucket_base <= max_val + && bucket.summary_bitmap.cardinality() + > bucket.ids.size()) { + ndd::RoaringBitmap bitmap_only = + bucket.summary_bitmap; + for(size_t i = 0; i < bucket.ids.size(); ++i) { + if(bucket.deltas[i] != 0) { + bitmap_only.remove(bucket.ids[i]); + } + } + result |= bitmap_only; + } + } + + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_NEXT); + } + } catch(const std::exception& e) { + mdbx_cursor_close(cursor); + mdbx_txn_abort(txn); + return {200, "Corrupt numeric bucket during range scan: " + + std::string(e.what())}; + } + + mdbx_cursor_close(cursor); + mdbx_txn_abort(txn); + if(rc != MDBX_SUCCESS && rc != MDBX_NOTFOUND) { + return {100, "Failed during numeric range scan: " + + std::string(mdbx_strerror(rc))}; + } + return {SUCCESS, "", std::move(result)}; + } + + /* + * Checks whether one id has a numeric field value inside an inclusive sortable range. + * + * Return codes: + * 0 = success + * 100 = MDBX transaction or read failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt numeric forward value; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult + NumericIndex::check_range(const std::string& field, + ndd::idInt id, + uint32_t min_val, + uint32_t max_val) { + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to begin numeric check transaction: " + + std::string(mdbx_strerror(rc))}; + } + + std::string fwd_key_str = make_forward_key(field, id); + MDBX_val fwd_key{const_cast(fwd_key_str.data()), fwd_key_str.size()}; + MDBX_val fwd_val; + + rc = mdbx_get(txn, forward_dbi_, &fwd_key, &fwd_val); + if(rc == MDBX_NOTFOUND) { + mdbx_txn_abort(txn); + return {SUCCESS, "", false}; + } + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + return {100, "Failed to read numeric forward value during check: " + + std::string(mdbx_strerror(rc))}; + } + if(fwd_val.iov_len != sizeof(uint32_t)) { + 
mdbx_txn_abort(txn); + return {200, "Corrupt numeric forward value for field '" + field + "'"}; + } + + uint32_t value; + std::memcpy(&value, fwd_val.iov_base, sizeof(uint32_t)); + mdbx_txn_abort(txn); + return {SUCCESS, "", value >= min_val && value <= max_val}; + } + + } // namespace filter +} // namespace ndd diff --git a/src/filter/numeric_index.hpp b/src/filter/numeric_index.hpp index c002652137..a24bce6cf6 100644 --- a/src/filter/numeric_index.hpp +++ b/src/filter/numeric_index.hpp @@ -1,47 +1,41 @@ #pragma once +#include #include -#include #include -#include -#include -#include -#include +#include + #include "mdbx/mdbx.h" -#include "../utils/log.hpp" #include "../core/types.hpp" +#include "../utils/types.hpp" namespace ndd { namespace filter { + struct NumericBatchEntry { + std::string field; + ndd::idInt id; + uint32_t value; + + NumericBatchEntry(std::string field_in, ndd::idInt id_in, uint32_t value_in); + }; + // --- Sortable Key Utilities --- - inline uint32_t float_to_sortable(float f) { - uint32_t i; - std::memcpy(&i, &f, sizeof(float)); - // IEEE 754: if sign bit set, flip all bits. Else flip just sign. - // This makes negatives < positives order correctly. - uint32_t mask = (int32_t(i) >> 31) | 0x80000000; - return i ^ mask; - } - - inline float sortable_to_float(uint32_t i) { - uint32_t mask = ((i >> 31) - 1) | 0x80000000; - uint32_t result = i ^ mask; - float f; - std::memcpy(&f, &result, sizeof(float)); - return f; - } - - inline uint32_t int_to_sortable(int32_t i) { - return static_cast(i) ^ 0x80000000; - } - - inline int32_t sortable_to_int(uint32_t i) { - return static_cast(i ^ 0x80000000); - } + uint32_t float_to_sortable(float f); + float sortable_to_float(uint32_t i); + uint32_t int_to_sortable(int32_t i); + int32_t sortable_to_int(uint32_t i); // --- Bucket Structure (Hybrid) --- struct Bucket { + /** + * XXX: Ideally this bucket should be page size + * bounded. 
Currently it is difficult to do that + * here because the size of summary_bitmap depends + * on the kind of userspace filter upserts and not + * the number of them. + */ + static constexpr size_t MAX_SIZE = 1024; static constexpr uint32_t MAX_DELTA = 65535; @@ -55,153 +49,44 @@ namespace ndd { bool is_dirty = false; + static ndd::OperationResult + read_bitmap_payload(const uint8_t* data, size_t len); + // Helper to get actual value - uint32_t get_value(size_t index) const { - return base_value + deltas[index]; - } - - void add(uint32_t val, ndd::idInt id) { - if (val < base_value) { - // Should not happen if Key logic is correct - throw std::runtime_error("Insert value < Base Value"); - } - uint32_t delta_32 = val - base_value; - if (delta_32 > MAX_DELTA) { - throw std::runtime_error("Delta overflow"); - } - - // Maintain sorted order by Value (Delta) - uint16_t delta = static_cast(delta_32); - - // Find insertion point - auto it = std::lower_bound(deltas.begin(), deltas.end(), delta); - size_t index = std::distance(deltas.begin(), it); - - deltas.insert(it, delta); - ids.insert(ids.begin() + index, id); - - summary_bitmap.add(id); - is_dirty = true; - } - - bool remove(ndd::idInt id) { - // Find index by ID (linear scan needed as ids are not sorted) - for (size_t i = 0; i < ids.size(); ++i) { - if (ids[i] == id) { - ids.erase(ids.begin() + i); - deltas.erase(deltas.begin() + i); - - // Rebuild or update bitmap? 
Roaring remove is fast - summary_bitmap.remove(id); - is_dirty = true; - return true; - } - } - return false; - } - - // Serialization Format: - // [BitmapSize (4)] - // [Bitmap Bytes] - // [Count (2)] - // [Deltas (Count * 2)] - // [IDs (Count * sizeof(idInt))] - std::vector serialize() const { - // Optimize bitmap - const_cast(summary_bitmap).runOptimize(); - - size_t bm_size = summary_bitmap.getSizeInBytes(); - uint16_t count = static_cast(ids.size()); - - size_t total_size = 4 + bm_size + 2 + (count * 2) + (count * sizeof(ndd::idInt)); - std::vector buffer(total_size); - uint8_t* ptr = buffer.data(); - - // 1. Bitmap Header - uint32_t bm_size_32 = static_cast(bm_size); - std::memcpy(ptr, &bm_size_32, 4); ptr += 4; - - // 2. Bitmap Data - if (bm_size > 0) { - summary_bitmap.write(reinterpret_cast(ptr)); - ptr += bm_size; - } - - // 3. Count - std::memcpy(ptr, &count, 2); ptr += 2; - - // 4. Deltas - if (count > 0) { - std::memcpy(ptr, deltas.data(), count * 2); ptr += count * 2; - } - - // 5. IDs - if (count > 0) { - std::memcpy(ptr, ids.data(), count * sizeof(ndd::idInt)); - } - - return buffer; - } - - static Bucket deserialize(const void* data, size_t len, uint32_t base_val) { - Bucket b; - b.base_value = base_val; - - if (len < 6) return b; // Min valid size - - const uint8_t* ptr = static_cast(data); - const uint8_t* end = ptr + len; - - // 1. Bitmap Size - uint32_t bm_size; - std::memcpy(&bm_size, ptr, 4); ptr += 4; - - if (ptr + bm_size > end) { - throw std::runtime_error("Bucket corrupt: invalid bitmap size"); - } - - // 2. Bitmap - if (bm_size > 0) { - b.summary_bitmap = ndd::RoaringBitmap::read(reinterpret_cast(ptr)); - ptr += bm_size; - } - - if (ptr + 2 > end) throw std::runtime_error("Bucket corrupt: truncated count"); - - // 3. Count - uint16_t count; - std::memcpy(&count, ptr, 2); ptr += 2; - - // 4. 
Deltas & IDs - if (count > 0) { - size_t delta_size = count * 2; - size_t id_size = count * sizeof(ndd::idInt); - - if (ptr + delta_size + id_size > end) { - throw std::runtime_error("Bucket corrupt: truncated Data"); - } - - b.deltas.resize(count); - std::memcpy(b.deltas.data(), ptr, delta_size); ptr += delta_size; - - b.ids.resize(count); - std::memcpy(b.ids.data(), ptr, id_size); - } - - return b; - } - - // Fast access to just the bitmap (for middle buckets) - static ndd::RoaringBitmap read_summary_bitmap(const void* data, size_t len) { - const uint8_t* ptr = static_cast(data); - uint32_t bm_size; - std::memcpy(&bm_size, ptr, 4); ptr += 4; - if(bm_size == 0) return ndd::RoaringBitmap(); - return ndd::RoaringBitmap::read(reinterpret_cast(ptr)); - } - - bool is_full() const { return ids.size() >= MAX_SIZE; } - bool is_empty() const { return ids.empty(); } + uint32_t get_value(size_t index) const; + + void add(uint32_t val, ndd::idInt id); + + bool remove(ndd::idInt id); + + /** + * Serialization Format: + * [BitmapSize (uint32_t)] + * [Bitmap Bytes] + * [Deltas (nr_array_entries * sizeof(uint16_t))] + * [IDs (nr_array_entries * sizeof(idInt))] + * + * nr_array_entries is recovered on read from + * (iov_len - sizeof(uint32_t) - bm_size) + * / (sizeof(uint16_t) + sizeof(idInt)) + */ + std::vector serialize() const; + + static Bucket deserialize(const void* data, size_t len, uint32_t base_val); + + /** + * Fast access to just the bitmap. + * + * Used by range() when a bucket is fully covered by the query + * extent and we don't need the deltas/ids arrays. Skips the + * memcpy + vector allocations that full deserialize would do + * for those arrays. 
+ */ + static ndd::RoaringBitmap read_summary_bitmap(const void* data, + size_t len); + + bool is_full() const; + bool is_empty() const; }; class NumericIndex { @@ -209,440 +94,107 @@ namespace ndd { MDBX_env* env_; MDBX_dbi forward_dbi_; // ID -> Value (Field:ID -> Value) MDBX_dbi inverted_dbi_; // BucketKey -> BucketBlob + static constexpr size_t BATCH_TXN_CHUNK_SIZE = 256; - std::string make_forward_key(const std::string& field, ndd::idInt id) { - return field + ":" + std::to_string(id); - } + std::string make_forward_key(const std::string& field, ndd::idInt id); // Key Format: [Field]:[BigEndian_BaseValue] - std::string make_bucket_key(const std::string& field, uint32_t start_val) { - uint32_t be_val = 0; -#if defined(__GNUC__) || defined(__clang__) - be_val = __builtin_bswap32(start_val); -#else - be_val = ((start_val >> 24) & 0xff) | ((start_val << 8) & 0xff0000) - | ((start_val >> 8) & 0xff00) | ((start_val << 24) & 0xff000000); -#endif - std::string key = field + ":"; - key.append((char*)&be_val, 4); - return key; - } - - uint32_t parse_bucket_key_val(const std::string& key) { - if (key.size() < 4) return 0; - uint32_t be_val; - std::memcpy(&be_val, key.data() + key.size() - 4, 4); -#if defined(__GNUC__) || defined(__clang__) - return __builtin_bswap32(be_val); -#else - return ((be_val >> 24) & 0xff) | ((be_val << 8) & 0xff0000) - | ((be_val >> 8) & 0xff00) | ((be_val << 24) & 0xff000000); -#endif - } - - public: - NumericIndex(MDBX_env* env) : env_(env) { - MDBX_txn* txn; - if (mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn) == MDBX_SUCCESS) { - mdbx_dbi_open(txn, "numeric_forward", MDBX_CREATE, &forward_dbi_); - mdbx_dbi_open(txn, "numeric_inverted", MDBX_CREATE, &inverted_dbi_); - mdbx_txn_commit(txn); - } - } - - void put(const std::string& field, ndd::idInt id, uint32_t value) { - MDBX_txn* txn; - mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); - try { - put_internal(txn, field, id, value); - mdbx_txn_commit(txn); - } catch(...) 
{ - mdbx_txn_abort(txn); - throw; - } - } - - void remove(const std::string& field, ndd::idInt id) { - MDBX_txn* txn; - mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); - try { - std::string fwd_key_str = make_forward_key(field, id); - MDBX_val fwd_key{const_cast(fwd_key_str.data()), fwd_key_str.size()}; - MDBX_val fwd_val; - - if(mdbx_get(txn, forward_dbi_, &fwd_key, &fwd_val) == MDBX_SUCCESS) { - uint32_t old_val; - std::memcpy(&old_val, fwd_val.iov_base, sizeof(uint32_t)); - remove_from_buckets(txn, field, old_val, id); - mdbx_del(txn, forward_dbi_, &fwd_key, nullptr); - } - - mdbx_txn_commit(txn); - } catch(...) { - mdbx_txn_abort(txn); - throw; - } - } - - private: - void put_internal(MDBX_txn* txn, const std::string& field, ndd::idInt id, uint32_t value) { - // 1. Check Forward Index - std::string fwd_key_str = make_forward_key(field, id); - MDBX_val fwd_key{const_cast(fwd_key_str.data()), fwd_key_str.size()}; - MDBX_val fwd_val; - - if (mdbx_get(txn, forward_dbi_, &fwd_key, &fwd_val) == MDBX_SUCCESS) { - uint32_t old_val; - std::memcpy(&old_val, fwd_val.iov_base, 4); - if (old_val == value) return; - remove_from_buckets(txn, field, old_val, id); - } - - // 2. Update Forward - MDBX_val new_val_data{&value, sizeof(uint32_t)}; - mdbx_put(txn, forward_dbi_, &fwd_key, &new_val_data, MDBX_UPSERT); - - // 3. 
Add to Inverted Buckets - add_to_buckets(txn, field, value, id); - } - - void remove_from_buckets(MDBX_txn* txn, const std::string& field, uint32_t value, ndd::idInt id) { - // Find bucket - std::string bkey_str = make_bucket_key(field, value); - MDBX_val key{const_cast(bkey_str.data()), bkey_str.size()}; - MDBX_val data; - MDBX_cursor* cursor; - mdbx_cursor_open(txn, inverted_dbi_, &cursor); - - // Scan backward to find bucket covering 'value' - int rc = mdbx_cursor_get(cursor, &key, &data, MDBX_SET_RANGE); - - // Logic to find correct bucket: - std::string found_key; - - if (rc == MDBX_SUCCESS) { - found_key = std::string((char*)key.iov_base, key.iov_len); - // Check if we are in right field & range - if (found_key.rfind(field + ":", 0) != 0 || parse_bucket_key_val(found_key) > value) { - rc = mdbx_cursor_get(cursor, &key, &data, MDBX_PREV); - } - } else if (rc == MDBX_NOTFOUND) { - rc = mdbx_cursor_get(cursor, &key, &data, MDBX_LAST); - } - - // Should be at correct bucket now - if (rc == MDBX_SUCCESS) { - found_key = std::string((char*)key.iov_base, key.iov_len); - if (found_key.rfind(field + ":", 0) == 0) { - uint32_t bucket_base = parse_bucket_key_val(found_key); - if (value >= bucket_base) { - Bucket b = Bucket::deserialize(data.iov_base, data.iov_len, bucket_base); - if (b.remove(id)) { - // Save back or Delete if empty - if (b.is_empty()) { - mdbx_cursor_del(cursor, static_cast(0)); - } else { - auto bytes = b.serialize(); - MDBX_val new_data{bytes.data(), bytes.size()}; - mdbx_cursor_put(cursor, &key, &new_data, MDBX_CURRENT); - } - } - } - } - } - mdbx_cursor_close(cursor); - } - - void add_to_buckets(MDBX_txn* txn, const std::string& field, uint32_t value, ndd::idInt id) { - MDBX_cursor* cursor; - mdbx_cursor_open(txn, inverted_dbi_, &cursor); - - // Find candidate bucket - std::string search_key = make_bucket_key(field, value); - MDBX_val key{const_cast(search_key.data()), search_key.size()}; - MDBX_val data; - - int rc = mdbx_cursor_get(cursor, &key, 
&data, MDBX_SET_RANGE); - - bool create_new = false; - std::string target_key_str; - uint32_t target_base = 0; - - // Move logic to find predecessor - if (rc == MDBX_SUCCESS) { - std::string found_key((char*)key.iov_base, key.iov_len); - if (found_key.rfind(field + ":", 0) != 0 || parse_bucket_key_val(found_key) > value) { - rc = mdbx_cursor_get(cursor, &key, &data, MDBX_PREV); - } - } else { - rc = mdbx_cursor_get(cursor, &key, &data, MDBX_LAST); - } - - if (rc == MDBX_SUCCESS) { - std::string found_key((char*)key.iov_base, key.iov_len); - if (found_key.rfind(field + ":", 0) == 0) { - target_base = parse_bucket_key_val(found_key); - // Check range condition - if (value >= target_base && (static_cast(value) - target_base) <= Bucket::MAX_DELTA) { - target_key_str = found_key; - } else { - create_new = true; - } - } else { - create_new = true; - } - } else { - create_new = true; - } - - if (create_new) { - // Create new bucket at exact value - Bucket b; - b.base_value = value; - b.add(value, id); - auto bytes = b.serialize(); - - target_key_str = make_bucket_key(field, value); - MDBX_val k{const_cast(target_key_str.data()), target_key_str.size()}; - MDBX_val v{bytes.data(), bytes.size()}; - mdbx_put(txn, inverted_dbi_, &k, &v, MDBX_UPSERT); - - } else { - // Update existing - // We must re-fetch current key/data because cursor move might have updated key/data - MDBX_val k{const_cast(target_key_str.data()), target_key_str.size()}; - MDBX_val v; - if(mdbx_cursor_get(cursor, &k, &v, MDBX_SET) != MDBX_SUCCESS) { - // Should not happen if logic is correct - throw std::runtime_error("Cursor sync fail"); - } - - Bucket b = Bucket::deserialize(v.iov_base, v.iov_len, target_base); - - // Capacity Check - if (b.ids.size() >= Bucket::MAX_SIZE) { - // SPLIT LOGIC - // Sort is maintained by arrays. 
- // "Slide Split": Scan right from median - size_t mid_idx = b.ids.size() / 2; - - // Ensure we don't split a group of identical values - size_t probe_right = mid_idx; - while (probe_right < b.deltas.size() && probe_right > 0 && b.deltas[probe_right] == b.deltas[probe_right - 1]) { - probe_right++; - } - - if (probe_right < b.deltas.size()) { - mid_idx = probe_right; - } else { - // Fallback: Try scanning left - size_t probe_left = mid_idx; - while (probe_left > 0 && b.deltas[probe_left] == b.deltas[probe_left - 1]) { - probe_left--; - } - - if (probe_left > 0) { - mid_idx = probe_left; - } else { - // All identical - mid_idx = b.deltas.size(); - } - } - - // If we hit end, we can't split by value uniqueness - if (mid_idx == b.deltas.size()) { - // Fallback: Just append (overfill) or implement logic to handle identicals. - // For now: Append - b.add(value, id); - auto bytes = b.serialize(); - MDBX_val k2{const_cast(target_key_str.data()), target_key_str.size()}; - MDBX_val v2{bytes.data(), bytes.size()}; - mdbx_cursor_put(cursor, &k2, &v2, MDBX_CURRENT); - mdbx_cursor_close(cursor); - return; - } - - // Standard Slide Split - Bucket right_b; - right_b.base_value = b.base_value + b.deltas[mid_idx]; // New base - - // Move entries - for(size_t i=mid_idx; i= right_b.base_value) { - right_b.add(value, id); - } else { - // If value < right, goes to left. - // But wait, split point was determined by existing items. - // If new value is >= base+split_delta, it goes right. - // BUT we just cleared right from b. - // Correct logic: - b.add(value, id); // Add to left if it fits range (logic handles delta) - // Oh wait, if we added to left, we might overflow again or break order? - // Simply: Check which bucket covers it. - // Left covers [Base, RightBase-1] - // Right covers [RightBase, ...] 
- } - - // Save Left - auto left_bytes = b.serialize(); - MDBX_val left_v{left_bytes.data(), left_bytes.size()}; - MDBX_val left_k{const_cast(target_key_str.data()), target_key_str.size()}; - mdbx_cursor_put(cursor, &left_k, &left_v, MDBX_CURRENT); - - // Save Right - auto right_bytes = right_b.serialize(); - std::string right_k_str = make_bucket_key(field, right_b.base_value); - MDBX_val right_k{const_cast(right_k_str.data()), right_k_str.size()}; - MDBX_val right_v{right_bytes.data(), right_bytes.size()}; - - // Use put for new key - mdbx_put(txn, inverted_dbi_, &right_k, &right_v, MDBX_UPSERT); - - } else { - // Normal Insert - b.add(value, id); - auto bytes = b.serialize(); - MDBX_val new_data{bytes.data(), bytes.size()}; - - // Use cursor put to update current - mdbx_cursor_put(cursor, &k, &new_data, MDBX_CURRENT); - } - } - mdbx_cursor_close(cursor); - } + std::string make_bucket_key(const std::string& field, uint32_t start_val); + + uint32_t parse_bucket_key_val(const std::string& key); + + /* + * Removes one id from the numeric inverted bucket that currently owns its old value. + * + * Return codes: + * 0 = success + * 100 = MDBX cursor, read, delete, or write failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt numeric bucket payload; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult<> remove_from_buckets(MDBX_txn* txn, + const std::string& field, + uint32_t value, + ndd::idInt id); + + /* + * Adds one id/value pair into the numeric inverted bucket index. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX cursor, read, or write failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt numeric bucket payload or invalid bucket invariant; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult<> add_to_buckets(MDBX_txn* txn, + const std::string& field, + uint32_t value, + ndd::idInt id); + + /* + * Writes one numeric forward entry and updates the inverted buckets inside a caller transaction. + * + * Return codes: + * 0 = success + * 100 = MDBX read or write failure; caller should log ERROR and return HTTP 500 + * 100-199 = propagated MDBX/storage failure from bucket helpers + * 200 = corrupt numeric forward value; caller should log ERROR and return HTTP 500 + * 200-299 = propagated corruption/invariant failure from bucket helpers + */ + ndd::OperationResult<> put_internal(MDBX_txn* txn, + const std::string& field, + ndd::idInt id, + uint32_t value); public: - ndd::RoaringBitmap range(const std::string& field, uint32_t min_val, uint32_t max_val) { - ndd::RoaringBitmap result; - MDBX_txn* txn; - if (mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn) != MDBX_SUCCESS) return result; - - MDBX_cursor* cursor; - mdbx_cursor_open(txn, inverted_dbi_, &cursor); - - // 1. 
Find Start Bucket - std::string start_k = make_bucket_key(field, min_val); - MDBX_val key{const_cast(start_k.data()), start_k.size()}; - MDBX_val data; - - int rc = mdbx_cursor_get(cursor, &key, &data, MDBX_SET_RANGE); - if (rc == MDBX_SUCCESS) { - // Check if we need to back up - std::string fkey((char*)key.iov_base, key.iov_len); - if (fkey.rfind(field + ":", 0) != 0 || parse_bucket_key_val(fkey) > min_val) { - // Check prev - MDBX_val p_key = key; - MDBX_val p_data; - if (mdbx_cursor_get(cursor, &p_key, &p_data, MDBX_PREV) == MDBX_SUCCESS) { - std::string pkey_str((char*)p_key.iov_base, p_key.iov_len); - if (pkey_str.rfind(field + ":", 0) == 0) { - // Prev is valid start - key = p_key; data = p_data; - rc = MDBX_SUCCESS; - } - } - } - } else if (rc == MDBX_NOTFOUND) { - rc = mdbx_cursor_get(cursor, &key, &data, MDBX_LAST); - if (rc == MDBX_SUCCESS && data.iov_len > 0) { - std::string fkey((char*)key.iov_base, key.iov_len); - if (fkey.rfind(field + ":", 0) == 0) { - rc = MDBX_SUCCESS; - } else { - rc = MDBX_NOTFOUND; - } - } else { - rc = MDBX_NOTFOUND; - } - } - - // Iterate forward - while (rc == MDBX_SUCCESS) { - std::string cur_key((char*)key.iov_base, key.iov_len); - if (cur_key.rfind(field + ":", 0) != 0) break; // End of field - - uint32_t bucket_base = parse_bucket_key_val(cur_key); - - if (bucket_base > max_val) break; // Past the end - - // Peek Strategy: - // If bucket_base >= min_val, we know the start is covered. - // If we could know NEXT bucket start, we'd know overlap. - // Since we iterate, we can be greedy on read. - - // For now, always deserialize. - // Potential optimization: Read only bitmap if we are "deep" in the range. - // e.g. min_val=10, max_val=100. Bucket=20. - // If bucket=20. Next Bucket=30. - // Then Bucket 20 covers [20..30). - // Range [10..100] covers [20..30] fully. - // So we need lookahead. - - // Simple logic without lookahead: - // Just read full bucket. It's 8KB max (2 pages). 
- // It's fast unless we have millions of buckets. - - Bucket b = Bucket::deserialize(data.iov_base, data.iov_len, bucket_base); - - if (b.ids.empty()) { - rc = mdbx_cursor_get(cursor, &key, &data, MDBX_NEXT); - continue; - } - - uint32_t b_min = b.get_value(0); - uint32_t b_max = b.get_value(b.ids.size()-1); - - if (b_min >= min_val && b_max <= max_val) { - // Full overlap - result |= b.summary_bitmap; - } else { - // Partial overlap - for(size_t i=0; i= min_val && v <= max_val) { - result.add(b.ids[i]); - } - } - } - - rc = mdbx_cursor_get(cursor, &key, &data, MDBX_NEXT); - } - - mdbx_cursor_close(cursor); - mdbx_txn_abort(txn); - return result; - } - - bool check_range(const std::string& field, ndd::idInt id, uint32_t min_val, uint32_t max_val) { - MDBX_txn* txn; - if(mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn) != MDBX_SUCCESS) return false; - - std::string fwd_key_str = make_forward_key(field, id); - MDBX_val fwd_key{const_cast(fwd_key_str.data()), fwd_key_str.size()}; - MDBX_val fwd_val; - - bool match = false; - if(mdbx_get(txn, forward_dbi_, &fwd_key, &fwd_val) == MDBX_SUCCESS) { - uint32_t val; - std::memcpy(&val, fwd_val.iov_base, 4); - if(val >= min_val && val <= max_val) match = true; - } - - mdbx_txn_abort(txn); - return match; - } + NumericIndex(MDBX_env* env); + + /* + * Writes a batch of numeric filter entries in bounded MDBX write transaction chunks. + * + * Return codes: + * 0 = success + * 100 = MDBX transaction or commit failure; caller should log ERROR and return HTTP 500 + * 100-199 = propagated MDBX/storage failure from per-entry writes + * 200-299 = propagated corruption/invariant failure from per-entry writes + */ + ndd::OperationResult<> put_batch(const std::vector& entries); + + /* + * Removes one id from the numeric forward and inverted indexes for a field. 
+ * + * Return codes: + * 0 = success + * 100 = MDBX transaction, read, delete, or commit failure; caller should log ERROR and return HTTP 500 + * 100-199 = propagated MDBX/storage failure from bucket helpers + * 200 = corrupt numeric forward value; caller should log ERROR and return HTTP 500 + * 200-299 = propagated corruption/invariant failure from bucket helpers + */ + ndd::OperationResult<> remove(const std::string& field, ndd::idInt id); + + /* + * Computes a bitmap of ids whose numeric field value falls within an inclusive sortable range. + * + * Return codes: + * 0 = success + * 100 = MDBX transaction, cursor, or scan failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt numeric bucket payload; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult + range(const std::string& field, uint32_t min_val, uint32_t max_val); + + /* + * Checks whether one id has a numeric field value inside an inclusive sortable range. + * + * Return codes: + * 0 = success + * 100 = MDBX transaction or read failure; caller should log ERROR and return HTTP 500 + * 200 = corrupt numeric forward value; caller should log ERROR and return HTTP 500 + */ + ndd::OperationResult + check_range(const std::string& field, + ndd::idInt id, + uint32_t min_val, + uint32_t max_val); }; - } // namespace filter -} // namespace ndd + } // namespace filter +} // namespace ndd diff --git a/src/main.cpp b/src/main.cpp index 4654a54c20..934ab1b5aa 100644 --- a/src/main.cpp +++ b/src/main.cpp @@ -37,6 +37,7 @@ #include "core/ndd.hpp" #include "auth.hpp" #include "quant/common.hpp" +#include "server/request_validation.hpp" #include "system_sanity/system_sanity.hpp" using ndd::quant::quantLevelToString; @@ -88,6 +89,21 @@ inline crow::response json_error(int code, const std::string& message) { crow::json::wvalue err_json({{"error", message}}); return crow::response(code, err_json.dump()); } + + +/** + * OperationResult code ranges are the contract between core/filter code and 
the HTTP + * boundary: SUCCESS means success, 1-99 means the request was rejected for caller-fixable + * input such as filter validation, and 100+ means storage/internal/corruption failure. + * When adding an OperationResult-returning function, document its code ranges and keep + * client-correctable errors below 100 so this helper maps them to HTTP 400 instead of + * the 500 path. + */ +template +inline bool operation_error_is_client_error(const ndd::OperationResult& result) { + return result.code > SUCCESS && result.code < 100; +} + // Special helper function to log and send error messages in JSON format for 500 errors inline crow::response json_error_500(const std::string& username, const std::string& index_name, @@ -207,7 +223,7 @@ int main(int argc, char** argv) { } if(!run_startup_sanity_checks()) { - LOG_ERROR(1799, "Server startup aborted due to failed sanity checks"); + LOG_ERROR(1076, "Server startup aborted due to failed sanity checks"); return 1; } @@ -822,14 +838,33 @@ int main(int argc, char** argv) { // Extract filter parameters (Option B from chat plan) ndd::FilterParams filter_params; - if (body.has("filter_params")) { - auto fp = body["filter_params"]; - if (fp.has("prefilter_threshold")) { - filter_params.prefilter_threshold = static_cast(fp["prefilter_threshold"].i()); - } - if (fp.has("boost_percentage")) { - filter_params.boost_percentage = static_cast(fp["boost_percentage"].i()); - } + if(body.has("filter_params")) { + auto fp = body["filter_params"]; + if(fp.t() != crow::json::type::Object) { + return json_error(400, "filter_params must be an object"); + } + if(fp.has("prefilter_threshold")) { + auto prefilter_threshold = ndd::server::parse_bounded_size( + fp["prefilter_threshold"], + "filter_params.prefilter_threshold", + 0, + settings::MAX_VECTORS_ADMIN); + if(!prefilter_threshold.ok()) { + return json_error(400, prefilter_threshold.message); + } + filter_params.prefilter_threshold = prefilter_threshold.value_or_throw(); + } + 
if(fp.has("boost_percentage")) { + auto boost_percentage = + ndd::server::parse_bounded_size(fp["boost_percentage"], + "filter_params.boost_percentage", + 0, + 100); + if(!boost_percentage.ok()) { + return json_error(400, boost_percentage.message); + } + filter_params.boost_percentage = boost_percentage.value_or_throw(); + } } float dense_rrf_weight = body.has("dense_rrf_weight") ? (float)body["dense_rrf_weight"].d() : settings::DEFAULT_DENSE_RRF_WEIGHT; @@ -854,14 +889,23 @@ int main(int argc, char** argv) { dense_rrf_weight, rrf_rank_constant); - if(!search_response) { - LOG_WARN(1038, ctx.username, index_name, "Search request returned no results because the index is missing or search failed"); - return json_error(404, "Index not found or search failed"); + if(!search_response.ok()) { + if(operation_error_is_client_error(search_response)) { + LOG_WARN(1075, + ctx.username, + index_name, + "Search request rejected: " << search_response.message); + return json_error(400, search_response.message); + } + return json_error_500(ctx.username, + index_name, + req.url, + search_response.message); } // Serialize the ResultSet using MessagePack msgpack::sbuffer sbuf; - msgpack::pack(sbuf, search_response.value()); + msgpack::pack(sbuf, search_response.value_or_throw()); crow::response resp(200, std::string(sbuf.data(), sbuf.size())); resp.add_header("Content-Type", "application/msgpack"); return resp; @@ -955,8 +999,21 @@ int main(int argc, char** argv) { } try { - bool success = index_manager.addVectors(index_id, vectors); - if(!success) { + auto insert_result = index_manager.addVectors(index_id, vectors); + if(!insert_result.ok()) { + if(operation_error_is_client_error(insert_result)) { + LOG_WARN(1069, + ctx.username, + index_name, + "Insert request rejected: " << insert_result.message); + return json_error(400, insert_result.message); + } + return json_error_500(ctx.username, + index_name, + req.url, + insert_result.message); + } + if(!insert_result.value_or_throw()) { 
LOG_WARN(1066, ctx.username, index_name, @@ -980,8 +1037,21 @@ int main(int argc, char** argv) { // Try HybridVectorObject first auto vectors = obj.as>(); LOG_DEBUG("Batch size (Hybrid): " << vectors.size()); - bool success = index_manager.addVectors(index_id, vectors); - if(!success) { + auto insert_result = index_manager.addVectors(index_id, vectors); + if(!insert_result.ok()) { + if(operation_error_is_client_error(insert_result)) { + LOG_WARN(1070, + ctx.username, + index_name, + "Insert request rejected: " << insert_result.message); + return json_error(400, insert_result.message); + } + return json_error_500(ctx.username, + index_name, + req.url, + insert_result.message); + } + if(!insert_result.value_or_throw()) { LOG_WARN(1067, ctx.username, index_name, @@ -993,8 +1063,21 @@ int main(int argc, char** argv) { // Fallback to VectorObject auto vectors = obj.as>(); LOG_DEBUG("Batch size (Dense): " << vectors.size()); - bool success = index_manager.addVectors(index_id, vectors); - if(!success) { + auto insert_result = index_manager.addVectors(index_id, vectors); + if(!insert_result.ok()) { + if(operation_error_is_client_error(insert_result)) { + LOG_WARN(1071, + ctx.username, + index_name, + "Insert request rejected: " << insert_result.message); + return json_error(400, insert_result.message); + } + return json_error_500(ctx.username, + index_name, + req.url, + insert_result.message); + } + if(!insert_result.value_or_throw()) { LOG_WARN(1068, ctx.username, index_name, @@ -1066,7 +1149,21 @@ int main(int argc, char** argv) { LOG_DEBUG("Deleting vector " << vector_id << " from index " << index_id); try { - if(index_manager.deleteVector(index_id, vector_id)) { + auto delete_result = index_manager.deleteVector(index_id, vector_id); + if(!delete_result.ok()) { + if(operation_error_is_client_error(delete_result)) { + LOG_WARN(1072, + ctx.username, + index_name, + "Delete-vector request rejected: " << delete_result.message); + return json_error(400, 
delete_result.message); + } + return json_error_500(ctx.username, + index_name, + req.url, + delete_result.message); + } + if(delete_result.value_or_throw()) { return crow::response(200, "Vector deleted successfully"); } else { LOG_WARN(1046, ctx.username, index_name, "Delete-vector request for missing vector id " << vector_id); @@ -1112,10 +1209,25 @@ int main(int argc, char** argv) { "Filter must be an array. Please use format: " "[{\"field\":{\"$op\":value}}]"); } - size_t deleted_count = + auto delete_result = index_manager.deleteVectorsByFilter(index_id, filter_array); + if(!delete_result.ok()) { + if(operation_error_is_client_error(delete_result)) { + LOG_WARN(1073, + ctx.username, + index_name, + "Delete-by-filter request rejected: " << delete_result.message); + return json_error(400, delete_result.message); + } + return json_error_500(ctx.username, + index_name, + req.url, + delete_result.message); + } - return crow::response(200, std::to_string(deleted_count) + " vectors deleted"); + return crow::response(200, + std::to_string(delete_result.value_or_throw()) + + " vectors deleted"); } catch(const std::runtime_error& e) { LOG_WARN(1051, ctx.username, index_name, "Delete-by-filter request rejected: " << e.what()); return json_error(400, e.what()); @@ -1162,8 +1274,23 @@ int main(int argc, char** argv) { updates.emplace_back(id, filter); } - size_t count = index_manager.updateFilters(index_id, updates); - return crow::response(200, std::to_string(count) + " filters updated"); + auto update_result = index_manager.updateFilters(index_id, updates); + if(!update_result.ok()) { + if(operation_error_is_client_error(update_result)) { + LOG_WARN(1074, + ctx.username, + index_name, + "Update-filters request rejected: " << update_result.message); + return json_error(400, update_result.message); + } + return json_error_500(ctx.username, + index_name, + req.url, + update_result.message); + } + return crow::response(200, + std::to_string(update_result.value_or_throw()) + 
+ " filters updated"); } catch(const std::runtime_error& e) { LOG_WARN(1054, ctx.username, index_name, "Update-filters request rejected: " << e.what()); diff --git a/src/server/request_validation.hpp b/src/server/request_validation.hpp new file mode 100644 index 0000000000..c8838b31d6 --- /dev/null +++ b/src/server/request_validation.hpp @@ -0,0 +1,59 @@ +#pragma once + +#include +#include +#include +#include + +#include "crow/json.h" +#include "utils/types.hpp" + +namespace ndd::server { + +inline std::string bounded_size_error(const std::string& field_name, size_t min_value, size_t max_value) { + return field_name + " must be between " + std::to_string(min_value) + " and " + + std::to_string(max_value); +} + +inline ndd::OperationResult +parse_bounded_size(const crow::json::rvalue& value, + const std::string& field_name, + size_t min_value, + size_t max_value) { + try { + if(value.t() != crow::json::type::Number) { + return {1, field_name + " must be an integer"}; + } + + const auto number_type = value.nt(); + if(number_type == crow::json::num_type::Floating_point + || number_type == crow::json::num_type::Double_precision_floating_point) { + return {1, field_name + " must be an integer"}; + } + + size_t parsed_value = 0; + if(number_type == crow::json::num_type::Unsigned_integer) { + const uint64_t unsigned_value = value.u(); + if(unsigned_value > static_cast(max_value)) { + return {1, bounded_size_error(field_name, min_value, max_value)}; + } + parsed_value = static_cast(unsigned_value); + } else { + const int64_t signed_value = value.i(); + if(signed_value < 0) { + return {1, bounded_size_error(field_name, min_value, max_value)}; + } + parsed_value = static_cast(signed_value); + } + + if(parsed_value < min_value || parsed_value > max_value) { + return {1, bounded_size_error(field_name, min_value, max_value)}; + } + + return {SUCCESS, "", parsed_value}; + } catch(const std::exception&) { + return {1, field_name + " must be an integer"}; + } +} + +} // namespace 
ndd::server diff --git a/src/storage/vector_storage.hpp b/src/storage/vector_storage.hpp index 8ca7f56ab9..acd35e6ba2 100644 --- a/src/storage/vector_storage.hpp +++ b/src/storage/vector_storage.hpp @@ -13,6 +13,7 @@ #include #include #include +#include // Handles vector storage class VectorStore { @@ -339,6 +340,40 @@ class VectorStore { } } + template + size_t visit_vectors_by_ids(const std::vector& numeric_ids, + Visitor&& visitor) const { + if(numeric_ids.empty()) { + return 0; + } + + MDBX_txn* txn; + int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_RDONLY, &txn); + if(rc != MDBX_SUCCESS) { + throw std::runtime_error(std::string("Failed to begin transaction: ") + mdbx_strerror(rc)); + } + + size_t visited = 0; + try { + for(const auto& numeric_id : numeric_ids) { + MDBX_val key{const_cast(&numeric_id), sizeof(ndd::idInt)}; + MDBX_val data; + + rc = mdbx_get(txn, dbi_, &key, &data); + if(rc == MDBX_SUCCESS && data.iov_len == bytes_per_vector_) { + visitor(numeric_id, static_cast(data.iov_base)); + visited++; + } + } + + mdbx_txn_abort(txn); + return visited; + } catch(...) { + mdbx_txn_abort(txn); + throw; + } + } + void remove(ndd::idInt numeric_id) { MDBX_txn* txn; int rc = mdbx_txn_begin(env_, nullptr, MDBX_TXN_READWRITE, &txn); @@ -558,19 +593,30 @@ class VectorStorage { filter_store_ = std::make_unique(base_path + "/filters", index_id_); } VectorStore::Cursor getCursor() { return vector_store_->getCursor(); } - // Get numeric ids of matching filters - std::vector getIdsMatchingFilters( + /* + * Returns numeric ids matching legacy category filter pairs. 
+ * + * Return codes: + * 0 = success + * 100-199 = propagated MDBX/storage failure from filter store + * 200-299 = propagated corruption/invariant failure from filter store + */ + ndd::OperationResult> getIdsMatchingFilters( const std::vector>& filter_pairs) const { - auto bitmap = filter_store_->combine_filters_and(filter_pairs); + auto bitmap_result = filter_store_->combine_filters_and(filter_pairs); + if(!bitmap_result.ok()) { + return {bitmap_result.code, bitmap_result.message}; + } + std::vector numeric_ids; - bitmap.iterate( + bitmap_result.value_or_throw().iterate( [](ndd::idInt value, void* ptr) -> bool { auto* ids = static_cast*>(ptr); ids->push_back(value); return true; }, &numeric_ids); - return numeric_ids; + return {SUCCESS, "", std::move(numeric_ids)}; } bool matches_filter(ndd::idInt numeric_id, @@ -606,7 +652,8 @@ class VectorStorage { } if(is_numeric_query) { - if(!filter_store_->check_numeric(field, numeric_id, op, val)) { + auto check_result = filter_store_->check_numeric(field, numeric_id, op, val); + if(!check_result.ok() || !check_result.value_or_throw()) { return false; } } else { @@ -681,14 +728,160 @@ class VectorStorage { } } - // Optimized batch operation using pre-quantized QuantVectorObject - // This avoids double quantization by using already quantized data - void store_vectors_batch(const std::vector>& vectors) { + /* + * Stores vectors, metadata, and associated filter documents for one pre-quantized batch. + * + * High-level shape: + * 1. Cleanup pass: for every entry that is an upsert of an already-live numeric_id, + * read its previous meta.filter and remove the corresponding entries from the + * filter index. Without this step every prior filter value would remain matchable + * via the category / numeric indexes even though the vector now carries a + * different filter document. + * 2. Write the new vector bytes (vector_store_). + * 3. Overwrite meta (meta_store_) — this is where meta.filter takes its new value. + * 4. 
Add the new filter index entries (filter_store_). + * + * `is_new_to_db[i]` mirrors the id_mapper's "did this str_id already exist?" signal: + * - true : the str_id was NOT in the id_mapper when this batch began. That covers + * both genuinely fresh ids and reuses of a previously-deleted slot. In the + * reuse case the old filter index entries were already scrubbed at delete + * time (see deletePoint / deleteFilter), so there is nothing to clean up. + * - false : the str_id was already mapped to this numeric_id, i.e. this is an upsert + * of a live point. Its prior filter index entries are still present and + * must be removed before the new filter is added — otherwise queries with + * the OLD filter value will keep matching this id. + * + * If `is_new_to_db` is empty (default), the caller has not opted into the cleanup + * contract and we conservatively skip the cleanup pass entirely. This preserves the + * pre-fix semantics for any caller that has not yet been updated. New callers should + * always pass the id_mapper signal. + * + * Atomicity, by design (and constrained by the filter roadmap): + * - The cleanup pass, vector_store, meta_store, and filter_store writes are each + * internally transactional, but the four phases are NOT a single distributed + * transaction. A crash between phases leaves torn state (e.g. old filter index + * entries removed but new vector / meta not written). + * - `updateFilter` already operates under the same constraint; cross-store ACID + * work is tracked separately in the filter roadmap. + * + * Limitations: + * - This patch only prevents NEW stale filter index entries from accumulating. It + * does not retroactively scrub entries left behind by previous upserts written + * before the fix landed. A targeted rebuild is required to clean historical drift. + * - The cleanup pass issues one MDBX read per upsert id to fetch the prior meta. 
+ * For a batch that is mostly fresh inserts (the common case) this cost stays low; + * a batch dominated by upserts will see N extra reads. + * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from filter store, or argument shape + * 100-199 = propagated MDBX/storage failure from filter or meta store + * 200-299 = propagated corruption/invariant failure from filter store + */ + ndd::OperationResult<> + store_vectors_batch(const std::vector>& vectors, + const std::vector& is_new_to_db = {}) { if(vectors.empty()) { - return; + return {SUCCESS, ""}; } - // Prepare vector and meta batches + /* + * `have_flags` distinguishes the new opt-in cleanup contract from legacy callers + * that pass nothing. When flags are present they must match the batch one-to-one; + * a size mismatch is a programmer error and we surface it rather than silently + * applying the cleanup to a misaligned subset of the batch. + */ + const bool have_flags = !is_new_to_db.empty(); + if(have_flags && is_new_to_db.size() != vectors.size()) { + LOG_ERROR(1223, + index_id_, + "store_vectors_batch: is_new_to_db size mismatch (" + << is_new_to_db.size() << " vs " << vectors.size() << ")"); + return {1, "store_vectors_batch: is_new_to_db size mismatch"}; + } + + /* + * ---- Phase 1: upsert cleanup ---- + * + * For each entry the id_mapper flagged as already-live (is_new_to_db == false), + * read its previous meta.filter and remove the corresponding filter index entries. + * We do this BEFORE writing the new meta in phase 3, because the new meta would + * overwrite the only record of which filter document used to be associated with + * this id — and once that record is gone, we cannot tell the filter index which + * entries belong to "the old filter" anymore. 
+ * + * Skipping the entire pass when flags are absent is intentional: without the + * id_mapper signal we cannot tell apart a fresh slot (no cleanup needed) from + * an upsert (cleanup required), so trying to "always clean up" would issue + * get_meta() on every fresh id and either throw or short-circuit on empty. + */ + if(have_flags) { + for(size_t i = 0; i < vectors.size(); ++i) { + // Fresh slot or reuse of a deleted slot — nothing to clean. + if(is_new_to_db[i]) { + continue; + } + ndd::idInt numeric_id = vectors[i].first; + + /* + * Fetch the prior filter document. This is the only point where we can + * recover what the OLD filter was; once we overwrite meta in phase 3 it + * is gone. We pay one MDBX read per upserted id here. + */ + std::string old_filter; + try { + old_filter = meta_store_->get_meta(numeric_id).filter; + } catch(const std::exception& e) { + /* + * Mapper says this numeric_id is already live, but its meta cannot + * be loaded. That contradiction means an earlier write was torn + * (e.g. id_mapper got committed but meta did not). Surfacing this + * is preferable to silently overwriting: the operator can then + * decide whether to repair via rebuild, and the user gets HTTP 500 + * instead of a "successful" write that leaves the index inconsistent. + */ + LOG_ERROR(1224, + index_id_, + "Upsert cleanup: meta missing for existing numeric_id " + << numeric_id << ": " << e.what()); + return {103, + "Upsert cleanup: meta missing for numeric_id " + + std::to_string(numeric_id) + ": " + e.what()}; + } + + /* + * The previous version of this vector had no filter document, so there + * is nothing in the filter index to remove. Common after deleteFilter + * or after an insert that omitted filters entirely. + */ + if(old_filter.empty()) { + continue; + } + + /* + * Drop the old filter's category and numeric index entries for this id. 
+ * Any failure here aborts the batch — partially-cleaned state would be + * worse than the original drift, because the bitmap would no longer + * match meta.filter even temporarily. + */ + auto remove_result = + filter_store_->remove_filters_from_json(numeric_id, old_filter); + if(!remove_result.ok()) { + LOG_ERROR(1225, + index_id_, + "Upsert cleanup: failed to remove old filter for numeric_id " + << numeric_id << " (code=" << remove_result.code + << "): " << remove_result.message); + return remove_result; + } + } + } + + /* + * ---- Phase 2 prep: assemble per-store batches from the input ---- + * We unzip the input vector into one batch per backing store so each store can + * commit its batch in a single MDBX transaction. + */ std::vector>> vector_batch; std::vector> meta_batch; std::vector> filter_batch; @@ -698,10 +891,17 @@ class VectorStorage { filter_batch.reserve(vectors.size()); for(const auto& [numeric_id, quant_obj] : vectors) { - // Use pre-quantized data directly - no conversion needed! + /* + * The vector bytes were quantized upstream (HNSW path) so we can store them + * verbatim; copying here only because store_vectors_batch wants ownership. + */ std::vector vector_bytes = quant_obj.quant_vector; - // Create metadata from QuantVectorObject + /* + * VectorMeta is the durable record of what filter document this id carries. + * After phase 3 overwrites it, get_meta() returns these new values and the + * upsert-cleanup pass on a future upsert will read THIS old_filter to drop. + */ ndd::VectorMeta meta; meta.id = quant_obj.id; meta.filter = quant_obj.filter; @@ -711,20 +911,39 @@ class VectorStorage { vector_batch.emplace_back(numeric_id, std::move(vector_bytes)); meta_batch.emplace_back(numeric_id, std::move(meta)); - // Collect filter data for batch processing + /* + * Empty filter docs are intentionally excluded: there is nothing to add to + * the filter index. 
Meta.filter still records the empty string so the next + * upsert's cleanup pass correctly observes "no prior filter to remove". + */ if(!quant_obj.filter.empty()) { filter_batch.emplace_back(numeric_id, quant_obj.filter); } } - // Store vectors and metadata in single transactions + // Phase 2: write vector bytes. One MDBX txn for the whole batch inside vector_store_. vector_store_->store_vectors_batch(vector_batch); + + /* + * Phase 3: overwrite meta. This makes meta.filter authoritative for the new + * state. After this point, get_meta() returns the new filter document — any + * later upsert-cleanup pass on this id will use it as the "old" value to + * remove from the filter index. + */ meta_store_->store_meta_batch(meta_batch); - // Process filter data in batch if any + /* + * Phase 4: add new filter index entries. The filter store iterates the batched + * JSON documents and inserts the appropriate category and numeric index + * entries for each id. + */ if(!filter_batch.empty()) { - filter_store_->add_filters_from_json_batch(filter_batch); + auto filter_result = filter_store_->add_filters_from_json_batch(filter_batch); + if(!filter_result.ok()) { + return filter_result; + } } + return {SUCCESS, ""}; } std::vector get_vector(ndd::idInt numeric_id) const { @@ -745,41 +964,150 @@ class VectorStorage { get_vectors_batch(const std::vector& numeric_ids) const { return vector_store_->get_vectors_batch(numeric_ids); } + + template + size_t visit_vectors_by_ids(const std::vector& numeric_ids, + Visitor&& visitor) const { + return vector_store_->visit_vectors_by_ids( + numeric_ids, + std::forward(visitor)); + } + ndd::VectorMeta get_meta(ndd::idInt numeric_id) const { return meta_store_->get_meta(numeric_id); } - // NOT used anymore. Deletes filter, meta and vector data. - void deletePoint(ndd::idInt numeric_id) { + /* + * Deletes filter, metadata, and vector data for one numeric id. 
+ * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from filter store + * 100-199 = propagated MDBX/storage failure from filter store + * 200-299 = propagated corruption/invariant failure from filter store + */ + ndd::OperationResult<> deletePoint(ndd::idInt numeric_id) { try { // Get metadata first to get filter info auto meta = meta_store_->get_meta(numeric_id); // Remove filter entries if they exist if(!meta.filter.empty()) { - filter_store_->remove_filters_from_json(numeric_id, meta.filter); + auto filter_result = filter_store_->remove_filters_from_json(numeric_id, meta.filter); + if(!filter_result.ok()) { + return filter_result; + } } // Try to remove both vector and meta data vector_store_->remove(numeric_id); meta_store_->remove(numeric_id); + return {SUCCESS, ""}; } catch(const std::exception& e) { - throw std::runtime_error(std::string("Failed to remove vector and metadata: ") - + e.what()); + return {100, std::string("Failed to remove vector and metadata: ") + e.what()}; } } - // Deletes filter only. - void deleteFilter(ndd::idInt numeric_id, std::string filter) { - filter_store_->remove_filters_from_json(numeric_id, filter); + + /* + * Deletes filter index entries for one numeric id and keeps `meta.filter` in sync. + * + * Why both? The filter index (category + numeric) and meta.filter are two records + * of the same fact ("this vector matches the following filter document"). If we + * remove from the index but leave meta.filter populated, a later get_meta() returns + * a JSON document whose index entries are gone — searches via that filter no longer + * return this id, even though meta still advertises the filter. Other code paths + * (notably the upsert cleanup in store_vectors_batch) read meta.filter as the + * source of truth for "what is the prior filter" and would incorrectly try to + * remove already-removed entries. Keeping them in lockstep avoids both confusions. 
+ * + * Contract: + * - The caller passes the exact filter document being removed. The single + * in-tree caller is deleteVectorsByIds at ndd.hpp, which always passes the + * entire meta.filter for a full filter clear. + * - If meta.filter matches the input, it is cleared in-place. + * - If meta.filter differs (caller is asking to remove a partial document or + * something that does not match the current state), we leave meta alone — the + * index removal is still performed best-effort, but we do not over-clear meta + * because we cannot tell which subset of meta.filter the caller intended. + * + * Atomicity / limitations: + * - Index removal and meta sync are separate MDBX transactions. A crash between + * them leaves meta.filter populated while index entries are gone (the very + * drift this function is meant to prevent on the happy path). Cross-store + * ACID is tracked separately in the filter roadmap. + * - Meta read or write failure AFTER successful index removal is surfaced as + * code 102 so the caller can return 500. We do NOT try to re-add the index + * entries on rollback — that would itself require another transaction and + * could also fail. The operator is expected to repair via rebuild if this + * ever fires. + * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from filter store + * 100-199 = propagated MDBX/storage failure from filter or meta store + * 200-299 = propagated corruption/invariant failure from filter store + */ + ndd::OperationResult<> deleteFilter(ndd::idInt numeric_id, std::string filter) { + /* + * Step 1: remove the index entries first. If this fails we have not touched + * meta yet — caller gets a clean error, no drift introduced. + */ + auto remove_result = filter_store_->remove_filters_from_json(numeric_id, filter); + if(!remove_result.ok()) { + return remove_result; + } + + /* + * Step 2: sync meta.filter. 
We only clear it when it matches the caller's + * input — see the contract note above for why we cannot just unconditionally + * clear meta.filter. The empty-check is a fast path for ids that already + * have no filter recorded. + */ + try { + auto meta = meta_store_->get_meta(numeric_id); + if(!meta.filter.empty() && meta.filter == filter) { + meta.filter.clear(); + meta_store_->store_meta(numeric_id, meta); + } + } catch(const std::exception& e) { + /* + * Either get_meta failed (no meta for this id, or MDBX error) or + * store_meta failed. The index entries are already gone at this point, + * so meta.filter is now potentially stale relative to the index. We + * surface the failure as 102 rather than swallow it: the operator sees + * the inconsistency and can repair via rebuild, and the user does not + * receive a "successful" response on top of an inconsistent state. + */ + LOG_ERROR(1226, + index_id_, + "deleteFilter meta sync failed for numeric_id " + << numeric_id << ": " << e.what()); + return {102, + "deleteFilter meta sync failed for numeric_id " + + std::to_string(numeric_id) + ": " + e.what()}; + } + return {SUCCESS, ""}; } - // Update filter for a vector - void updateFilter(ndd::idInt numeric_id, const std::string& new_filter_json) { + /* + * Replaces the filter document for one vector. 
+ * + * Return codes: + * 0 = success + * 1-99 = propagated filter validation failure from filter store + * 100-199 = propagated MDBX/storage failure from filter store + * 200-299 = propagated corruption/invariant failure from filter store + */ + ndd::OperationResult<> updateFilter(ndd::idInt numeric_id, + const std::string& new_filter_json) { // Get existing meta auto meta = meta_store_->get_meta(numeric_id); // Remove old filters if(!meta.filter.empty()) { - filter_store_->remove_filters_from_json(numeric_id, meta.filter); + auto remove_result = filter_store_->remove_filters_from_json(numeric_id, meta.filter); + if(!remove_result.ok()) { + return remove_result; + } } // Update meta @@ -788,8 +1116,12 @@ class VectorStorage { // Add new filters if(!new_filter_json.empty()) { - filter_store_->add_filters_from_json(numeric_id, new_filter_json); + auto add_result = filter_store_->add_filters_from_json(numeric_id, new_filter_json); + if(!add_result.ok()) { + return add_result; + } } + return {SUCCESS, ""}; } ndd::quant::QuantizationLevel getQuantLevel() const { return vector_store_->getQuantLevel(); } diff --git a/src/utils/settings.hpp b/src/utils/settings.hpp index 9949e9109e..07210e7bc9 100644 --- a/src/utils/settings.hpp +++ b/src/utils/settings.hpp @@ -5,6 +5,7 @@ #include #include #include +#include constexpr uint64_t KB = (1024ULL); constexpr uint64_t MB = (1024ULL * KB); diff --git a/src/utils/types.hpp b/src/utils/types.hpp index 431407b7e9..45dc18f572 100644 --- a/src/utils/types.hpp +++ b/src/utils/types.hpp @@ -1,18 +1,45 @@ #pragma once #include +#include #include +#include #include +#ifndef SUCCESS +# define SUCCESS 0 +#endif + namespace ndd { template struct OperationResult { - unsigned int code = 0; + unsigned int code = SUCCESS; std::string message; std::optional value; - bool ok() const { return code == 0; } + bool ok() const { return code == SUCCESS; } + + T& value_or_throw() & { + if(!ok() || !value.has_value()) { + throw 
std::logic_error("OperationResult success value is not available: " + message); + } + return *value; + } + + const T& value_or_throw() const& { + if(!ok() || !value.has_value()) { + throw std::logic_error("OperationResult success value is not available: " + message); + } + return *value; + } + + T&& value_or_throw() && { + if(!ok() || !value.has_value()) { + throw std::logic_error("OperationResult success value is not available: " + message); + } + return std::move(*value); + } }; } // namespace ndd diff --git a/tests/CMakeLists.txt b/tests/CMakeLists.txt index 0793a2e2f3..18aa11e95c 100644 --- a/tests/CMakeLists.txt +++ b/tests/CMakeLists.txt @@ -36,5 +36,73 @@ target_include_directories(ndd_filter_test PRIVATE # Add other necessary definitions target_compile_definitions(ndd_filter_test PRIVATE MDB_MAXKEYSIZE=512) +# Vector storage tests: bring up the integration layer (vector + meta + filter +# stores) so we can verify upsert cleanup and deleteFilter meta sync end-to-end. +add_executable(ndd_vector_storage_test vector_storage_test.cpp + ${LMDB_SOURCES} + ${ROARING_SOURCE}) + +target_link_libraries(ndd_vector_storage_test GTest::gtest_main) + +target_include_directories(ndd_vector_storage_test PRIVATE + ${CMAKE_SOURCE_DIR}/src + ${CMAKE_SOURCE_DIR}/src/core + ${CMAKE_SOURCE_DIR}/src/filter + ${CMAKE_SOURCE_DIR}/src/storage + ${CMAKE_SOURCE_DIR}/src/quant + ${CMAKE_SOURCE_DIR}/src/utils + ${CMAKE_SOURCE_DIR}/third_party + ${CMAKE_SOURCE_DIR}/third_party/json + ${CMAKE_SOURCE_DIR}/third_party/msgpack/include +) + +target_compile_definitions(ndd_vector_storage_test PRIVATE MDB_MAXKEYSIZE=512) +if(USE_AVX512) + target_compile_definitions(ndd_vector_storage_test PRIVATE USE_AVX512) + target_compile_options(ndd_vector_storage_test PRIVATE + -mavx512f -mavx512bw -mavx512vnni -mavx512fp16 -mavx512vpopcntdq) +elseif(USE_AVX2) + target_compile_definitions(ndd_vector_storage_test PRIVATE USE_AVX2) + target_compile_options(ndd_vector_storage_test PRIVATE -mavx2 -mfma -mf16c) 
+elseif(USE_SVE2) + target_compile_definitions(ndd_vector_storage_test PRIVATE USE_SVE2) + target_compile_options(ndd_vector_storage_test PRIVATE -march=armv8.6-a+sve2+fp16+dotprod) +elseif(USE_NEON) + target_compile_definitions(ndd_vector_storage_test PRIVATE USE_NEON) +endif() + +add_executable(ndd_request_validation_test request_validation_test.cpp) + +target_link_libraries(ndd_request_validation_test GTest::gtest_main) + +target_include_directories(ndd_request_validation_test PRIVATE + ${CMAKE_SOURCE_DIR}/src + ${CMAKE_SOURCE_DIR}/src/server + ${CMAKE_SOURCE_DIR}/src/utils + ${CROW_INCLUDE_DIR} +) + +# Numeric index stress test: random churn + drain phase, asserts the +# forward<->inverted invariant across the bitmap-only / split paths. +add_executable(ndd_numeric_index_stress_test numeric_index_stress_test.cpp + ${LMDB_SOURCES} + ${ROARING_SOURCE}) + +target_link_libraries(ndd_numeric_index_stress_test GTest::gtest_main) + +target_include_directories(ndd_numeric_index_stress_test PRIVATE + ${CMAKE_SOURCE_DIR}/src + ${CMAKE_SOURCE_DIR}/src/core + ${CMAKE_SOURCE_DIR}/src/filter + ${CMAKE_SOURCE_DIR}/src/utils + ${CMAKE_SOURCE_DIR}/third_party + ${CMAKE_SOURCE_DIR}/third_party/json +) + +target_compile_definitions(ndd_numeric_index_stress_test PRIVATE MDB_MAXKEYSIZE=512) + include(GoogleTest) gtest_discover_tests(ndd_filter_test) +gtest_discover_tests(ndd_vector_storage_test) +gtest_discover_tests(ndd_request_validation_test) +gtest_discover_tests(ndd_numeric_index_stress_test) diff --git a/tests/filter_test.cpp b/tests/filter_test.cpp index 101be3403e..448ec5cd3d 100644 --- a/tests/filter_test.cpp +++ b/tests/filter_test.cpp @@ -1,14 +1,38 @@ #include +#include +#include +#include +#include +#include +#include +#include #include +#include +#include +#include #include +#include +#include #include #include "filter/filter.hpp" +#include "filter/category_index.hpp" #include "json/nlohmann_json.hpp" #include "filter/numeric_index.hpp" // For Bucket test namespace fs 
= std::filesystem; using json = nlohmann::json; +static void expect_ok(const ndd::OperationResult<>& result) { + EXPECT_TRUE(result.ok()) << result.message; +} + +template +static T unwrap_ok(ndd::OperationResult result) { + EXPECT_TRUE(result.ok()) << result.message; + EXPECT_TRUE(result.value.has_value()); + return std::move(*result.value); +} + TEST(BucketTest, Serialization) { ndd::filter::Bucket b; b.base_value = 100; @@ -55,16 +79,16 @@ TEST_F(FilterTest, CategoryFilterBasics) { // ID 2: City=London // ID 3: City=Paris - filter->add_to_filter("city", "Paris", 1); - filter->add_to_filter("city", "London", 2); - filter->add_to_filter("city", "Paris", 3); + expect_ok(filter->add_to_filter("city", "Paris", 1)); + expect_ok(filter->add_to_filter("city", "London", 2)); + expect_ok(filter->add_to_filter("city", "Paris", 3)); // Query for City=Paris json query = json::array({ {{"city", {{"$eq", "Paris"}}}} }); - std::vector ids = filter->getIdsMatchingFilter(query); + std::vector ids = unwrap_ok(filter->getIdsMatchingFilter(query)); // Should find 1 and 3 EXPECT_EQ(ids.size(), 2); @@ -73,21 +97,150 @@ TEST_F(FilterTest, CategoryFilterBasics) { EXPECT_EQ(std::find(ids.begin(), ids.end(), 2), ids.end()); } +class CategoryIndexCorruptionTest : public ::testing::Test { +protected: + std::string db_path; + MDBX_env* env = nullptr; + std::unique_ptr category_index; + + void SetUp() override { + db_path = "./category_corrupt_db_" + std::to_string(rand()); + if(fs::exists(db_path)) { + fs::remove_all(db_path); + } + fs::create_directories(db_path); + + int rc = mdbx_env_create(&env); + ASSERT_EQ(rc, MDBX_SUCCESS) << mdbx_strerror(rc); + + rc = mdbx_env_set_maxdbs(env, 10); + ASSERT_EQ(rc, MDBX_SUCCESS) << mdbx_strerror(rc); + + rc = mdbx_env_set_geometry(env, + -1, + 1ULL << settings::FILTER_MAP_SIZE_BITS, + 1ULL << settings::FILTER_MAP_SIZE_MAX_BITS, + 1ULL << settings::FILTER_MAP_SIZE_BITS, + -1, + -1); + ASSERT_EQ(rc, MDBX_SUCCESS) << mdbx_strerror(rc); + + rc = 
mdbx_env_open(env, + db_path.c_str(), + MDBX_WRITEMAP | MDBX_MAPASYNC | MDBX_NORDAHEAD, + 0664); + ASSERT_EQ(rc, MDBX_SUCCESS) << mdbx_strerror(rc); + + category_index = std::make_unique(env); + } + + void TearDown() override { + category_index.reset(); + if(env != nullptr) { + mdbx_env_close(env); + env = nullptr; + } + if(fs::exists(db_path)) { + fs::remove_all(db_path); + } + } + + void put_raw_payload(const std::string& key_string, std::vector& payload) { + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env, nullptr, MDBX_TXN_READWRITE, &txn); + ASSERT_EQ(rc, MDBX_SUCCESS) << mdbx_strerror(rc); + + MDBX_val key{const_cast(key_string.data()), key_string.size()}; + MDBX_val data{payload.data(), payload.size()}; + rc = mdbx_put(txn, category_index->get_dbi(), &key, &data, MDBX_UPSERT); + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + ASSERT_EQ(rc, MDBX_SUCCESS) << mdbx_strerror(rc); + } + + rc = mdbx_txn_commit(txn); + ASSERT_EQ(rc, MDBX_SUCCESS) << mdbx_strerror(rc); + } +}; + +TEST_F(CategoryIndexCorruptionTest, RejectsTruncatedBitmapPayload) { + ndd::RoaringBitmap bitmap; + bitmap.add(1); + bitmap.add(3); + + std::vector payload(bitmap.getSizeInBytes()); + bitmap.write(payload.data(), true); + ASSERT_GT(payload.size(), 1u); + payload.pop_back(); + + put_raw_payload(ndd::filter::CategoryIndex::make_key("city", "Paris"), payload); + + auto result = category_index->get_bitmap("city", "Paris"); + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 200u); +} + +TEST_F(CategoryIndexCorruptionTest, ReadsValidRawBitmapPayload) { + ndd::RoaringBitmap bitmap; + bitmap.add(11); + bitmap.add(29); + bitmap.runOptimize(); + + std::vector payload(bitmap.getSizeInBytes()); + bitmap.write(payload.data(), true); + + put_raw_payload(ndd::filter::CategoryIndex::make_key("city", "Berlin"), payload); + + auto result = category_index->get_bitmap("city", "Berlin"); + ASSERT_TRUE(result.ok()) << result.message; + ASSERT_TRUE(result.value.has_value()); + 
EXPECT_TRUE(result.value->contains(11)); + EXPECT_TRUE(result.value->contains(29)); + EXPECT_FALSE(result.value->contains(30)); +} + +TEST_F(CategoryIndexCorruptionTest, RejectsGarbageBitmapPayload) { + std::vector payload{0, 0, 0, 0, 1, 2, 3, 4}; + + put_raw_payload(ndd::filter::CategoryIndex::make_key("city", "Rome"), payload); + + auto result = category_index->get_bitmap("city", "Rome"); + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 200u); + EXPECT_NE(result.message.find("invalid or truncated bitmap payload"), + std::string::npos); +} + +TEST_F(CategoryIndexCorruptionTest, RejectsTrailingBytesAfterBitmapPayload) { + ndd::RoaringBitmap bitmap; + bitmap.add(5); + + std::vector payload(bitmap.getSizeInBytes()); + bitmap.write(payload.data(), true); + payload.push_back('\0'); + + put_raw_payload(ndd::filter::CategoryIndex::make_key("city", "London"), payload); + + auto result = category_index->get_bitmap("city", "London"); + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 200u); +} + TEST_F(FilterTest, BooleanFilterBasics) { // Boolean is just a special category "0" or "1" // ID 10: Active=true // ID 11: Active=false // Using JSON add interface for variety - filter->add_filters_from_json(10, R"({"is_active": true})"); - filter->add_filters_from_json(11, R"({"is_active": false})"); + expect_ok(filter->add_filters_from_json(10, R"({"is_active": true})")); + expect_ok(filter->add_filters_from_json(11, R"({"is_active": false})")); // Query Active=true json query_true = json::array({ {{"is_active", {{"$eq", true}}}} }); - auto ids_true = filter->getIdsMatchingFilter(query_true); + auto ids_true = unwrap_ok(filter->getIdsMatchingFilter(query_true)); EXPECT_EQ(ids_true.size(), 1); EXPECT_EQ(ids_true[0], 10); @@ -96,7 +249,7 @@ TEST_F(FilterTest, BooleanFilterBasics) { {{"is_active", {{"$eq", false}}}} }); - auto ids_false = filter->getIdsMatchingFilter(query_false); + auto ids_false = unwrap_ok(filter->getIdsMatchingFilter(query_false)); 
EXPECT_EQ(ids_false.size(), 1); EXPECT_EQ(ids_false[0], 11); } @@ -106,16 +259,16 @@ TEST_F(FilterTest, NumericFilterBasics) { // ID 101: Age=30 // ID 102: Age=35 - filter->add_filters_from_json(100, R"({"age": 25})"); - filter->add_filters_from_json(101, R"({"age": 30})"); - filter->add_filters_from_json(102, R"({"age": 35})"); + expect_ok(filter->add_filters_from_json(100, R"({"age": 25})")); + expect_ok(filter->add_filters_from_json(101, R"({"age": 30})")); + expect_ok(filter->add_filters_from_json(102, R"({"age": 35})")); // Range Query: 20 <= Age <= 32 json query_range = json::array({ {{"age", {{"$range", {20, 32}}}}} }); - auto ids = filter->getIdsMatchingFilter(query_range); + auto ids = unwrap_ok(filter->getIdsMatchingFilter(query_range)); // Should match 100 (25) and 101 (30) EXPECT_EQ(ids.size(), 2); @@ -132,14 +285,14 @@ TEST_F(FilterTest, FloatNumericFilter) { // ID 1: Price=10.5 // ID 2: Price=20.0 - filter->add_filters_from_json(1, R"({"price": 10.5})"); - filter->add_filters_from_json(2, R"({"price": 20.0})"); + expect_ok(filter->add_filters_from_json(1, R"({"price": 10.5})")); + expect_ok(filter->add_filters_from_json(2, R"({"price": 20.0})")); json query = json::array({ {{"price", {{"$range", {10.0, 15.0}}}}} }); - auto ids = filter->getIdsMatchingFilter(query); + auto ids = unwrap_ok(filter->getIdsMatchingFilter(query)); EXPECT_EQ(ids.size(), 1); EXPECT_EQ(ids[0], 1); } @@ -149,9 +302,9 @@ TEST_F(FilterTest, MixedAndLogic) { // ID 2: City=NY, Age=40 (Age fail) // ID 3: City=LA, Age=30 (City fail) - filter->add_filters_from_json(1, R"({"city": "NY", "age": 30})"); - filter->add_filters_from_json(2, R"({"city": "NY", "age": 40})"); - filter->add_filters_from_json(3, R"({"city": "LA", "age": 30})"); + expect_ok(filter->add_filters_from_json(1, R"({"city": "NY", "age": 30})")); + expect_ok(filter->add_filters_from_json(2, R"({"city": "NY", "age": 40})")); + expect_ok(filter->add_filters_from_json(3, R"({"city": "LA", "age": 30})")); // Filter: City=NY 
AND Age < 35 json query = json::array({ @@ -159,7 +312,7 @@ TEST_F(FilterTest, MixedAndLogic) { {{"age", {{"$range", {0, 35}}}}} }); - auto ids = filter->getIdsMatchingFilter(query); + auto ids = unwrap_ok(filter->getIdsMatchingFilter(query)); EXPECT_EQ(ids.size(), 1); EXPECT_EQ(ids[0], 1); } @@ -169,51 +322,1440 @@ TEST_F(FilterTest, InOperator) { // ID 2: Color=Blue // ID 3: Color=Green - filter->add_to_filter("color", "Red", 1); - filter->add_to_filter("color", "Blue", 2); - filter->add_to_filter("color", "Green", 3); + expect_ok(filter->add_to_filter("color", "Red", 1)); + expect_ok(filter->add_to_filter("color", "Blue", 2)); + expect_ok(filter->add_to_filter("color", "Green", 3)); // Query: Color IN [Red, Green] json query = json::array({ {{"color", {{"$in", {"Red", "Green"}}}}} }); - auto ids = filter->getIdsMatchingFilter(query); + auto ids = unwrap_ok(filter->getIdsMatchingFilter(query)); EXPECT_EQ(ids.size(), 2); // 1 and 3 } TEST_F(FilterTest, DeleteFilter) { // ID 1: Tag=A - filter->add_to_filter("tag", "A", 1); + expect_ok(filter->add_to_filter("tag", "A", 1)); json query = json::array({ {{"tag", {{"$eq", "A"}}}} }); - EXPECT_EQ(filter->countIdsMatchingFilter(query), 1); + EXPECT_EQ(unwrap_ok(filter->countIdsMatchingFilter(query)), 1); // Remove functionality test // Usually removal requires us to know what to remove or we remove entire ID? 
// The Filter class has: remove_from_filter(field, value, id) - filter->remove_from_filter("tag", "A", 1); + expect_ok(filter->remove_from_filter("tag", "A", 1)); - EXPECT_EQ(filter->countIdsMatchingFilter(query), 0); + EXPECT_EQ(unwrap_ok(filter->countIdsMatchingFilter(query)), 0); } TEST_F(FilterTest, NumericDelete) { // ID 1: Score=100 - filter->add_filters_from_json(1, R"({"score": 100})"); + expect_ok(filter->add_filters_from_json(1, R"({"score": 100})")); // Check it exists json query = json::array({ {{"score", {{"$eq", 100}}}} }); - EXPECT_EQ(filter->countIdsMatchingFilter(query), 1); + EXPECT_EQ(unwrap_ok(filter->countIdsMatchingFilter(query)), 1); // Remove // remove_filters_from_json uses the whole object - filter->remove_filters_from_json(1, R"({"score": 100})"); + expect_ok(filter->remove_filters_from_json(1, R"({"score": 100})")); - EXPECT_EQ(filter->countIdsMatchingFilter(query), 0); + EXPECT_EQ(unwrap_ok(filter->countIdsMatchingFilter(query)), 0); +} + +TEST_F(FilterTest, RejectsMalformedFilterJson) { + auto result = filter->add_filters_from_json(1, R"({"city": "Paris")"); + + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 1); +} + +TEST_F(FilterTest, RejectsUnsupportedFilterType) { + auto result = filter->add_filters_from_json(1, R"({"tags": ["a", "b"]})"); + + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 2); +} + +TEST_F(FilterTest, RejectsSchemaTypeMismatch) { + expect_ok(filter->add_filters_from_json(1, R"({"age": 30})")); + + auto result = filter->add_filters_from_json(2, R"({"age": "thirty"})"); + + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 3); +} + +TEST_F(FilterTest, RejectsInvalidOperator) { + json query = json::array({ + {{"city", {{"$contains", "Paris"}}}} + }); + + auto result = filter->getIdsMatchingFilter(query); + + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 2); +} + +TEST_F(FilterTest, RejectsInvalidRange) { + expect_ok(filter->add_filters_from_json(1, R"({"score": 100})")); + json query = json::array({ 
+ {{"score", {{"$range", {200, 100}}}}} + }); + + auto result = filter->getIdsMatchingFilter(query); + + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 2); +} + +TEST_F(FilterTest, RejectsColonInFieldNameOnInsert) { + auto result = filter->add_filters_from_json(1, R"({"user:id": "x"})"); + + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 1); +} + +TEST_F(FilterTest, RejectsColonInValueOnInsert) { + auto result = filter->add_filters_from_json(1, R"({"city": "Paris:France"})"); + + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 1); +} + +TEST_F(FilterTest, RejectsColonInFieldNameOnQuery) { + json query = json::array({ + {{"user:id", {{"$eq", "x"}}}} + }); + + auto result = filter->getIdsMatchingFilter(query); + + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 1); +} + +TEST_F(FilterTest, RejectsColonInValueOnQuery) { + expect_ok(filter->add_filters_from_json(1, R"({"city": "Paris"})")); + json query = json::array({ + {{"city", {{"$eq", "Paris:France"}}}} + }); + + auto result = filter->getIdsMatchingFilter(query); + + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 1); +} + +TEST_F(FilterTest, RejectsColonInLowLevelAddToFilter) { + auto field_result = filter->add_to_filter("user:id", "x", 1); + EXPECT_FALSE(field_result.ok()); + EXPECT_EQ(field_result.code, 1); + + auto value_result = filter->add_to_filter("user", "x:y", 1); + EXPECT_FALSE(value_result.ok()); + EXPECT_EQ(value_result.code, 1); +} + +namespace { + +std::vector sorted_ids(std::vector ids) { + std::sort(ids.begin(), ids.end()); + return ids; +} + +std::string hex32(uint32_t value) { + std::ostringstream out; + out << "0x" << std::hex << std::uppercase << std::setw(8) + << std::setfill('0') << value; + return out.str(); +} + +} // namespace + +TEST_F(FilterTest, IntegerIndexedNumericFieldCanBeQueriedWithFloatNumber) { + expect_ok(filter->add_filters_from_json(1, R"({"score": 1})")); + expect_ok(filter->add_filters_from_json(2, R"({"score": 2})")); + 
expect_ok(filter->add_filters_from_json(3, R"({"score": 3})")); + + const uint32_t float_two = ndd::filter::float_to_sortable(2.0f); + + json exact_float_query = json::parse(R"([{"score":{"$eq":2.0}}])"); + auto exact_ids = sorted_ids( + unwrap_ok(filter->getIdsMatchingFilter(exact_float_query))); + + EXPECT_EQ(exact_ids, (std::vector{2})) + << "integer JSON values should be indexed through the shared float " + "sortable domain: float_to_sortable(2.0)=" + << hex32(float_two); + + json lt_float_query = json::parse(R"([{"score":{"$lt":2.0}}])"); + auto lt_ids = sorted_ids( + unwrap_ok(filter->getIdsMatchingFilter(lt_float_query))); + + EXPECT_EQ(lt_ids, (std::vector{1})) + << "stored integer values and float comparison bounds should share " + "the same float sortable domain"; +} + +TEST_F(FilterTest, FloatIndexedNumericFieldCanBeQueriedWithIntegerNumber) { + expect_ok(filter->add_filters_from_json(1, R"({"score": 1.0})")); + expect_ok(filter->add_filters_from_json(2, R"({"score": 2.0})")); + expect_ok(filter->add_filters_from_json(3, R"({"score": 3.0})")); + + json exact_int_query = json::parse(R"([{"score":{"$eq":2}}])"); + auto exact_ids = sorted_ids( + unwrap_ok(filter->getIdsMatchingFilter(exact_int_query))); + + EXPECT_EQ(exact_ids, (std::vector{2})); + + json gte_int_query = json::parse(R"([{"score":{"$gte":2}}])"); + auto gte_ids = sorted_ids( + unwrap_ok(filter->getIdsMatchingFilter(gte_int_query))); + + EXPECT_EQ(gte_ids, (std::vector{2, 3})); +} + +TEST_F(FilterTest, ComparisonOperatorsInteger) { + expect_ok(filter->add_filters_from_json(1, R"({"age": 25})")); + expect_ok(filter->add_filters_from_json(2, R"({"age": 30})")); + expect_ok(filter->add_filters_from_json(3, R"({"age": 35})")); + + auto run = [&](const json& expr) { + json query = json::array({{{"age", expr}}}); + return sorted_ids(unwrap_ok(filter->getIdsMatchingFilter(query))); + }; + + EXPECT_EQ(run({{"$lt", 30}}), (std::vector{1})); + EXPECT_EQ(run({{"$lte", 30}}), (std::vector{1, 2})); + 
EXPECT_EQ(run({{"$gt", 30}}), (std::vector{3})); + EXPECT_EQ(run({{"$gte", 30}}), (std::vector{2, 3})); +} + +TEST_F(FilterTest, ComparisonOperatorsFloat) { + expect_ok(filter->add_filters_from_json(1, R"({"price": 10.5})")); + expect_ok(filter->add_filters_from_json(2, R"({"price": 20.0})")); + expect_ok(filter->add_filters_from_json(3, R"({"price": 20.5})")); + + auto run = [&](const json& expr) { + json query = json::array({{{"price", expr}}}); + return sorted_ids(unwrap_ok(filter->getIdsMatchingFilter(query))); + }; + + EXPECT_EQ(run({{"$lt", 20.0}}), (std::vector{1})); + EXPECT_EQ(run({{"$lte", 20.0}}), (std::vector{1, 2})); + EXPECT_EQ(run({{"$gt", 20.0}}), (std::vector{3})); + EXPECT_EQ(run({{"$gte", 20.0}}), (std::vector{2, 3})); +} + +TEST_F(FilterTest, ComparisonOperatorsNegativeAndZero) { + expect_ok(filter->add_filters_from_json(1, R"({"temp": -5})")); + expect_ok(filter->add_filters_from_json(2, R"({"temp": 0})")); + expect_ok(filter->add_filters_from_json(3, R"({"temp": 5})")); + + auto run = [&](const json& expr) { + json query = json::array({{{"temp", expr}}}); + return sorted_ids(unwrap_ok(filter->getIdsMatchingFilter(query))); + }; + + EXPECT_EQ(run({{"$lt", 0}}), (std::vector{1})); + EXPECT_EQ(run({{"$gte", 0}}), (std::vector{2, 3})); + EXPECT_EQ(run({{"$lt", -5}}), (std::vector{})); + EXPECT_EQ(run({{"$lte", -5}}), (std::vector{1})); +} + +TEST_F(FilterTest, ComparisonAndCombination) { + expect_ok(filter->add_filters_from_json(1, R"({"city": "NY", "age": 25})")); + expect_ok(filter->add_filters_from_json(2, R"({"city": "NY", "age": 30})")); + expect_ok(filter->add_filters_from_json(3, R"({"city": "NY", "age": 35})")); + expect_ok(filter->add_filters_from_json(4, R"({"city": "LA", "age": 30})")); + + json query = json::array({ + {{"city", {{"$eq", "NY"}}}}, + {{"age", {{"$gte", 25}}}}, + {{"age", {{"$lt", 35}}}} + }); + + auto ids = sorted_ids(unwrap_ok(filter->getIdsMatchingFilter(query))); + EXPECT_EQ(ids, (std::vector{1, 2})); +} + 
+TEST_F(FilterTest, ComparisonInteractionWithIn) { + expect_ok(filter->add_filters_from_json(1, R"({"score": 1})")); + expect_ok(filter->add_filters_from_json(2, R"({"score": 5})")); + expect_ok(filter->add_filters_from_json(3, R"({"score": 10})")); + + json query = json::array({ + {{"score", {{"$in", {1, 5, 10}}}}}, + {{"score", {{"$gte", 5}}}} + }); + + auto ids = sorted_ids(unwrap_ok(filter->getIdsMatchingFilter(query))); + EXPECT_EQ(ids, (std::vector{2, 3})); +} + +TEST_F(FilterTest, ComparisonInteractionWithRange) { + for(int i = 10; i <= 50; i += 10) { + std::string body = R"({"v": )" + std::to_string(i) + "}"; + expect_ok(filter->add_filters_from_json(i, body)); + } + + json query = json::array({ + {{"v", {{"$range", {10, 50}}}}}, + {{"v", {{"$gt", 20}}}}, + {{"v", {{"$lte", 30}}}} + }); + + auto ids = sorted_ids(unwrap_ok(filter->getIdsMatchingFilter(query))); + EXPECT_EQ(ids, (std::vector{30})); +} + +TEST_F(FilterTest, ComparisonRejectsNonNumericValue) { + expect_ok(filter->add_filters_from_json(1, R"({"age": 25})")); + json query = json::array({ + {{"age", {{"$gt", "old"}}}} + }); + + auto result = filter->getIdsMatchingFilter(query); + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 2); +} + +TEST_F(FilterTest, ComparisonRejectsOnNonNumericField) { + expect_ok(filter->add_filters_from_json(1, R"({"city": "NY"})")); + json query = json::array({ + {{"city", {{"$gt", 5}}}} + }); + + auto result = filter->getIdsMatchingFilter(query); + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 2); +} + +TEST_F(FilterTest, ComparisonEmptyRangeAtIntegerBoundary) { + expect_ok(filter->add_filters_from_json(1, R"({"x": 0})")); + + json q_lt_min = json::array({ + {{"x", {{"$lt", INT_MIN}}}} + }); + auto r1 = filter->getIdsMatchingFilter(q_lt_min); + EXPECT_TRUE(r1.ok()) << r1.message; + EXPECT_EQ(r1.value_or_throw().size(), 0u); + + json q_gt_max = json::array({ + {{"x", {{"$gt", INT_MAX}}}} + }); + auto r2 = filter->getIdsMatchingFilter(q_gt_max); + 
EXPECT_TRUE(r2.ok()) << r2.message; + EXPECT_EQ(r2.value_or_throw().size(), 0u); +} + +// ================================================================= +// Hypothesis tests for the dirty numeric_index.hpp range() perf work. +// +// These tests do NOT modify production code; they probe internal +// invariants of Bucket and end-to-end behavior of Filter to confirm +// or refute the claims made about the post_filter_new regression. +// +// Naming convention: HypothesisN_* where N matches the analysis. +// A failing assertion in these tests means the corresponding +// hypothesis is correct (the claimed unwanted behavior is observable). +// ================================================================= + +// --- Hypothesis 1 ---------------------------------------------------- +// Claim: For VectorDBBench-style packed int data, bucket values are +// densely packed in a much narrower extent than 65536, so the new +// "Coarse full-coverage fast path" predicate +// bucket_base >= min_val +// && bucket_base + Bucket::MAX_DELTA <= max_val +// is FALSE on the typical bucket -- even when the OLD post-deserialize +// predicate (bucket_min >= min_val && bucket_max <= max_val) is TRUE. +// Implication: the fast path does not actually fire on the workload +// it was meant to optimize, and we keep paying the deserialize cost. +// +// PASS = both predicates evaluated below match the hypothesis values. +// FAIL = the predicates disagree with the hypothesis (analysis is wrong). 
+TEST(Hypothesis1, FastPathPredicateMissesPackedBucket) { + constexpr uint32_t base = 0x80000000u; // sortable encoding of int 0 + constexpr size_t N = ndd::filter::Bucket::MAX_SIZE; + constexpr uint32_t spread = 1023; // values densely packed in [base, base+1023] + + ndd::filter::Bucket bucket; + bucket.base_value = base; + for (size_t i = 0; i < N; ++i) { + bucket.add(base + static_cast(i % (spread + 1)), + static_cast(i + 1)); + } + ASSERT_EQ(bucket.ids.size(), N); + + const uint32_t bucket_min = bucket.get_value(0); + const uint32_t bucket_max = bucket.get_value(bucket.ids.size() - 1); + EXPECT_EQ(bucket_min, base); + EXPECT_EQ(bucket_max, base + spread); + + // Query covers exactly the bucket's actual extent. + const uint32_t min_val = bucket_min; + const uint32_t max_val = bucket_max; + + const bool old_full_overlap = bucket_min >= min_val && bucket_max <= max_val; + const bool new_fast_path = + bucket.base_value >= min_val + && static_cast(bucket.base_value) + + ndd::filter::Bucket::MAX_DELTA <= max_val; + + EXPECT_TRUE(old_full_overlap) + << "OLD code's full-overlap branch would fire on this bucket"; + EXPECT_FALSE(new_fast_path) + << "NEW fast path requires the entire 65536-wide extent to fit " + "inside [min,max], so it MISSES on packed buckets"; +} + +// Counter-test: when bucket values DO span the full delta range and +// the query is wide enough, the new fast path predicate is TRUE. 
+TEST(Hypothesis1, FastPathFiresOnWidelySpreadBucket) { + constexpr uint32_t base = 100'000; + ndd::filter::Bucket bucket; + bucket.base_value = base; + for (size_t i = 0; i < 1024; ++i) { + const uint32_t val = base + + static_cast( + (i * static_cast(ndd::filter::Bucket::MAX_DELTA)) + / 1023); + bucket.add(val, static_cast(i + 1)); + } + + const uint32_t min_val = base; + const uint32_t max_val = base + ndd::filter::Bucket::MAX_DELTA; + const bool new_fast_path = + bucket.base_value >= min_val + && static_cast(bucket.base_value) + + ndd::filter::Bucket::MAX_DELTA <= max_val; + EXPECT_TRUE(new_fast_path); +} + +// --- Hypothesis 2 ---------------------------------------------------- +// Claim: After bucket saturation with duplicates (the dirty Bucket::add +// caps deltas/ids at MAX_SIZE for delta_32 == 0 inserts but keeps +// adding to summary_bitmap), the bucket has cardinality > ids.size, +// and the new bitmap-only-inclusion branch in range() returns ids +// that the OLD code would never have surfaced. +TEST(Hypothesis2, SaturationCreatesBitmapOnlyEntries) { + constexpr uint32_t base = 0; + constexpr ndd::idInt N_TOTAL = ndd::filter::Bucket::MAX_SIZE + 500; + + ndd::filter::Bucket bucket; + bucket.base_value = base; + for (ndd::idInt i = 1; i <= N_TOTAL; ++i) { + bucket.add(base, i); // all duplicates of base_value + } + + EXPECT_EQ(bucket.ids.size(), ndd::filter::Bucket::MAX_SIZE); + EXPECT_EQ(bucket.summary_bitmap.cardinality(), N_TOTAL); + EXPECT_GT(bucket.summary_bitmap.cardinality(), bucket.ids.size()) + << "bitmap-only branch in range() will fire iff cardinality > ids.size"; +} + +// End-to-end check through the Filter API: when we insert MAX_SIZE+K +// rows that all share a numeric value, an $eq query should return all +// MAX_SIZE+K ids. If saturation drops K of them, this test fails -- but +// then the recall bump observed in the chart cannot be explained by +// this branch and we should look elsewhere. 
+TEST_F(FilterTest, Hypothesis2_RangeReturnsAllSaturatedDuplicates) { + constexpr int VALUE = 42; + constexpr ndd::idInt EXTRA = 500; + constexpr ndd::idInt N = ndd::filter::Bucket::MAX_SIZE + EXTRA; + + const std::string filter_payload = + std::string(R"({"score": )") + std::to_string(VALUE) + "}"; + for (ndd::idInt i = 1; i <= N; ++i) { + expect_ok(filter->add_filters_from_json(i, filter_payload)); + } + + json query = json::array({{ {"score", {{"$eq", VALUE}}} }}); + auto ids = unwrap_ok(filter->getIdsMatchingFilter(query)); + EXPECT_EQ(ids.size(), N) + << "If saturation logic is dropping ids, recall would actually go DOWN, " + "not up, contradicting the chart."; +} + +// --- Hypothesis 3 ---------------------------------------------------- +// Claim: When a slide-split fires on a saturated bucket, the LEFT +// bucket's summary_bitmap is rebuilt from `ids` only (see +// add_to_buckets at numeric_index.hpp:614-617): +// bucket.summary_bitmap = ndd::RoaringBitmap(); +// for (auto bucket_id : bucket.ids) bucket.summary_bitmap.add(bucket_id); +// Any bitmap-only entries (excess saturated duplicates) that lived on +// the LEFT side of the split are silently dropped. +// +// We reproduce the rebuild step inline because the slide-split lives +// inside NumericIndex::add_to_buckets (a private path with no test +// hook). If H3 holds, the data loss is observable on the local Bucket. +TEST(Hypothesis3, SlideSplitRebuildLosesBitmapOnlyEntries) { + constexpr uint32_t base = 0; + ndd::filter::Bucket bucket; + bucket.base_value = base; + + // Fill with MAX_SIZE unique-delta entries so a real split is possible. + for (uint32_t v = 0; v < ndd::filter::Bucket::MAX_SIZE; ++v) { + bucket.add(v, static_cast(v + 1)); + } + ASSERT_EQ(bucket.ids.size(), ndd::filter::Bucket::MAX_SIZE); + + // Simulate the saturated-duplicate path: bitmap gains an id but + // ids/deltas do not (because Bucket::add returns early for + // delta_32 == 0 once ids.size() >= MAX_SIZE). 
+ constexpr ndd::idInt BITMAP_ONLY_ID_A = 100'000; + constexpr ndd::idInt BITMAP_ONLY_ID_B = 100'001; + bucket.summary_bitmap.add(BITMAP_ONLY_ID_A); + bucket.summary_bitmap.add(BITMAP_ONLY_ID_B); + ASSERT_EQ(bucket.summary_bitmap.cardinality(), bucket.ids.size() + 2); + + // Reproduce the slide-split LEFT-side rebuild. + const size_t mid_idx = bucket.ids.size() / 2; + bucket.deltas.resize(mid_idx); + bucket.ids.resize(mid_idx); + bucket.summary_bitmap = ndd::RoaringBitmap(); + for (auto id : bucket.ids) { + bucket.summary_bitmap.add(id); + } + + EXPECT_FALSE(bucket.summary_bitmap.contains(BITMAP_ONLY_ID_A)); + EXPECT_FALSE(bucket.summary_bitmap.contains(BITMAP_ONLY_ID_B)); + EXPECT_EQ(bucket.summary_bitmap.cardinality(), bucket.ids.size()); +} + +// Regression: end-to-end through add_to_buckets. After a real split +// fires on a saturated-with-duplicates bucket, bitmap-only ids that +// belong to the left side must survive. Pre-fix the left bitmap was +// rebuilt from ids[] only and bitmap-only ids were lost; the fix +// preserves them by subtracting only the ids that moved right. +// +// Critical: the warm value must land in the SAME bucket as the anchor. +// Filter values are floats, and sortable deltas grow ~2^18 per integer +// unit near small anchors -- so e.g. anchor=42 and warm=47 (delta ~1.3M) +// would exceed Bucket::MAX_DELTA and create a separate bucket, never +// triggering the split path. std::nextafterf gives a one-ULP step +// (sortable delta == 1), guaranteed in-bucket. 
+TEST_F(FilterTest, SplitPreservesBitmapOnlyDuplicates) { + constexpr float B = 42.0f; + const float B_next = std::nextafterf(B, std::numeric_limits::infinity()); + ASSERT_NE(B, B_next); + + constexpr ndd::idInt EXTRA = 500; + constexpr ndd::idInt SATURATION = ndd::filter::Bucket::MAX_SIZE + EXTRA; + + auto payload = [](float v) { + std::ostringstream os; + os.precision(std::numeric_limits::max_digits10); + os << R"({"score": )" << v << "}"; + return os.str(); + }; + + for (ndd::idInt i = 1; i <= SATURATION; ++i) { + expect_ok(filter->add_filters_from_json(i, payload(B))); + } + + // First non-base insert: slide-split fallthrough lands it in ids[] + // alongside the all-zero deltas, creating the boundary the next + // insert will split on. + expect_ok(filter->add_filters_from_json(SATURATION + 1, payload(B_next))); + + // Second insert at B: triggers the standard slide-split. Without + // the fix the left bitmap rebuild here drops EXTRA bitmap-only ids. + expect_ok(filter->add_filters_from_json(SATURATION + 2, payload(B))); + + json query_eq_B = json::array({{ {"score", {{"$eq", B}}} }}); + auto ids = unwrap_ok(filter->getIdsMatchingFilter(query_eq_B)); + EXPECT_EQ(ids.size(), SATURATION + 1) + << "Split rebuild must preserve bitmap-only delta-0 entries on the left."; +} + +// Regression: removing every id that lives in ids[] must NOT delete a +// bucket that still has bitmap-only entries. Pre-fix is_empty() only +// looked at ids[], so the bucket was deleted and the bitmap-only ids +// vanished from the inverted index even though the forward index kept +// pointing at them. 
+TEST_F(FilterTest, RemoveKeepsBucketAliveWithBitmapOnlyEntries) { + constexpr int B = 7; + constexpr ndd::idInt EXTRA = 50; + constexpr ndd::idInt SATURATION = ndd::filter::Bucket::MAX_SIZE + EXTRA; + const std::string payload = + std::string(R"({"score": )") + std::to_string(B) + "}"; + + for (ndd::idInt i = 1; i <= SATURATION; ++i) { + expect_ok(filter->add_filters_from_json(i, payload)); + } + + // The first MAX_SIZE inserts populated ids[]; the trailing EXTRA + // were absorbed bitmap-only. Remove the first MAX_SIZE -- after + // the last one, ids[] is empty but the bitmap still holds EXTRA + // ids. + for (ndd::idInt i = 1; + i <= static_cast(ndd::filter::Bucket::MAX_SIZE); ++i) { + expect_ok(filter->remove_filters_from_json(i, payload)); + } + + json query_eq_B = json::array({{ {"score", {{"$eq", B}}} }}); + auto ids = unwrap_ok(filter->getIdsMatchingFilter(query_eq_B)); + EXPECT_EQ(ids.size(), EXTRA) + << "Bucket must persist while summary_bitmap is non-empty."; + + // Sanity check: ids should be exactly the bitmap-only tail. + std::sort(ids.begin(), ids.end()); + EXPECT_EQ(ids.front(), + static_cast(ndd::filter::Bucket::MAX_SIZE + 1)); + EXPECT_EQ(ids.back(), SATURATION); +} + +// Regression: in the range slow path, a bucket whose ids[] is empty +// but whose summary_bitmap is non-empty must contribute its +// bitmap-only entries iff base_value lies in [min_val, max_val]. +// Pre-fix the path unconditionally skipped such buckets. 
+TEST_F(FilterTest, RangeSlowPathReturnsBitmapOnlyEntries) { + constexpr int B = 1000; + constexpr ndd::idInt EXTRA = 30; + constexpr ndd::idInt SATURATION = ndd::filter::Bucket::MAX_SIZE + EXTRA; + const std::string payload = + std::string(R"({"score": )") + std::to_string(B) + "}"; + + for (ndd::idInt i = 1; i <= SATURATION; ++i) { + expect_ok(filter->add_filters_from_json(i, payload)); + } + for (ndd::idInt i = 1; + i <= static_cast(ndd::filter::Bucket::MAX_SIZE); ++i) { + expect_ok(filter->remove_filters_from_json(i, payload)); + } + + // Narrow range covering only B -- forces the slow path (the fast + // path needs base + MAX_DELTA <= max_val, which is not the case + // here) and lands in the empty-ids branch. + json in_range = json::array({{ {"score", {{"$range", {B, B}}}} }}); + auto in_ids = unwrap_ok(filter->getIdsMatchingFilter(in_range)); + EXPECT_EQ(in_ids.size(), EXTRA); + + // Same shape but base_value is OUTSIDE the range. Bitmap-only + // entries must be excluded. + json out_range = + json::array({{ {"score", {{"$range", {B + 1, B + 100}}}} }}); + auto out_ids = unwrap_ok(filter->getIdsMatchingFilter(out_range)); + EXPECT_EQ(out_ids.size(), 0u); +} + +// --- Hypothesis 4 ---------------------------------------------------- +// Claim: accepting the OLD on-disk format (legacy uint16_t count +// between bitmap and arrays) recovers cliff-corrupted bitmap ids and +// can grow the range result candidate set. The production reader now +// rejects that payload shape instead of trying to salvage it. +TEST(Hypothesis4, DeserializeRejectsLegacyCountFormat) { + // Manually craft an OLD-format payload: + // [u32 bm_size] [bitmap bytes] [u16 count=0] + // i.e. cliff-truncated count, but bitmap retained the lost ids. 
+ + constexpr ndd::idInt LOST_ID_A = 7; + constexpr ndd::idInt LOST_ID_B = 9; + ndd::RoaringBitmap original; + original.add(LOST_ID_A); + original.add(LOST_ID_B); + original.runOptimize(); + + const size_t bm_size = original.getSizeInBytes(); + std::vector buffer(sizeof(uint32_t) + bm_size + sizeof(uint16_t), 0); + uint8_t* ptr = buffer.data(); + + const uint32_t bm_size_32 = static_cast(bm_size); + std::memcpy(ptr, &bm_size_32, sizeof(uint32_t)); + ptr += sizeof(uint32_t); + original.write(reinterpret_cast(ptr)); + ptr += bm_size; + const uint16_t legacy_count = 0; + std::memcpy(ptr, &legacy_count, sizeof(uint16_t)); + + EXPECT_THROW( + (void)ndd::filter::Bucket::deserialize( + buffer.data(), buffer.size(), /*base_val=*/100), + std::runtime_error); +} + +// Companion check on the read_summary_bitmap fast-path helper: it must +// reject the same legacy-format payloads as the full deserializer, so +// the fast path cannot silently reintroduce compatibility. +TEST(Hypothesis4, ReadSummaryBitmapRejectsLegacyCountFormat) { + ndd::RoaringBitmap original; + for (ndd::idInt i = 0; i < 50; ++i) original.add(i * 3); + original.runOptimize(); + + const size_t bm_size = original.getSizeInBytes(); + std::vector buffer(sizeof(uint32_t) + bm_size + sizeof(uint16_t), 0); + uint8_t* ptr = buffer.data(); + const uint32_t bm_size_32 = static_cast(bm_size); + std::memcpy(ptr, &bm_size_32, sizeof(uint32_t)); + ptr += sizeof(uint32_t); + original.write(reinterpret_cast(ptr)); + ptr += bm_size; + const uint16_t legacy_count = 0; + std::memcpy(ptr, &legacy_count, sizeof(uint16_t)); + + EXPECT_THROW( + (void)ndd::filter::Bucket::deserialize(buffer.data(), buffer.size(), 0), + std::runtime_error); + EXPECT_THROW( + (void)ndd::filter::Bucket::read_summary_bitmap( + buffer.data(), buffer.size()), + std::runtime_error); +} + +TEST(NumericBucketCorruptionTest, RejectsExtraBytesInsideDeclaredBitmapPayload) { + ndd::RoaringBitmap original; + for(ndd::idInt i = 0; i < 50; ++i) { + original.add(i 
* 5); + } + original.runOptimize(); + + const size_t bm_size = original.getSizeInBytes(); + const uint32_t declared_bm_size = static_cast(bm_size + 1); + std::vector buffer(sizeof(uint32_t) + declared_bm_size, 0); + uint8_t* ptr = buffer.data(); + + std::memcpy(ptr, &declared_bm_size, sizeof(uint32_t)); + ptr += sizeof(uint32_t); + original.write(reinterpret_cast(ptr)); + + EXPECT_THROW( + (void)ndd::filter::Bucket::deserialize(buffer.data(), buffer.size(), 0), + std::runtime_error); + EXPECT_THROW( + (void)ndd::filter::Bucket::read_summary_bitmap( + buffer.data(), buffer.size()), + std::runtime_error); +} + +TEST(NumericBucketCorruptionTest, ReadBitmapPayloadReturnsOperationResultOnSuccess) { + ndd::RoaringBitmap original; + original.add(101); + original.add(202); + original.runOptimize(); + + std::vector payload(original.getSizeInBytes()); + original.write(reinterpret_cast(payload.data())); + + auto result = ndd::filter::Bucket::read_bitmap_payload(payload.data(), + payload.size()); + + ASSERT_TRUE(result.ok()) << result.message; + ASSERT_TRUE(result.value.has_value()); + EXPECT_TRUE(result.value->contains(101)); + EXPECT_TRUE(result.value->contains(202)); + EXPECT_FALSE(result.value->contains(303)); +} + +TEST(NumericBucketCorruptionTest, ReadBitmapPayloadRejectsGarbageWithoutThrowing) { + std::vector payload{0, 0, 0, 0, 7, 8, 9, 10}; + + auto result = ndd::filter::Bucket::read_bitmap_payload(payload.data(), + payload.size()); + + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 200u); + EXPECT_FALSE(result.value.has_value()); + EXPECT_NE(result.message.find("invalid or truncated bitmap payload"), + std::string::npos); +} + +TEST(NumericBucketCorruptionTest, DeserializesValidBucketAfterPayloadValidation) { + ndd::filter::Bucket bucket; + bucket.base_value = 1000; + bucket.add(1000, 42); + bucket.add(1007, 43); + + auto bytes = bucket.serialize(); + auto decoded = ndd::filter::Bucket::deserialize(bytes.data(), + bytes.size(), + bucket.base_value); + auto 
bitmap_only = ndd::filter::Bucket::read_summary_bitmap(bytes.data(), + bytes.size()); + + EXPECT_EQ(decoded.base_value, bucket.base_value); + EXPECT_EQ(decoded.ids.size(), 2u); + EXPECT_TRUE(decoded.summary_bitmap.contains(42)); + EXPECT_TRUE(decoded.summary_bitmap.contains(43)); + EXPECT_TRUE(bitmap_only.contains(42)); + EXPECT_TRUE(bitmap_only.contains(43)); +} + +TEST(NumericBucketCorruptionTest, RejectsGarbageInsideDeclaredBitmapPayload) { + const uint32_t declared_bm_size = 8; + std::vector buffer(sizeof(uint32_t) + declared_bm_size, 0); + std::memcpy(buffer.data(), &declared_bm_size, sizeof(uint32_t)); + + EXPECT_THROW( + (void)ndd::filter::Bucket::deserialize(buffer.data(), buffer.size(), 0), + std::runtime_error); + EXPECT_THROW( + (void)ndd::filter::Bucket::read_summary_bitmap( + buffer.data(), buffer.size()), + std::runtime_error); +} + +// End-to-end recall check through the Filter API: insert N records +// with a wide spread of numeric values, run a wide range query, and +// compare the returned id set against a brute-force enumeration of +// the same JSON payload. If H4 is the regression cause, the chart's +// recall bump corresponds to results that match brute force more +// closely on the dirty branch -- but on a freshly built DB (no cliff +// state) this test must pass exactly. Mismatch here would mean the +// dirty range() over-includes even on clean data, which would shift +// the diagnosis. +TEST_F(FilterTest, Hypothesis4_RangeMatchesBruteForceOnCleanDb) { + constexpr ndd::idInt N = 5000; + // Spread values across more than one bucket extent (MAX_DELTA = 65535) + // so we exercise both the fast path and the per-bucket scan. 
+ auto value_for = [](ndd::idInt i) -> int { + return static_cast((i * 37) % 200000); + }; + + for (ndd::idInt i = 1; i <= N; ++i) { + const std::string payload = + std::string(R"({"score": )") + std::to_string(value_for(i)) + "}"; + expect_ok(filter->add_filters_from_json(i, payload)); + } + + constexpr int LO = 50000; + constexpr int HI = 120000; + json query = json::array({ + {{"score", {{"$range", json::array({LO, HI})}}}} + }); + auto got = unwrap_ok(filter->getIdsMatchingFilter(query)); + std::sort(got.begin(), got.end()); + + std::vector expected; + for (ndd::idInt i = 1; i <= N; ++i) { + const int v = value_for(i); + if (v >= LO && v <= HI) expected.push_back(i); + } + std::sort(expected.begin(), expected.end()); + + EXPECT_EQ(got, expected); +} + +// ===================================================================== +// NumericRangeBench: targeted microbench against an EXISTING filter MDBX +// directory. Runs Filter::computeFilterBitmap (which calls +// NumericIndex::range) repeatedly for a few canned filter_rates and +// prints per-call wall time. Compare two builds (dirty vs stashed) +// against the SAME db path, with no concurrency, no HNSW, no HTTP. +// +// Activation: set ENDEE_BENCH_DB to a directory containing mdbx.dat. +// Optional: ENDEE_BENCH_FIELD (default "id"), ENDEE_BENCH_ITERS (default 200). +// +// Caveat: Filter::init_environment opens the env with MDBX_WRITEMAP, so +// no other process may hold the DB while the bench runs (stop the +// endee server first). The bench itself only issues read queries. +// ===================================================================== +namespace { +struct BenchPoint { + const char* label; + int lo; + int hi; +}; + +void run_bench_point(Filter& filter, + const std::string& field, + const BenchPoint& pt, + int iters) { + json query = json::array({ + {{field, {{"$range", json::array({pt.lo, pt.hi})}}}} + }); + + // Warmup -- prime page cache, schema cache, allocator state. 
+ for (int i = 0; i < 3; ++i) { + auto r = filter.computeFilterBitmap(query); + ASSERT_TRUE(r.ok()) << r.message; + } + + size_t result_card = 0; + auto t0 = std::chrono::steady_clock::now(); + for (int i = 0; i < iters; ++i) { + auto r = filter.computeFilterBitmap(query); + ASSERT_TRUE(r.ok()) << r.message; + result_card = r.value_or_throw().cardinality(); + } + auto t1 = std::chrono::steady_clock::now(); + + const double total_ms = + std::chrono::duration(t1 - t0).count(); + const double per_call_ms = total_ms / iters; + + std::printf(" %-12s [% 8d,% 8d] iters=%d per_call=%.3f ms card=%zu\n", + pt.label, pt.lo, pt.hi, iters, per_call_ms, result_card); +} +} // namespace + +// Dumps internal structure of the bitmap that range() returns. Compare +// the output between clean and dirty builds to see whether the dirty +// path is producing a structurally different (and possibly slower to +// query) bitmap. Also bench-times a tight contains() loop on that +// bitmap to mirror what BitMapFilterFunctor does inside HNSW search. +TEST(NumericRangeBench, BitmapStructureAndContainsCost) { + const char* db_path = std::getenv("ENDEE_BENCH_DB"); + if (!db_path || !*db_path) GTEST_SKIP() << "Set ENDEE_BENCH_DB"; + const char* field_env = std::getenv("ENDEE_BENCH_FIELD"); + const std::string field = (field_env && *field_env) ? field_env : "id"; + + Filter filter(db_path); + + struct Point { const char* label; long long lo; long long hi; }; + const Point points[] = { + {"rate~0.99", 0, 9'900'000}, + {"rate~0.80", 0, 8'000'000}, + {"rate~0.50", 0, 5'000'000}, + {"rate~0.01", 0, 100'000}, + }; + + for (const auto& p : points) { + json q = json::array({{ {field, {{"$range", json::array({p.lo, p.hi})}}} }}); + auto r = filter.computeFilterBitmap(q); + ASSERT_TRUE(r.ok()) << r.message; + auto& bm = r.value_or_throw(); + const uint64_t card = bm.cardinality(); + + // Force-serialize to see the structural cost of the bitmap. 
+ // The size after runOptimize is the most honest "structural cost" + // because OLD writes always runOptimize before persisting. + bm.runOptimize(); + const size_t opt_bytes = bm.getSizeInBytes(); + // Probe contains() cost on a fixed, stride-based set of ids inside + // the range. 1M lookups -- about the same order as HNSW filtered + // search visit count at moderate ef. + constexpr int N_PROBES = 1'000'000; + const long long stride = std::max(1, (p.hi - p.lo) / N_PROBES); + volatile uint64_t sink = 0; + auto t0 = std::chrono::steady_clock::now(); + for (long long v = p.lo; v < p.hi && v < p.lo + (long long)N_PROBES * stride; v += stride) { + sink += bm.contains(static_cast(v)) ? 1 : 0; + } + auto t1 = std::chrono::steady_clock::now(); + const double total_us = + std::chrono::duration(t1 - t0).count(); + const long long probes_done = (p.hi - p.lo) / stride; + + std::printf(" %-10s card=%llu bytes_after_runOpt=%zu " + "contains(%lld probes)=%.1f us (%.1f ns/probe, hits=%llu)\n", + p.label, (unsigned long long)card, opt_bytes, + probes_done, total_us, + total_us * 1000.0 / std::max(1, probes_done), + (unsigned long long)sink); + } +} + +TEST(NumericRangeBench, ProbeValueDistribution) { + const char* db_path = std::getenv("ENDEE_BENCH_DB"); + if (!db_path || !*db_path) GTEST_SKIP() << "Set ENDEE_BENCH_DB"; + const char* field_env = std::getenv("ENDEE_BENCH_FIELD"); + const std::string field = (field_env && *field_env) ? 
field_env : "id"; + Filter f(db_path); + auto probe = [&](long long lo, long long hi) { + json q = json::array({{ {field, {{"$range", json::array({lo, hi})}}} }}); + auto r = f.computeFilterBitmap(q); + ASSERT_TRUE(r.ok()) << r.message; + std::printf(" range[% 12lld, % 12lld] card=%llu\n", + lo, hi, (unsigned long long)r.value_or_throw().cardinality()); + }; + probe(-2147483647LL, 2147483647LL); + probe(0, 10000000); + probe(0, 5000000); + probe(2500000, 7500000); + probe(-32768, 32767); + probe(0, 100000); +} + +TEST(NumericRangeBench, RangeQueryWallClock) { + const char* db_path = std::getenv("ENDEE_BENCH_DB"); + if (!db_path || !*db_path) { + GTEST_SKIP() << "Set ENDEE_BENCH_DB to a filter directory to run"; + } + const char* field_env = std::getenv("ENDEE_BENCH_FIELD"); + const std::string field = (field_env && *field_env) ? field_env : "id"; + const char* iters_env = std::getenv("ENDEE_BENCH_ITERS"); + const int iters = (iters_env && *iters_env) ? std::atoi(iters_env) : 200; + ASSERT_GT(iters, 0); + + std::printf("NumericRangeBench: db=%s field=%s iters=%d\n", + db_path, field.c_str(), iters); + + Filter filter(db_path); + + // Chart-aligned filter_rate buckets. The benchmark DB has uint32 + // values in [0, 10_000_000] with exactly one id per value (probed + // via ProbeValueDistribution), so filter_rate ~= (hi - lo) / 1e7. + const BenchPoint points[] = { + {"rate~0.99", 0, 9'900'000}, + {"rate~0.80", 0, 8'000'000}, + {"rate~0.50", 0, 5'000'000}, + {"rate~0.01", 0, 100'000}, + }; + + for (const auto& pt : points) { + run_bench_point(filter, field, pt, iters); + } +} + +/** + * NumericRangeBench.FloatDomainVsIntegerDomain builds two temporary raw + * NumericIndex stores with identical integer values: + * - legacy path: int_to_sortable(value) + * - float-domain path: float_to_sortable(static_cast(value)) + * + * This isolates the index-layout and range-query cost of the shared float32 + * numeric domain without JSON parsing or Filter schema overhead. 
Expect + * integer-heavy fields to have different bucket behavior under the float + * domain. Consecutive ints are dense under int_to_sortable, but their + * float_to_sortable bit patterns are not equally dense, so wide range scans + * may walk more buckets. The sample output prints bucket-count and range-time + * ratios to make that visible. + * + * Precision caveat: float32 has a 24-bit significand (23 stored mantissa bits + * plus the hidden bit). It represents every integer only up to 16,777,216; past + * that, adjacent integers can round to the same float32 value and therefore the + * same sortable key. + * + * Activation: + * ENDEE_SORTABLE_PERF=1 + * + * Optional: + * ENDEE_SORTABLE_PERF_N (default 200000) + * ENDEE_SORTABLE_PERF_ITERS (default 100) + */ +namespace { +struct RawNumericBenchIndex { + std::string path; + MDBX_env* env = nullptr; + std::unique_ptr index; + + ~RawNumericBenchIndex() { + index.reset(); + if(env != nullptr) { + mdbx_env_close(env); + env = nullptr; + } + if(!path.empty() && fs::exists(path)) { + fs::remove_all(path); + } + } + + ndd::OperationResult<> open(const std::string& path_in) { + path = path_in; + if(fs::exists(path)) { + fs::remove_all(path); + } + fs::create_directories(path); + + int rc = mdbx_env_create(&env); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to create perf MDBX env: " + + std::string(mdbx_strerror(rc))}; + } + + rc = mdbx_env_set_maxdbs(env, 10); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to set perf MDBX maxdbs: " + + std::string(mdbx_strerror(rc))}; + } + + rc = mdbx_env_set_geometry(env, + -1, + 1ULL << settings::FILTER_MAP_SIZE_BITS, + 1ULL << settings::FILTER_MAP_SIZE_MAX_BITS, + 1ULL << settings::FILTER_MAP_SIZE_BITS, + -1, + -1); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to set perf MDBX geometry: " + + std::string(mdbx_strerror(rc))}; + } + + rc = mdbx_env_open(env, + path.c_str(), + MDBX_WRITEMAP | MDBX_MAPASYNC | MDBX_NORDAHEAD, + 0664); + if(rc != MDBX_SUCCESS) { + return 
{100, "Failed to open perf MDBX env: " + + std::string(mdbx_strerror(rc))}; + } + + index = std::make_unique(env); + return {SUCCESS, ""}; + } +}; + +struct SortablePerfStats { + double build_ms = 0.0; + double query_ms_total = 0.0; + double query_ms_per_call = 0.0; + uint64_t cardinality = 0; + size_t bitmap_bytes = 0; + size_t bucket_count = 0; +}; + +ndd::OperationResult +populate_sortable_perf_index(ndd::filter::NumericIndex& index, + const std::string& field, + ndd::idInt n, + bool use_float_domain) { + constexpr size_t CHUNK_SIZE = 4096; + std::vector entries; + entries.reserve(CHUNK_SIZE); + + auto t0 = std::chrono::steady_clock::now(); + for(ndd::idInt start = 0; start < n; start += CHUNK_SIZE) { + entries.clear(); + const ndd::idInt end = + std::min(n, start + static_cast(CHUNK_SIZE)); + for(ndd::idInt i = start; i < end; ++i) { + const int32_t value = static_cast(i); + const uint32_t sortable = + use_float_domain + ? ndd::filter::float_to_sortable(static_cast(value)) + : ndd::filter::int_to_sortable(value); + entries.emplace_back(field, i + 1, sortable); + } + + auto put_result = index.put_batch(entries); + if(!put_result.ok()) { + return {put_result.code, put_result.message}; + } + } + auto t1 = std::chrono::steady_clock::now(); + + return {SUCCESS, + "", + std::chrono::duration(t1 - t0).count()}; +} + +ndd::OperationResult +count_numeric_inverted_buckets(MDBX_env* env, const std::string& field) { + MDBX_txn* txn = nullptr; + int rc = mdbx_txn_begin(env, nullptr, MDBX_TXN_RDONLY, &txn); + if(rc != MDBX_SUCCESS) { + return {100, "Failed to begin bucket-count transaction: " + + std::string(mdbx_strerror(rc))}; + } + + MDBX_dbi dbi; + rc = mdbx_dbi_open(txn, "numeric_inverted", MDBX_DB_DEFAULTS, &dbi); + if(rc != MDBX_SUCCESS) { + mdbx_txn_abort(txn); + return {100, "Failed to open numeric_inverted for bucket count: " + + std::string(mdbx_strerror(rc))}; + } + + MDBX_cursor* cursor = nullptr; + rc = mdbx_cursor_open(txn, dbi, &cursor); + if(rc != 
MDBX_SUCCESS) { + mdbx_txn_abort(txn); + return {100, "Failed to open bucket-count cursor: " + + std::string(mdbx_strerror(rc))}; + } + + const std::string prefix = field + ":"; + size_t buckets = 0; + MDBX_val key; + MDBX_val data; + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_FIRST); + while(rc == MDBX_SUCCESS) { + std::string key_string(static_cast(key.iov_base), key.iov_len); + if(key_string.rfind(prefix, 0) == 0) { + ++buckets; + } + rc = mdbx_cursor_get(cursor, &key, &data, MDBX_NEXT); + } + + mdbx_cursor_close(cursor); + mdbx_txn_abort(txn); + if(rc != MDBX_NOTFOUND) { + return {100, "Failed while counting numeric buckets: " + + std::string(mdbx_strerror(rc))}; + } + return {SUCCESS, "", buckets}; +} + +ndd::OperationResult +run_sortable_perf_range(ndd::filter::NumericIndex& index, + const std::string& field, + uint32_t lo, + uint32_t hi, + int iters, + double build_ms, + size_t bucket_count) { + for(int i = 0; i < 3; ++i) { + auto warmup = index.range(field, lo, hi); + if(!warmup.ok()) { + return {warmup.code, warmup.message}; + } + } + + SortablePerfStats stats; + stats.build_ms = build_ms; + stats.bucket_count = bucket_count; + + auto t0 = std::chrono::steady_clock::now(); + for(int i = 0; i < iters; ++i) { + auto range_result = index.range(field, lo, hi); + if(!range_result.ok()) { + return {range_result.code, range_result.message}; + } + + auto bitmap = std::move(range_result.value_or_throw()); + stats.cardinality = bitmap.cardinality(); + bitmap.runOptimize(); + stats.bitmap_bytes = bitmap.getSizeInBytes(); + } + auto t1 = std::chrono::steady_clock::now(); + + stats.query_ms_total = + std::chrono::duration(t1 - t0).count(); + stats.query_ms_per_call = stats.query_ms_total / iters; + return {SUCCESS, "", stats}; +} +} // namespace + +TEST(NumericRangeBench, FloatDomainVsIntegerDomain) { + const char* enabled = std::getenv("ENDEE_SORTABLE_PERF"); + if(!enabled || std::string(enabled) != "1") { + GTEST_SKIP() << "Set ENDEE_SORTABLE_PERF=1 to run"; + } 
+ + const char* n_env = std::getenv("ENDEE_SORTABLE_PERF_N"); + const ndd::idInt n = + (n_env && *n_env) ? static_cast(std::strtoul(n_env, nullptr, 10)) + : 200000; + const char* iters_env = std::getenv("ENDEE_SORTABLE_PERF_ITERS"); + const int iters = (iters_env && *iters_env) ? std::atoi(iters_env) : 100; + ASSERT_GE(n, 1000u); + ASSERT_GT(iters, 0); + ASSERT_LE(n, static_cast(std::numeric_limits::max())); + + const std::string field = "score"; + const std::string suffix = std::to_string(std::rand()); + RawNumericBenchIndex int_index; + RawNumericBenchIndex float_index; + auto int_open = int_index.open("./numeric_sortable_perf_int_" + suffix); + ASSERT_TRUE(int_open.ok()) << int_open.message; + auto float_open = float_index.open("./numeric_sortable_perf_float_" + suffix); + ASSERT_TRUE(float_open.ok()) << float_open.message; + + auto int_build = populate_sortable_perf_index(*int_index.index, field, n, false); + ASSERT_TRUE(int_build.ok()) << int_build.message; + auto float_build = populate_sortable_perf_index(*float_index.index, field, n, true); + ASSERT_TRUE(float_build.ok()) << float_build.message; + + auto int_buckets = count_numeric_inverted_buckets(int_index.env, field); + ASSERT_TRUE(int_buckets.ok()) << int_buckets.message; + auto float_buckets = count_numeric_inverted_buckets(float_index.env, field); + ASSERT_TRUE(float_buckets.ok()) << float_buckets.message; + + struct Point { + const char* label; + int32_t lo; + int32_t hi; + }; + + const int32_t max_value = static_cast(n - 1); + const Point points[] = { + {"rate~0.99", 0, static_cast((static_cast(n) * 99) / 100)}, + {"rate~0.50", + static_cast(n / 4), + static_cast((static_cast(n) * 3) / 4)}, + {"rate~0.01", + static_cast(n / 2), + static_cast(n / 2 + n / 100)}, + }; + + std::printf("NumericRangeBench.FloatDomainVsIntegerDomain: n=%u iters=%d\n", + n, + iters); + std::printf(" build_ms: int=%.3f float=%.3f ratio=%.2fx\n", + int_build.value_or_throw(), + float_build.value_or_throw(), + 
float_build.value_or_throw() / int_build.value_or_throw()); + std::printf(" buckets : int=%zu float=%zu ratio=%.2fx\n", + int_buckets.value_or_throw(), + float_buckets.value_or_throw(), + static_cast(float_buckets.value_or_throw()) + / std::max(1, int_buckets.value_or_throw())); + + for(const auto& point : points) { + const int32_t lo = std::min(point.lo, max_value); + const int32_t hi = std::min(point.hi, max_value); + ASSERT_LE(lo, hi); + + auto int_stats = run_sortable_perf_range( + *int_index.index, + field, + ndd::filter::int_to_sortable(lo), + ndd::filter::int_to_sortable(hi), + iters, + int_build.value_or_throw(), + int_buckets.value_or_throw()); + ASSERT_TRUE(int_stats.ok()) << int_stats.message; + + auto float_stats = run_sortable_perf_range( + *float_index.index, + field, + ndd::filter::float_to_sortable(static_cast(lo)), + ndd::filter::float_to_sortable(static_cast(hi)), + iters, + float_build.value_or_throw(), + float_buckets.value_or_throw()); + ASSERT_TRUE(float_stats.ok()) << float_stats.message; + + ASSERT_EQ(int_stats.value_or_throw().cardinality, + float_stats.value_or_throw().cardinality); + + std::printf(" %-10s [%8d,%8d] card=%llu " + "range_ms: int=%.3f float=%.3f ratio=%.2fx " + "bitmap_bytes: int=%zu float=%zu\n", + point.label, + lo, + hi, + static_cast( + int_stats.value_or_throw().cardinality), + int_stats.value_or_throw().query_ms_per_call, + float_stats.value_or_throw().query_ms_per_call, + float_stats.value_or_throw().query_ms_per_call + / int_stats.value_or_throw().query_ms_per_call, + int_stats.value_or_throw().bitmap_bytes, + float_stats.value_or_throw().bitmap_bytes); + } +} + +// ===================================================================== +// NumericRangeBench_MT: same as above, but with N threads hammering +// range() concurrently against ONE shared Filter. Each thread issues +// computeFilterBitmap in a tight loop for a fixed wall-clock window. 
+// +// What this tells us: if dirty range() regresses here vs the clean +// build but the single-threaded NumericRangeBench above does not, +// the cost is concurrency-related (heap / allocator / cache-line +// contention triggered by the dirty in-memory layout), not per-call +// algorithmic. +// +// Activation: same env vars as the single-threaded bench, plus: +// ENDEE_BENCH_THREADS (default 16) +// ENDEE_BENCH_SECONDS (default 8) +// ===================================================================== +namespace { +struct MtResult { + uint64_t total_ops = 0; + uint64_t result_card_sample = 0; +}; + +void run_bench_point_mt(Filter& filter, + const std::string& field, + const BenchPoint& pt, + int threads, + double seconds) { + json query = json::array({ + {{field, {{"$range", json::array({pt.lo, pt.hi})}}}} + }); + + // Warmup serially -- prime page cache + schema cache. + for (int i = 0; i < 3; ++i) { + auto r = filter.computeFilterBitmap(query); + ASSERT_TRUE(r.ok()) << r.message; + } + + std::atomic start{false}; + std::atomic stop{false}; + std::vector per_thread(threads); + + auto worker = [&](int tid) { + while (!start.load(std::memory_order_acquire)) { + std::this_thread::yield(); + } + uint64_t ops = 0; + uint64_t card_sample = 0; + while (!stop.load(std::memory_order_acquire)) { + auto r = filter.computeFilterBitmap(query); + if (!r.ok()) { + std::fprintf(stderr, "thread %d: %s\n", tid, r.message.c_str()); + return; + } + if ((ops & 0xFFF) == 0) { + card_sample = r.value_or_throw().cardinality(); + } + ++ops; + } + per_thread[tid].total_ops = ops; + per_thread[tid].result_card_sample = card_sample; + }; + + std::vector ts; + ts.reserve(threads); + for (int i = 0; i < threads; ++i) ts.emplace_back(worker, i); + + auto t0 = std::chrono::steady_clock::now(); + start.store(true, std::memory_order_release); + + std::this_thread::sleep_for(std::chrono::duration(seconds)); + stop.store(true, std::memory_order_release); + + for (auto& t : ts) t.join(); + auto 
t1 = std::chrono::steady_clock::now(); + + uint64_t total_ops = 0; + uint64_t card = 0; + for (const auto& r : per_thread) { + total_ops += r.total_ops; + if (r.result_card_sample) card = r.result_card_sample; + } + const double elapsed_s = + std::chrono::duration(t1 - t0).count(); + const double qps = total_ops / elapsed_s; + const double per_call_ms = (elapsed_s * 1000.0 * threads) / total_ops; + + std::printf(" %-12s [% 8d,% 8d] threads=%d ops=%llu qps=%.1f " + "per_call_avg=%.3f ms card=%llu\n", + pt.label, pt.lo, pt.hi, threads, + (unsigned long long)total_ops, qps, per_call_ms, + (unsigned long long)card); +} +} // namespace + +TEST(NumericRangeBench, RangeQueryMultiThreaded) { + const char* db_path = std::getenv("ENDEE_BENCH_DB"); + if (!db_path || !*db_path) { + GTEST_SKIP() << "Set ENDEE_BENCH_DB to a filter directory to run"; + } + const char* field_env = std::getenv("ENDEE_BENCH_FIELD"); + const std::string field = (field_env && *field_env) ? field_env : "id"; + const char* threads_env = std::getenv("ENDEE_BENCH_THREADS"); + const int threads = (threads_env && *threads_env) ? std::atoi(threads_env) : 16; + const char* seconds_env = std::getenv("ENDEE_BENCH_SECONDS"); + const double seconds = + (seconds_env && *seconds_env) ? 
std::atof(seconds_env) : 8.0; + ASSERT_GT(threads, 0); + ASSERT_GT(seconds, 0.0); + + std::printf("NumericRangeBench_MT: db=%s field=%s threads=%d seconds=%.1f\n", + db_path, field.c_str(), threads, seconds); + + Filter filter(db_path); + + const BenchPoint points[] = { + {"rate~0.99", 0, 9'900'000}, + {"rate~0.80", 0, 8'000'000}, + {"rate~0.50", 0, 5'000'000}, + {"rate~0.01", 0, 100'000}, + }; + + for (const auto& pt : points) { + run_bench_point_mt(filter, field, pt, threads, seconds); + } } diff --git a/tests/numeric_index_stress_test.cpp b/tests/numeric_index_stress_test.cpp new file mode 100644 index 0000000000..40f22b3e55 --- /dev/null +++ b/tests/numeric_index_stress_test.cpp @@ -0,0 +1,370 @@ +#include + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +#include "filter/filter.hpp" +#include "filter/numeric_index.hpp" +#include "json/nlohmann_json.hpp" + +namespace fs = std::filesystem; +using json = nlohmann::json; + +/* + * Stress test for the numeric inverted index invariant: + * for every (id, value) in the forward index, an $eq(value) query + * must return id; and the set of ids returned for value V must equal + * exactly the set of ids whose forward-mapped value is V. + * + * Two complementary phases: + * + * A. SaturatedDuplicatesThenSplit -- builds the pathological state + * from the verified plan deterministically. For each anchor value + * A, insert MAX_SIZE + EXTRA ids at A so the bucket saturates + * with delta-0 entries and pushes EXTRA into the summary_bitmap + * via Bucket::add's saturated-duplicate short-circuit. Then + * insert a few ids at A's float-next-up neighbor (which lands in + * the same bucket: float spacing near A puts that delta well + * under MAX_DELTA). The first such insert hits the slide-split + * fallthrough; the next triggers a real slide-split. 
Verifies
+ *    $eq(A) returns all surviving ids -- pre-fix the split rebuilds
+ *    the left bitmap from ids[] only and EXTRA ids vanish.
+ *
+ * B. RandomChurnPlusDrain -- mixed insert / value-update / remove
+ *    workload, then drain every id still bound to an anchor. The
+ *    drain order is randomized so removes interleave bitmap-only
+ *    and ids[] entries; the model is the ground truth for the
+ *    invariant check after each phase.
+ *
+ * The Filter API is used end-to-end so the test exercises put_internal
+ * (remove-old + add-new) on updates and remove_from_buckets on removes.
+ */
+
+namespace {
+
+static void expect_ok(const ndd::OperationResult<>& r) {
+  ASSERT_TRUE(r.ok()) << r.message;
+}
+
+template <typename T>
+static T unwrap(ndd::OperationResult<T> r) {
+  EXPECT_TRUE(r.ok()) << r.message;
+  EXPECT_TRUE(r.value.has_value());
+  return std::move(*r.value);
+}
+
+/*
+ * Floats are the on-the-wire value type for numeric filters. Encode
+ * them with full precision so the JSON round-trip lands on exactly the
+ * same float (and therefore exactly the same sortable bucket key) as
+ * the C++ float we hold here.
+ */
+static std::string score_payload(float v) {
+  std::ostringstream os;
+  os.precision(std::numeric_limits<float>::max_digits10);
+  os << R"({"score": )" << v << "}";
+  return os.str();
+}
+
+struct Model {
+  std::unordered_map<ndd::idInt, float> id_to_value;
+  // Float keys here are exact: we only ever store values that came
+  // out of Model::set, which received them as floats with no further
+  // arithmetic, so equality and hashing on the bit pattern are safe.
+  std::unordered_map<float, std::unordered_set<ndd::idInt>> value_to_ids;
+
+  void set(ndd::idInt id, float value) {
+    auto it = id_to_value.find(id);
+    if(it != id_to_value.end()) {
+      auto& old_set = value_to_ids[it->second];
+      old_set.erase(id);
+      if(old_set.empty()) {
+        value_to_ids.erase(it->second);
+      }
+      it->second = value;
+    } else {
+      id_to_value.emplace(id, value);
+    }
+    value_to_ids[value].insert(id);
+  }
+
+  void erase(ndd::idInt id) {
+    auto it = id_to_value.find(id);
+    if(it == id_to_value.end()) {
+      return;
+    }
+    auto& set = value_to_ids[it->second];
+    set.erase(id);
+    if(set.empty()) {
+      value_to_ids.erase(it->second);
+    }
+    id_to_value.erase(it);
+  }
+};
+
+static void verify_eq_consistency(Filter& filter, const Model& model,
+                                  const std::string& tag) {
+  SCOPED_TRACE("verify_eq_consistency: " + tag);
+  for(const auto& [value, expected_ids] : model.value_to_ids) {
+    json q = json::array({ { {"score", { {"$eq", value} } } } });
+    auto ids = unwrap(filter.getIdsMatchingFilter(q));
+    std::unordered_set<ndd::idInt> got(ids.begin(), ids.end());
+    ASSERT_EQ(got.size(), expected_ids.size())
+        << "value=" << value
+        << " expected_count=" << expected_ids.size()
+        << " got_count=" << got.size();
+    for(ndd::idInt eid : expected_ids) {
+      ASSERT_TRUE(got.count(eid))
+          << "value=" << value << " missing id=" << eid;
+    }
+  }
+}
+
+class NumericStressFixture : public ::testing::Test {
+protected:
+  std::string db_path;
+  std::unique_ptr<Filter> filter;
+
+  void SetUp() override {
+    db_path = "./stress_db_" + std::to_string(::rand());
+    if(fs::exists(db_path)) {
+      fs::remove_all(db_path);
+    }
+    filter = std::make_unique<Filter>(db_path);
+  }
+
+  void TearDown() override {
+    filter.reset();
+    if(fs::exists(db_path)) {
+      fs::remove_all(db_path);
+    }
+  }
+};
+
+} // namespace
+
+TEST_F(NumericStressFixture, SaturatedDuplicatesThenSplit) {
+  /*
+   * Pick a handful of unrelated anchor values. They must be far
+   * apart in sortable space so they live in different buckets and
+   * don't accidentally help each other split.
+   */
+  const std::vector<float> anchors = { 100.0f, 5'000.0f, 250'000.0f };
+  constexpr ndd::idInt EXTRA = 200;
+
+  Model model;
+  ndd::idInt next_id = 1;
+
+  for(float A : anchors) {
+    /*
+     * Phase A.1 -- saturate the bucket purely with delta-0
+     * duplicates at A. The first MAX_SIZE go into ids[]/deltas[];
+     * the trailing EXTRA fall through Bucket::add's saturated
+     * short-circuit into summary_bitmap only.
+     */
+    for(ndd::idInt i = 0; i < ndd::filter::Bucket::MAX_SIZE + EXTRA; ++i) {
+      ndd::idInt id = next_id++;
+      expect_ok(filter->add_filters_from_json(id, score_payload(A)));
+      model.set(id, A);
+    }
+
+    /*
+     * Phase A.2 -- introduce a value boundary in the same bucket.
+     * std::nextafterf(A, +inf) is one ULP above A: it lands in the
+     * same bucket (sortable delta == 1, well under MAX_DELTA). The
+     * first such insert hits the slide-split fallthrough (all
+     * existing deltas zero), placing a non-zero delta into ids[].
+     * The second insert (a duplicate of A here) now finds a value
+     * boundary and triggers a real slide-split. Pre-fix that
+     * rebuild drops the EXTRA bitmap-only ids.
+     */
+    const float A_next = std::nextafterf(A, std::numeric_limits<float>::infinity());
+    ASSERT_NE(A, A_next);
+
+    ndd::idInt boundary_id = next_id++;
+    expect_ok(filter->add_filters_from_json(boundary_id, score_payload(A_next)));
+    model.set(boundary_id, A_next);
+
+    ndd::idInt split_trigger_id = next_id++;
+    expect_ok(filter->add_filters_from_json(split_trigger_id, score_payload(A)));
+    model.set(split_trigger_id, A);
+  }
+
+  verify_eq_consistency(*filter, model, "after saturate+split per anchor");
+
+  /*
+   * A few more inserts and a final consistency sweep, to catch a
+   * regression where a damaged left bitmap survives the first
+   * verification but corrupts a subsequent operation.
+ */ + for(float A : anchors) { + for(int extra_pass = 0; extra_pass < 50; ++extra_pass) { + ndd::idInt id = next_id++; + expect_ok(filter->add_filters_from_json(id, score_payload(A))); + model.set(id, A); + } + } + + verify_eq_consistency(*filter, model, "after follow-up inserts"); +} + +TEST_F(NumericStressFixture, RandomChurnPlusDrain) { + /* + * Hot values: dense duplicates. Each lives in its own bucket + * because they are far apart in sortable space, so saturation + * happens per-bucket. + */ + const std::vector hot_values = { 1'000.0f, 50'000.0f, 1'000'000.0f }; + + /* + * Warm offsets are one ULP up from a hot value: same bucket as the + * hot anchor, non-zero delta. Used sparingly so a hot bucket can + * still saturate before any warm enters. + */ + auto warm_for = [](float hot) { + return std::nextafterf(hot, std::numeric_limits::infinity()); + }; + + std::mt19937 rng(0xDEADBEEFu); // fixed seed for reproducibility + std::uniform_real_distribution coin(0.0, 1.0); + std::uniform_real_distribution cold_dist(50.0f, 500'000.0f); + + Model model; + ndd::idInt next_id = 1; + + /* + * Warm-up: drive each hot value past MAX_SIZE so its bucket holds + * bitmap-only entries before random churn starts. Without this + * priming the random workload would interleave warm inserts + * before saturation and the slide-split fallthrough path would + * never form. 
+ */ + constexpr ndd::idInt PRIME_EXTRA = 100; + for(float h : hot_values) { + for(ndd::idInt i = 0; i < ndd::filter::Bucket::MAX_SIZE + PRIME_EXTRA; ++i) { + ndd::idInt id = next_id++; + expect_ok(filter->add_filters_from_json(id, score_payload(h))); + model.set(id, h); + } + } + verify_eq_consistency(*filter, model, "after priming"); + + auto pick_value = [&]() -> float { + const double v = coin(rng); + if(v < 0.60) { + std::uniform_int_distribution p(0, hot_values.size() - 1); + return hot_values[p(rng)]; + } + if(v < 0.80) { + std::uniform_int_distribution p(0, hot_values.size() - 1); + return warm_for(hot_values[p(rng)]); + } + return cold_dist(rng); + }; + + auto pick_existing_id = [&]() -> ndd::idInt { + std::uniform_int_distribution p(0, model.id_to_value.size() - 1); + auto it = model.id_to_value.begin(); + std::advance(it, p(rng)); + return it->first; + }; + + constexpr int ROUNDS = 6000; + constexpr int CHECK_EVERY = 1500; + + for(int round = 0; round < ROUNDS; ++round) { + const double action_dice = coin(rng); + const bool can_touch_existing = !model.id_to_value.empty(); + + if(action_dice < 0.55 || !can_touch_existing) { + ndd::idInt id = next_id++; + float v = pick_value(); + expect_ok(filter->add_filters_from_json(id, score_payload(v))); + model.set(id, v); + } else if(action_dice < 0.85) { + ndd::idInt id = pick_existing_id(); + float v = pick_value(); + expect_ok(filter->add_filters_from_json(id, score_payload(v))); + model.set(id, v); + } else { + ndd::idInt id = pick_existing_id(); + float old_v = model.id_to_value[id]; + expect_ok(filter->remove_filters_from_json(id, score_payload(old_v))); + model.erase(id); + } + + if(round != 0 && round % CHECK_EVERY == 0) { + verify_eq_consistency(*filter, model, + "mid-churn round=" + std::to_string(round)); + } + } + + verify_eq_consistency(*filter, model, "post-churn"); + + /* + * Drain every id still bound to a hot value, in shuffled order so + * removes mix ids[] entries and bitmap-only entries. 
Verify after + * each batch so a buggy is_empty() (deleting a bucket while + * bitmap-only entries remain) is caught before subsequent removes + * silently reconcile state. + */ + constexpr size_t DRAIN_BATCH = 25; + for(float h : hot_values) { + auto it = model.value_to_ids.find(h); + if(it == model.value_to_ids.end()) { + continue; + } + std::vector ids_at_hot(it->second.begin(), it->second.end()); + std::shuffle(ids_at_hot.begin(), ids_at_hot.end(), rng); + + for(size_t i = 0; i < ids_at_hot.size(); i += DRAIN_BATCH) { + const size_t end = std::min(i + DRAIN_BATCH, ids_at_hot.size()); + for(size_t j = i; j < end; ++j) { + expect_ok(filter->remove_filters_from_json( + ids_at_hot[j], score_payload(h))); + model.erase(ids_at_hot[j]); + } + verify_eq_consistency(*filter, model, + "drain h=" + std::to_string(h) + + " batch_end=" + std::to_string(end)); + } + } + + verify_eq_consistency(*filter, model, "post-drain"); + + /* + * Range-query cross-check across the union of all anchors. Result + * must equal the model union for values inside the band. Exercises + * the range slow path on every bucket whose extent is not fully + * covered. 
+ */ + constexpr float RANGE_LO = 900.0f; + constexpr float RANGE_HI = 1'500'000.0f; + json range_q = + json::array({ { {"score", { {"$range", { RANGE_LO, RANGE_HI }} } } } }); + auto range_ids = unwrap(filter->getIdsMatchingFilter(range_q)); + std::unordered_set got_range(range_ids.begin(), range_ids.end()); + + std::unordered_set expected_range; + for(const auto& [value, ids_set] : model.value_to_ids) { + if(value >= RANGE_LO && value <= RANGE_HI) { + expected_range.insert(ids_set.begin(), ids_set.end()); + } + } + ASSERT_EQ(got_range.size(), expected_range.size()) + << "range query cardinality mismatch"; + for(ndd::idInt eid : expected_range) { + ASSERT_TRUE(got_range.count(eid)) + << "range query missing id=" << eid + << " (forward value=" << model.id_to_value[eid] << ")"; + } +} diff --git a/tests/repo_filter.py b/tests/repo_filter.py new file mode 100644 index 0000000000..3192bed08c --- /dev/null +++ b/tests/repo_filter.py @@ -0,0 +1,145 @@ +#!/usr/bin/env python3 +""" +Reproduce the duplicate-heavy numeric bucket cliff in endee. + +Inserts 65,535 vectors with identical filter value, then 1 more (=65,536), +then 1 more (=65,537). Searches at each step. Recall collapses to 0 at the +65,536 boundary because Bucket::serialize truncates uint16_t count to 0. + +Run with a fresh endee server on localhost:8080. 
+""" + +import json +import os +import sys +import time +import requests +import msgpack + +BASE = os.environ.get("ENDEE_URL", "http://localhost:8080") +TOKEN = os.environ.get("ENDEE_TOKEN", "") +INDEX = "bucket_repro" +DIM = 16 +FILTER_VALUE = 100 +BATCH = 1000 + +HEADERS = {"Content-Type": "application/json"} +if TOKEN: + HEADERS["Authorization"] = f"Bearer {TOKEN}" + + +def post(path, payload): + r = requests.post(f"{BASE}{path}", headers=HEADERS, data=json.dumps(payload)) + if r.status_code >= 400: + raise RuntimeError(f"POST {path} -> {r.status_code}: {r.text}") + return r + + +def delete(path): + r = requests.delete(f"{BASE}{path}", headers=HEADERS) + return r + + +def make_vector(i): + # Deterministic 16-d vector that varies enough for HNSW to be meaningful + return [((i + j * 7) % 1000) / 1000.0 for j in range(DIM)] + + +def search_filtered(k=10): + body = { + "vector": make_vector(0), + "k": k, + "filter": json.dumps([{"score": {"$eq": FILTER_VALUE}}]), + } + r = post(f"/api/v1/index/{INDEX}/search", body) + results = msgpack.unpackb(r.content, raw=False) + # results is List[VectorResult], each VectorResult is a list: + # [similarity, id, meta, filter, norm, vector] + return [row[1] for row in results] + + +def search_unfiltered(k=10): + body = {"vector": make_vector(0), "k": k} + r = post(f"/api/v1/index/{INDEX}/search", body) + results = msgpack.unpackb(r.content, raw=False) + return [row[1] for row in results] + + +def insert_range(lo, hi): + """Insert ids v{lo} .. 
v{hi-1}.""" + for batch_start in range(lo, hi, BATCH): + batch_end = min(batch_start + BATCH, hi) + items = [ + { + "id": f"v{i}", + "vector": make_vector(i), + "filter": json.dumps({"score": FILTER_VALUE}), + } + for i in range(batch_start, batch_end) + ] + post(f"/api/v1/index/{INDEX}/vector/insert", items) + + +def report(label, total_inserted): + filtered = search_filtered(k=10) + unfiltered = search_unfiltered(k=10) + print( + f"[{label}] inserted={total_inserted:>5} " + f"filtered_hits={len(filtered):>2}/10 " + f"unfiltered_hits={len(unfiltered):>2}/10" + ) + return len(filtered) + + +def main(): + # Cleanup any prior run + delete(f"/api/v1/index/{INDEX}/delete") + + # 1. Create index + post( + "/api/v1/index/create", + { + "index_name": INDEX, + "dim": DIM, + "space_type": "l2", + "precision": "float32", + "sparse_model": "None", + }, + ) + print(f"created index {INDEX} dim={DIM}") + + # 2. Insert 65,535 vectors + t0 = time.time() + insert_range(0, 65_535) + print(f"inserted 65535 vectors in {time.time()-t0:.1f}s") + + # 3. Sanity: filtered search works + pre_cliff_hits = report("pre-cliff ", 65_535) + assert pre_cliff_hits == 10, "expected 10 filtered hits before cliff" + + # 4. The cliff: one more insert -> total 65,536 + insert_range(65_535, 65_536) + cliff_hits = report("AT CLIFF ", 65_536) + + # 5. Off the cliff: one more insert -> total 65,537 + insert_range(65_536, 65_537) + post_cliff_hits = report("post-cliff", 65_537) + + # 6. Cleanup + delete(f"/api/v1/index/{INDEX}/delete") + + # 7. 
Report + print() + print("=== Summary ===") + print(f"pre-cliff (65,535) filtered hits: {pre_cliff_hits}/10") + print(f"AT cliff (65,536) filtered hits: {cliff_hits}/10 <-- expect 0") + print(f"post cliff (65,537) filtered hits: {post_cliff_hits}/10") + if cliff_hits == 0 and pre_cliff_hits > 0: + print("BUG REPRODUCED: filter recall dropped to zero at the cliff.") + sys.exit(0) + print("BUG NOT REPRODUCED — investigate.") + sys.exit(1) + + +if __name__ == "__main__": + main() \ No newline at end of file diff --git a/tests/request_validation_test.cpp b/tests/request_validation_test.cpp new file mode 100644 index 0000000000..f080a8f508 --- /dev/null +++ b/tests/request_validation_test.cpp @@ -0,0 +1,102 @@ +#include +#include + +#include "core/types.hpp" +#include "crow/json.h" +#include "server/request_validation.hpp" +#include "settings.hpp" + +namespace { + +const crow::json::rvalue& field_from_json(const std::string& json_body, const char* field_name) { + static crow::json::rvalue body; + body = crow::json::load(json_body); + return body[field_name]; +} + +} // namespace + +TEST(RequestValidationTest, RejectsNegativePrefilterThreshold) { + auto result = ndd::server::parse_bounded_size(field_from_json(R"({"v": -1})", "v"), + "filter_params.prefilter_threshold", + 0, + settings::MAX_VECTORS_ADMIN); + + EXPECT_FALSE(result.ok()); + EXPECT_NE(result.message.find("must be between"), std::string::npos); +} + +TEST(RequestValidationTest, RejectsNegativeBoostPercentage) { + auto result = ndd::server::parse_bounded_size(field_from_json(R"({"v": -1})", "v"), + "filter_params.boost_percentage", + 0, + 100); + + EXPECT_FALSE(result.ok()); + EXPECT_NE(result.message.find("must be between"), std::string::npos); +} + +TEST(RequestValidationTest, AcceptsValidBounds) { + auto zero = ndd::server::parse_bounded_size(field_from_json(R"({"v": 0})", "v"), + "filter_params.prefilter_threshold", + 0, + settings::MAX_VECTORS_ADMIN); + ASSERT_TRUE(zero.ok()) << zero.message; + 
ASSERT_TRUE(zero.value.has_value()); + EXPECT_EQ(*zero.value, 0u); + + auto max_prefilter = ndd::server::parse_bounded_size( + field_from_json(R"({"v": 1000000000})", "v"), + "filter_params.prefilter_threshold", + 0, + settings::MAX_VECTORS_ADMIN); + ASSERT_TRUE(max_prefilter.ok()) << max_prefilter.message; + ASSERT_TRUE(max_prefilter.value.has_value()); + EXPECT_EQ(*max_prefilter.value, settings::MAX_VECTORS_ADMIN); + + auto max_boost = ndd::server::parse_bounded_size(field_from_json(R"({"v": 100})", "v"), + "filter_params.boost_percentage", + 0, + 100); + ASSERT_TRUE(max_boost.ok()) << max_boost.message; + ASSERT_TRUE(max_boost.value.has_value()); + EXPECT_EQ(*max_boost.value, 100u); +} + +TEST(RequestValidationTest, FilterParamsDefaultsRemainUnchangedWhenAbsent) { + ndd::FilterParams filter_params; + + EXPECT_EQ(filter_params.prefilter_threshold, settings::PREFILTER_CARDINALITY_THRESHOLD); + EXPECT_EQ(filter_params.boost_percentage, settings::FILTER_BOOST_PERCENTAGE); +} + +TEST(RequestValidationTest, RejectsOutOfRangeValues) { + auto prefilter = ndd::server::parse_bounded_size( + field_from_json(R"({"v": 1000000001})", "v"), + "filter_params.prefilter_threshold", + 0, + settings::MAX_VECTORS_ADMIN); + EXPECT_FALSE(prefilter.ok()); + + auto boost = ndd::server::parse_bounded_size(field_from_json(R"({"v": 101})", "v"), + "filter_params.boost_percentage", + 0, + 100); + EXPECT_FALSE(boost.ok()); +} + +TEST(RequestValidationTest, RejectsNonIntegerValues) { + auto floating = ndd::server::parse_bounded_size(field_from_json(R"({"v": 1.5})", "v"), + "filter_params.boost_percentage", + 0, + 100); + EXPECT_FALSE(floating.ok()); + EXPECT_NE(floating.message.find("must be an integer"), std::string::npos); + + auto string_value = ndd::server::parse_bounded_size(field_from_json(R"({"v": "5"})", "v"), + "filter_params.boost_percentage", + 0, + 100); + EXPECT_FALSE(string_value.ok()); + EXPECT_NE(string_value.message.find("must be an integer"), std::string::npos); +} diff 
--git a/tests/vector_storage_test.cpp b/tests/vector_storage_test.cpp new file mode 100644 index 0000000000..147e00a4e6 --- /dev/null +++ b/tests/vector_storage_test.cpp @@ -0,0 +1,336 @@ +// Tests for VectorStorage upsert cleanup and deleteFilter meta sync. +// These cover the two correctness gaps fixed alongside this file: +// 1. store_vectors_batch must remove the prior filter index entries when the +// id_mapper signals the str_id was already live (is_new_to_db == false). +// 2. deleteFilter must clear meta.filter so subsequent get_meta calls do not +// return a document whose index entries are gone. + +#include +#include +#include +#include +#include +#include + +#include "json/nlohmann_json.hpp" +// hnswlib must be included before vector_storage.hpp: vector_storage.hpp pulls in +// quant/dispatch.hpp first, but space.hpp (reached transitively) uses +// ndd::quant::get_quantizer_dispatch, which is only defined further down in +// dispatch.hpp. Routing through hnswlib.h first lets dispatch.hpp resolve +// fully before space.hpp parses its constructor body. +#include "hnsw/hnswlib.h" +#include "storage/vector_storage.hpp" + +namespace fs = std::filesystem; +using json = nlohmann::json; + +namespace { + +QuantVectorObject make_obj(const std::string& id, const std::string& filter_json) { + QuantVectorObject obj; + obj.id = id; + obj.filter = filter_json; + obj.norm = 1.0f; + // FP32 quantization with dim=4 => 16 bytes of vector payload. 
+ obj.quant_vector.assign(4 * sizeof(float), 0); + return obj; +} + +} // namespace + +class VectorStorageTest : public ::testing::Test { +protected: + std::string base_path; + std::unique_ptr storage; + + void SetUp() override { + base_path = "./test_vs_" + std::to_string(std::rand()); + if(fs::exists(base_path)) { + fs::remove_all(base_path); + } + fs::create_directories(base_path); + storage = std::make_unique( + base_path, "test_index", 4, ndd::quant::QuantizationLevel::FP32); + } + + void TearDown() override { + storage.reset(); + if(fs::exists(base_path)) { + fs::remove_all(base_path); + } + } + + bool filter_matches(const json& filter_array, ndd::idInt id) { + auto result = storage->filter_store_->getIdsMatchingFilter(filter_array); + EXPECT_TRUE(result.ok()) << result.message; + if(!result.ok()) return false; + const auto& ids = result.value_or_throw(); + return std::find(ids.begin(), ids.end(), id) != ids.end(); + } +}; + +// Upsert path: re-inserting a live point with a different filter must drop the +// old filter's index entries. Before the fix, the old "color":"red" mapping +// kept matching id 42 even after the upsert wrote "color":"blue". 
+TEST_F(VectorStorageTest, UpsertRemovesStaleCategoryFilter) { + auto v1 = make_obj("v1", R"({"color":"red"})"); + ASSERT_TRUE(storage->store_vectors_batch({{42, v1}}, {true}).ok()); + ASSERT_TRUE(filter_matches(json::array({{{"color", {{"$eq", "red"}}}}}), 42)); + + auto v1_new = make_obj("v1", R"({"color":"blue"})"); + auto result = storage->store_vectors_batch({{42, v1_new}}, {false}); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_FALSE(filter_matches(json::array({{{"color", {{"$eq", "red"}}}}}), 42)) + << "Stale 'color=red' index entry still matches id 42 after upsert"; + EXPECT_TRUE(filter_matches(json::array({{{"color", {{"$eq", "blue"}}}}}), 42)); + EXPECT_EQ(storage->get_meta(42).filter, R"({"color":"blue"})"); +} + +// Same upsert invariant for numeric filters: the prior numeric index entry must +// be removed before the new one is written. +TEST_F(VectorStorageTest, UpsertRemovesStaleNumericFilter) { + auto v1 = make_obj("v1", R"({"age":30})"); + ASSERT_TRUE(storage->store_vectors_batch({{7, v1}}, {true}).ok()); + ASSERT_TRUE(filter_matches(json::array({{{"age", {{"$eq", 30}}}}}), 7)); + + auto v1_new = make_obj("v1", R"({"age":40})"); + auto result = storage->store_vectors_batch({{7, v1_new}}, {false}); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_FALSE(filter_matches(json::array({{{"age", {{"$eq", 30}}}}}), 7)) + << "Stale 'age=30' index entry still matches id 7 after upsert"; + EXPECT_TRUE(filter_matches(json::array({{{"age", {{"$eq", 40}}}}}), 7)); + EXPECT_EQ(storage->get_meta(7).filter, R"({"age":40})"); +} + +// is_new_to_db == true means the slot is fresh or was reused from a deleted slot +// whose filter index was already scrubbed. The cleanup pass must skip it; no +// spurious meta read should occur on a slot that has no prior write. 
+TEST_F(VectorStorageTest, UpsertFreshSlotSkipsCleanup) { + auto v1 = make_obj("v1", R"({"color":"red"})"); + auto result = storage->store_vectors_batch({{100, v1}}, {true}); + ASSERT_TRUE(result.ok()) << result.message; + EXPECT_TRUE(filter_matches(json::array({{{"color", {{"$eq", "red"}}}}}), 100)); +} + +// If is_new_to_db is omitted (empty), we fall back to legacy "treat all as new" +// semantics for callers that have not been updated to forward the flag. +TEST_F(VectorStorageTest, EmptyFlagsVectorTreatsAllAsNew) { + auto v1 = make_obj("v1", R"({"color":"red"})"); + auto result = storage->store_vectors_batch({{55, v1}}); // no flags + ASSERT_TRUE(result.ok()) << result.message; + EXPECT_TRUE(filter_matches(json::array({{{"color", {{"$eq", "red"}}}}}), 55)); +} + +// Mismatched flag length is a programmer error and must be surfaced rather than +// silently treating some entries one way and others another. +TEST_F(VectorStorageTest, MismatchedFlagsRejected) { + auto v1 = make_obj("v1", R"({"color":"red"})"); + auto v2 = make_obj("v2", R"({"color":"blue"})"); + auto result = storage->store_vectors_batch({{1, v1}, {2, v2}}, {true}); // 1 flag for 2 vecs + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 1u); +} + +// is_new_to_db == false claims the slot is live, but if meta does not exist +// that is torn state from a previous partial write. Surface it instead of +// silently overwriting. +TEST_F(VectorStorageTest, UpsertOnMissingMetaSurfacesTornState) { + auto v = make_obj("v1", R"({"color":"red"})"); + auto result = storage->store_vectors_batch({{999, v}}, {false}); + EXPECT_FALSE(result.ok()); + EXPECT_EQ(result.code, 103u) << result.message; +} + +// Upsert from a vector that had no filter into one that does: cleanup pass +// reads empty meta.filter, skips remove, and the new filter is added. 
+TEST_F(VectorStorageTest, UpsertFromEmptyFilterToPopulatedCategory) { + auto v1 = make_obj("v1", ""); + ASSERT_TRUE(storage->store_vectors_batch({{20, v1}}, {true}).ok()); + + auto v1_new = make_obj("v1", R"({"color":"green"})"); + auto result = storage->store_vectors_batch({{20, v1_new}}, {false}); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_TRUE(filter_matches(json::array({{{"color", {{"$eq", "green"}}}}}), 20)); +} + +TEST_F(VectorStorageTest, UpsertFromEmptyFilterToPopulatedNumeric) { + auto v1 = make_obj("v1", ""); + ASSERT_TRUE(storage->store_vectors_batch({{120, v1}}, {true}).ok()); + + auto v1_new = make_obj("v1", R"({"score":75})"); + auto result = storage->store_vectors_batch({{120, v1_new}}, {false}); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_TRUE(filter_matches(json::array({{{"score", {{"$eq", 75}}}}}), 120)); +} + +// Upsert from a populated filter into an empty filter: the old index entries +// must be removed, and the new filter add path is a no-op for an empty doc. 
+TEST_F(VectorStorageTest, UpsertFromPopulatedFilterToEmptyCategory) { + auto v1 = make_obj("v1", R"({"color":"yellow"})"); + ASSERT_TRUE(storage->store_vectors_batch({{21, v1}}, {true}).ok()); + ASSERT_TRUE(filter_matches(json::array({{{"color", {{"$eq", "yellow"}}}}}), 21)); + + auto v1_new = make_obj("v1", ""); + auto result = storage->store_vectors_batch({{21, v1_new}}, {false}); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_FALSE(filter_matches(json::array({{{"color", {{"$eq", "yellow"}}}}}), 21)) + << "Old 'color=yellow' index entry survived upsert to empty filter"; + EXPECT_TRUE(storage->get_meta(21).filter.empty()); +} + +TEST_F(VectorStorageTest, UpsertFromPopulatedFilterToEmptyNumeric) { + auto v1 = make_obj("v1", R"({"score":99})"); + ASSERT_TRUE(storage->store_vectors_batch({{121, v1}}, {true}).ok()); + ASSERT_TRUE(filter_matches(json::array({{{"score", {{"$eq", 99}}}}}), 121)); + + auto v1_new = make_obj("v1", ""); + auto result = storage->store_vectors_batch({{121, v1_new}}, {false}); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_FALSE(filter_matches(json::array({{{"score", {{"$eq", 99}}}}}), 121)) + << "Old 'score=99' numeric index entry survived upsert to empty filter"; + EXPECT_TRUE(storage->get_meta(121).filter.empty()); +} + +// deleteFilter must clear meta.filter when the stored doc matches the input +// document, so a get_meta call after deletion does not return a filter whose +// index entries are gone. 
+TEST_F(VectorStorageTest, DeleteFilterClearsMetaWhenMatchCategory) { + auto v1 = make_obj("v1", R"({"color":"red"})"); + ASSERT_TRUE(storage->store_vectors_batch({{42, v1}}, {true}).ok()); + ASSERT_EQ(storage->get_meta(42).filter, R"({"color":"red"})"); + + auto result = storage->deleteFilter(42, R"({"color":"red"})"); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_FALSE(filter_matches(json::array({{{"color", {{"$eq", "red"}}}}}), 42)); + EXPECT_TRUE(storage->get_meta(42).filter.empty()) + << "meta.filter still set after deleteFilter: " << storage->get_meta(42).filter; +} + +TEST_F(VectorStorageTest, DeleteFilterClearsMetaWhenMatchNumeric) { + auto v1 = make_obj("v1", R"({"score":80})"); + ASSERT_TRUE(storage->store_vectors_batch({{142, v1}}, {true}).ok()); + ASSERT_EQ(storage->get_meta(142).filter, R"({"score":80})"); + + auto result = storage->deleteFilter(142, R"({"score":80})"); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_FALSE(filter_matches(json::array({{{"score", {{"$eq", 80}}}}}), 142)); + EXPECT_TRUE(storage->get_meta(142).filter.empty()) + << "meta.filter still set after deleteFilter: " << storage->get_meta(142).filter; +} + +// deleteFilter should leave meta untouched if the caller asks to remove a +// document that no longer matches what is stored. Index entries are still +// removed (best effort). +TEST_F(VectorStorageTest, DeleteFilterLeavesMetaWhenDifferentCategory) { + auto v1 = make_obj("v1", R"({"color":"red"})"); + ASSERT_TRUE(storage->store_vectors_batch({{42, v1}}, {true}).ok()); + + auto result = storage->deleteFilter(42, R"({"color":"orange"})"); + ASSERT_TRUE(result.ok()) << result.message; + + // meta.filter was not the same doc we tried to remove, so it stays. 
+ EXPECT_EQ(storage->get_meta(42).filter, R"({"color":"red"})"); +} + +TEST_F(VectorStorageTest, DeleteFilterLeavesMetaWhenDifferentNumeric) { + auto v1 = make_obj("v1", R"({"score":80})"); + ASSERT_TRUE(storage->store_vectors_batch({{143, v1}}, {true}).ok()); + + auto result = storage->deleteFilter(143, R"({"score":81})"); + ASSERT_TRUE(result.ok()) << result.message; + + // meta.filter was not the same doc we tried to remove, so it stays. + EXPECT_EQ(storage->get_meta(143).filter, R"({"score":80})"); +} + +// Explicit updateFilter path (the API surface invoked by `index_manager.updateFilters`): +// after replacing filter A with filter B, queries against the OLD filter must no +// longer return the vector and queries against the NEW filter must. +TEST_F(VectorStorageTest, UpdateFilterReplacesCategoryFilter) { + auto v1 = make_obj("v1", R"({"color":"red"})"); + ASSERT_TRUE(storage->store_vectors_batch({{42, v1}}, {true}).ok()); + ASSERT_TRUE(filter_matches(json::array({{{"color", {{"$eq", "red"}}}}}), 42)); + + auto result = storage->updateFilter(42, R"({"color":"blue"})"); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_FALSE(filter_matches(json::array({{{"color", {{"$eq", "red"}}}}}), 42)) + << "Stale 'color=red' index entry still matches id 42 after updateFilter"; + EXPECT_TRUE(filter_matches(json::array({{{"color", {{"$eq", "blue"}}}}}), 42)); + EXPECT_EQ(storage->get_meta(42).filter, R"({"color":"blue"})"); +} + +TEST_F(VectorStorageTest, UpdateFilterReplacesNumericFilter) { + auto v1 = make_obj("v1", R"({"age":30})"); + ASSERT_TRUE(storage->store_vectors_batch({{7, v1}}, {true}).ok()); + ASSERT_TRUE(filter_matches(json::array({{{"age", {{"$eq", 30}}}}}), 7)); + + auto result = storage->updateFilter(7, R"({"age":40})"); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_FALSE(filter_matches(json::array({{{"age", {{"$eq", 30}}}}}), 7)) + << "Stale 'age=30' index entry still matches id 7 after updateFilter"; + 
EXPECT_TRUE(filter_matches(json::array({{{"age", {{"$eq", 40}}}}}), 7)); + EXPECT_EQ(storage->get_meta(7).filter, R"({"age":40})"); +} + +// updateFilter starting from an empty filter document: nothing to remove, but +// the new filter must be added and meta must reflect it. +TEST_F(VectorStorageTest, UpdateFilterFromEmptyCategory) { + auto v1 = make_obj("v1", ""); + ASSERT_TRUE(storage->store_vectors_batch({{30, v1}}, {true}).ok()); + + auto result = storage->updateFilter(30, R"({"color":"green"})"); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_TRUE(filter_matches(json::array({{{"color", {{"$eq", "green"}}}}}), 30)); + EXPECT_EQ(storage->get_meta(30).filter, R"({"color":"green"})"); +} + +TEST_F(VectorStorageTest, UpdateFilterFromEmptyNumeric) { + auto v1 = make_obj("v1", ""); + ASSERT_TRUE(storage->store_vectors_batch({{130, v1}}, {true}).ok()); + + auto result = storage->updateFilter(130, R"({"score":42})"); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_TRUE(filter_matches(json::array({{{"score", {{"$eq", 42}}}}}), 130)); + EXPECT_EQ(storage->get_meta(130).filter, R"({"score":42})"); +} + +// updateFilter to an empty document: the prior filter index entries must be +// removed and meta.filter must be cleared. 
+TEST_F(VectorStorageTest, UpdateFilterToEmptyCategory) { + auto v1 = make_obj("v1", R"({"color":"yellow"})"); + ASSERT_TRUE(storage->store_vectors_batch({{31, v1}}, {true}).ok()); + ASSERT_TRUE(filter_matches(json::array({{{"color", {{"$eq", "yellow"}}}}}), 31)); + + auto result = storage->updateFilter(31, ""); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_FALSE(filter_matches(json::array({{{"color", {{"$eq", "yellow"}}}}}), 31)) + << "Old 'color=yellow' index entry survived updateFilter to empty"; + EXPECT_TRUE(storage->get_meta(31).filter.empty()); +} + +TEST_F(VectorStorageTest, UpdateFilterToEmptyNumeric) { + auto v1 = make_obj("v1", R"({"score":55})"); + ASSERT_TRUE(storage->store_vectors_batch({{131, v1}}, {true}).ok()); + ASSERT_TRUE(filter_matches(json::array({{{"score", {{"$eq", 55}}}}}), 131)); + + auto result = storage->updateFilter(131, ""); + ASSERT_TRUE(result.ok()) << result.message; + + EXPECT_FALSE(filter_matches(json::array({{{"score", {{"$eq", 55}}}}}), 131)) + << "Old 'score=55' index entry survived updateFilter to empty"; + EXPECT_TRUE(storage->get_meta(131).filter.empty()); +} +