Merge pull request #6 from endee-io/dev

pankajEndee · web-flow · commit 14976c2edafc · 2026-02-24T12:08:27.000+05:30
Dev
diff --git a/README.md b/README.md
@@ -77,7 +77,7 @@ import io.endee.client.types.SpaceType;
 
 CreateIndexOptions options = CreateIndexOptions.builder("my_vectors", 384)
     .spaceType(SpaceType.COSINE)
-    .precision(Precision.INT8D)
+    .precision(Precision.INT8)
     .build();
 
 client.createIndex(options);
@@ -92,7 +92,7 @@ client.createIndex(options);
 | `spaceType` | Distance metric - `COSINE`, `L2`, or `IP` (inner product)                    | `COSINE` |
 | `m`         | Graph connectivity - higher values increase recall but use more memory       | 16       |
 | `efCon`     | Construction-time parameter - higher values improve index quality            | 128      |
-| `precision` | Quantization precision                                                       | `INT8D`  |
+| `precision` | Quantization precision                                                       | `INT8`   |
 
 ### Create a Hybrid Index
 
@@ -102,7 +102,7 @@ Hybrid indexes combine dense vector search with sparse vector search. Add the `s
 CreateIndexOptions options = CreateIndexOptions.builder("hybrid_index", 384)
     .sparseDimension(30000)    // Sparse vector dimension (vocabulary size)
     .spaceType(SpaceType.COSINE)
-    .precision(Precision.INT8D)
+    .precision(Precision.INT8)
     .build();
 
 client.createIndex(options);
@@ -189,12 +189,14 @@ for (QueryResult item : results) {
 
 **Query Parameters:**
 
-| Parameter        | Description                                             | Default  | Max  |
-| ---------------- | ------------------------------------------------------- | -------- | ---- |
-| `vector`         | Query vector (must match index dimension)               | Required | -    |
-| `topK`           | Number of results to return                             | 10       | 512  |
-| `ef`             | Search quality parameter - higher values improve recall | 128      | 1024 |
-| `includeVectors` | Include vector data in results                          | false    | -    |
+| Parameter                        | Description                                             | Default | Max       |
+| -------------------------------- | ------------------------------------------------------- | ------- | --------- |
+| `vector`                         | Query vector (must match index dimension)               | Required | -        |
+| `topK`                           | Number of results to return                             | 10      | 512       |
+| `ef`                             | Search quality parameter - higher values improve recall | 128     | 1024      |
+| `includeVectors`                 | Include vector data in results                          | false   | -         |
+| `prefilterCardinalityThreshold`  | Switch to postfiltering when estimated matches exceed this value | 10,000 | 1,000,000 |
+| `filterBoostPercentage`          | Bias results toward filter matches (0 = disabled)       | 0       | 100       |
 
 ## Filtered Querying
 
@@ -223,6 +225,29 @@ List<QueryResult> results = index.query(
 
 > **Note:** The `$range` operator supports values within **[0 - 999]**. Normalize larger values before upserting.
 
+### Filter Params
+
+Use `prefilterCardinalityThreshold` and `filterBoostPercentage` to fine-tune how filtering interacts with the approximate nearest neighbor (ANN) search:
+
+```java
+List<QueryResult> results = index.query(
+    QueryOptions.builder()
+        .vector(new double[] {0.15, 0.25 /* ... */})
+        .topK(5)
+        .filter(List.of(
+            Map.of("category", Map.of("$eq", "tech"))
+        ))
+        .prefilterCardinalityThreshold(50_000)  // Use postfilter when >50k vectors match
+        .filterBoostPercentage(20)              // Bias 20% toward filter-matching vectors
+        .build()
+);
+```
+
+| Parameter                       | Description                                                                                                                    | Default | Range             |
+| ------------------------------- | ------------------------------------------------------------------------------------------------------------------------------ | ------- | ----------------- |
+| `prefilterCardinalityThreshold` | When the estimated number of vectors matching the filter exceeds this value, postfiltering is used instead of prefiltering.    | 10,000  | 1,000–1,000,000   |
+| `filterBoostPercentage`         | Percentage by which filter-matching vectors are boosted during scoring. Set to `0` to disable. Higher values favor filtered results. | 0   | 0–100             |
+
 ## Hybrid Search
 
 ### Upserting Hybrid Vectors
@@ -340,7 +365,7 @@ IndexDescription info = index.describe();
 System.out.println(info);
 // IndexDescription{name='my_index', spaceType=COSINE, dimension=384,
 //                  sparseDimension=0, isHybrid=false, count=1000,
-//                  precision=INT8D, m=16}
+//                  precision=INT8, m=16}
 ```
 
 ### Check if Index is Hybrid
@@ -357,8 +382,8 @@ Endee supports different quantization precision levels:
 import io.endee.client.types.Precision;
 
 Precision.BINARY    // Binary quantization (1-bit) - smallest storage, fastest search
-Precision.INT8D     // 8-bit integer quantization (default) - balanced performance
-Precision.INT16D    // 16-bit integer quantization - higher precision
+Precision.INT8      // 8-bit integer quantization (default) - balanced performance
+Precision.INT16     // 16-bit integer quantization - higher precision
 Precision.FLOAT16   // 16-bit floating point - good balance
 Precision.FLOAT32   // 32-bit floating point - highest precision
 ```
@@ -368,8 +393,8 @@ Precision.FLOAT32   // 32-bit floating point - highest precision
 | Precision | Use Case                                                                  |
 | --------- | ------------------------------------------------------------------------- |
 | `BINARY`  | Very large datasets where speed and storage are critical                  |
-| `INT8D`   | Recommended for most use cases - good balance of accuracy and performance |
-| `INT16D`  | Better accuracy than INT8D but less storage than FLOAT32                  |
+| `INT8`    | Recommended for most use cases - good balance of accuracy and performance |
+| `INT16`   | Better accuracy than INT8 but less storage than FLOAT32                   |
 | `FLOAT16` | Good compromise between precision and storage for embeddings              |
 | `FLOAT32` | Maximum precision when storage is not a concern                           |
 
@@ -435,7 +460,7 @@ public class EndeeExample {
         // Create a dense index
         CreateIndexOptions createOptions = CreateIndexOptions.builder("documents", 384)
             .spaceType(SpaceType.COSINE)
-            .precision(Precision.INT8D)
+            .precision(Precision.INT8)
             .build();
 
         client.createIndex(createOptions);
@@ -515,7 +540,7 @@ CreateIndexOptions.builder(String name, int dimension)
     .spaceType(SpaceType)        // Default: COSINE
     .m(int)                      // Default: 16
     .efCon(int)                  // Default: 128
-    .precision(Precision)        // Default: INT8D
+    .precision(Precision)        // Default: INT8
     .sparseDimension(Integer)    // Optional, for hybrid indexes
     .build()
 ```
@@ -525,12 +550,14 @@ CreateIndexOptions.builder(String name, int dimension)
 ```java
 QueryOptions.builder()
     .vector(double[])                        // Required for dense search
-    .topK(int)                               // Required
-    .ef(int)                                 // Default: 128
+    .topK(int)                               // Default: 10, max 512
+    .ef(int)                                 // Default: 128, max 1024
     .filter(List<Map<String, Object>>)       // Optional
     .includeVectors(boolean)                 // Default: false
     .sparseIndices(int[])                    // Optional, for hybrid search
     .sparseValues(double[])                  // Optional, for hybrid search
+    .prefilterCardinalityThreshold(int)      // Default: 10000, range 1000–1000000
+    .filterBoostPercentage(int)              // Default: 0, range 0–100
     .build()
 ```
 
diff --git a/src/main/java/io/endee/client/Endee.java b/src/main/java/io/endee/client/Endee.java
@@ -34,7 +34,7 @@
  * // Create an index
  * CreateIndexOptions options = CreateIndexOptions.builder("my_index", 128)
  *         .spaceType(SpaceType.COSINE)
- *         .precision(Precision.INT8D)
+ *         .precision(Precision.INT8)
  *         .build();
  * client.createIndex(options);
  *
diff --git a/src/main/java/io/endee/client/Index.java b/src/main/java/io/endee/client/Index.java
@@ -71,7 +71,7 @@ public Index(String name, String token, String url, int version, IndexInfo param
         this.count = params != null ? params.getTotalElements() : 0;
         this.spaceType = params != null && params.getSpaceType() != null ? params.getSpaceType() : SpaceType.COSINE;
         this.dimension = params != null ? params.getDimension() : 0;
-        this.precision = params != null && params.getPrecision() != null ? params.getPrecision() : Precision.INT8D;
+        this.precision = params != null && params.getPrecision() != null ? params.getPrecision() : Precision.INT8;
         this.m = params != null ? params.getM() : 16;
         this.sparseDimension = params != null && params.getSparseDimension() != null ? params.getSparseDimension() : 0;
 
diff --git a/src/main/java/io/endee/client/types/CreateIndexOptions.java b/src/main/java/io/endee/client/types/CreateIndexOptions.java
@@ -9,7 +9,7 @@ public class CreateIndexOptions {
     private SpaceType spaceType = SpaceType.COSINE;
     private int m = 16;
     private int efCon = 128;
-    private Precision precision = Precision.INT8D;
+    private Precision precision = Precision.INT8;
     private Integer version = null;
     private Integer sparseDimension = null;
 
diff --git a/src/main/java/io/endee/client/types/Precision.java b/src/main/java/io/endee/client/types/Precision.java
@@ -5,8 +5,8 @@
  */
 public enum Precision {
     BINARY("binary"),
-    INT8D("int8d"),
-    INT16D("int16d"),
+    INT8("int8"),
+    INT16("int16"),
     FLOAT32("float32"),
     FLOAT16("float16");
 

Original file line number	Diff line number	Diff line change
`@@ -34,7 +34,7 @@`
`34`	`34`	`* // Create an index`
`35`	`35`	`* CreateIndexOptions options = CreateIndexOptions.builder("my_index", 128)`
`36`	`36`	`* .spaceType(SpaceType.COSINE)`
`37`		`- * .precision(Precision.INT8D)`
	`37`	`+ * .precision(Precision.INT8)`
`38`	`38`	`* .build();`
`39`	`39`	`* client.createIndex(options);`
`40`	`40`	`*`