code formatting

trvon · trvon · commit acd42a680883 · 2026-01-24T00:00:35.000-05:00
diff --git a/benchmarks/filtered_search_benchmark.cpp b/benchmarks/filtered_search_benchmark.cpp
@@ -90,9 +90,8 @@ static void BM_HNSW_Search_Filter_Bitset(benchmark::State& state) {
 
     for (auto _ : state) {
         for (const auto& q : data.queries) {
-            auto results =
-                data.index.search_with_filter(std::span<const float>{q}, k, ef,
-                                              [&](size_t id) { return data.allowed[id] != 0; });
+            auto results = data.index.search_with_filter(
+                std::span<const float>{q}, k, ef, [&](size_t id) { return data.allowed[id] != 0; });
             benchmark::DoNotOptimize(results);
         }
     }
@@ -113,9 +112,10 @@ static void BM_HNSW_Search_Filter_Set(benchmark::State& state) {
 
     for (auto _ : state) {
         for (const auto& q : data.queries) {
-            auto results = data.index.search_with_filter(
-                std::span<const float>{q}, k, ef,
-                [&](size_t id) { return data.allowed_set.contains(id); });
+            auto results =
+                data.index.search_with_filter(std::span<const float>{q}, k, ef, [&](size_t id) {
+                    return data.allowed_set.contains(id);
+                });
             benchmark::DoNotOptimize(results);
         }
     }
diff --git a/benchmarks/hnsw_768d_m_comparison.cpp b/benchmarks/hnsw_768d_m_comparison.cpp
@@ -19,18 +19,21 @@ std::vector<float> gen_vec(size_t dim, std::mt19937& rng) {
     std::uniform_real_distribution<float> dist(-1.0f, 1.0f);
     std::vector<float> vec(dim);
     float norm = 0.0f;
-    for (auto& v : vec) { v = dist(rng); norm += v * v; }
+    for (auto& v : vec) {
+        v = dist(rng);
+        norm += v * v;
+    }
     norm = std::sqrt(norm);
-    for (auto& v : vec) { v /= norm; }
+    for (auto& v : vec) {
+        v /= norm;
+    }
     return vec;
 }
 
 // Compute ground truth top-k for a single query (brute force)
-std::unordered_set<size_t> compute_gt(
-    const std::vector<float>& query,
-    const std::vector<std::vector<float>>& corpus,
-    size_t k, const CosineMetric<float>& metric
-) {
+std::unordered_set<size_t> compute_gt(const std::vector<float>& query,
+                                      const std::vector<std::vector<float>>& corpus, size_t k,
+                                      const CosineMetric<float>& metric) {
     std::vector<std::pair<size_t, float>> dists;
     dists.reserve(corpus.size());
     for (size_t i = 0; i < corpus.size(); ++i) {
@@ -40,7 +43,8 @@ std::unordered_set<size_t> compute_gt(
     std::partial_sort(dists.begin(), dists.begin() + k, dists.end(),
                       [](auto& a, auto& b) { return a.second < b.second; });
     std::unordered_set<size_t> result;
-    for (size_t i = 0; i < k; ++i) result.insert(dists[i].first);
+    for (size_t i = 0; i < k; ++i)
+        result.insert(dists[i].first);
     return result;
 }
 
@@ -51,24 +55,29 @@ int main() {
 
     printf("=================================================================\n");
     printf("768d Recall Benchmark: M=24 vs M=32\n");
-    printf("Corpus: %zu, Dim: %zu, k: %zu, Queries: %zu, Threads: %zu\n",
-           corpus_size, dim, k, num_queries, num_threads);
+    printf("Corpus: %zu, Dim: %zu, k: %zu, Queries: %zu, Threads: %zu\n", corpus_size, dim, k,
+           num_queries, num_threads);
     printf("=================================================================\n\n");
     fflush(stdout);
 
     // Generate corpus
-    printf("Generating corpus...\n"); fflush(stdout);
+    printf("Generating corpus...\n");
+    fflush(stdout);
     std::vector<std::vector<float>> vecs;
     vecs.reserve(corpus_size);
-    for (size_t i = 0; i < corpus_size; ++i) vecs.push_back(gen_vec(dim, rng));
+    for (size_t i = 0; i < corpus_size; ++i)
+        vecs.push_back(gen_vec(dim, rng));
 
     // Generate queries
-    printf("Generating queries...\n"); fflush(stdout);
+    printf("Generating queries...\n");
+    fflush(stdout);
     std::vector<std::vector<float>> qvecs;
-    for (size_t i = 0; i < num_queries; ++i) qvecs.push_back(gen_vec(dim, rng));
+    for (size_t i = 0; i < num_queries; ++i)
+        qvecs.push_back(gen_vec(dim, rng));
 
     // Parallel ground truth computation
-    printf("Computing ground truth (parallel, %zu threads)...\n", num_threads); fflush(stdout);
+    printf("Computing ground truth (parallel, %zu threads)...\n", num_threads);
+    fflush(stdout);
     auto gt_start = std::chrono::high_resolution_clock::now();
 
     std::vector<std::unordered_set<size_t>> gt_sets(num_queries);
@@ -85,42 +94,49 @@ int main() {
     for (size_t t = 0; t < num_threads; ++t) {
         size_t start = t * chunk;
         size_t end = std::min(start + chunk, num_queries);
-        if (start < end) threads.emplace_back(worker, start, end);
+        if (start < end)
+            threads.emplace_back(worker, start, end);
     }
-    for (auto& t : threads) t.join();
+    for (auto& t : threads)
+        t.join();
 
     auto gt_end = std::chrono::high_resolution_clock::now();
-    printf("Ground truth: %.1fs\n\n",
-           std::chrono::duration<double>(gt_end - gt_start).count());
+    printf("Ground truth: %.1fs\n\n", std::chrono::duration<double>(gt_end - gt_start).count());
     fflush(stdout);
 
     printf("%-6s | %-10s | %-12s | %-12s\n", "M", "ef_search", "Recall@10", "Latency(us)");
     printf("-------|------------|--------------|-------------\n");
     fflush(stdout);
 
-    for (auto [M, M_max, M_max_0] : {std::tuple{24,48,96}, std::tuple{32,64,128}}) {
+    for (auto [M, M_max, M_max_0] : {std::tuple{24, 48, 96}, std::tuple{32, 64, 128}}) {
         // Build index
         HNSWIndex<float, CosineMetric<float>>::Config cfg;
-        cfg.M = M; cfg.M_max = M_max; cfg.M_max_0 = M_max_0; cfg.ef_construction = 200;
+        cfg.M = M;
+        cfg.M_max = M_max;
+        cfg.M_max_0 = M_max_0;
+        cfg.ef_construction = 200;
         HNSWIndex<float, CosineMetric<float>> idx(cfg);
 
         auto build_start = std::chrono::high_resolution_clock::now();
         for (size_t i = 0; i < corpus_size; ++i)
             idx.insert(i, std::span<const float>{vecs[i]});
         auto build_end = std::chrono::high_resolution_clock::now();
         double build_s = std::chrono::duration<double>(build_end - build_start).count();
-        printf("M=%d built in %.1fs\n", M, build_s); fflush(stdout);
+        printf("M=%d built in %.1fs\n", M, build_s);
+        fflush(stdout);
 
         for (size_t ef : {50UL, 100UL, 200UL}) {
             size_t hits = 0;
             auto start = std::chrono::high_resolution_clock::now();
             for (size_t q = 0; q < num_queries; ++q) {
                 auto results = idx.search(std::span<const float>{qvecs[q]}, k, ef);
                 for (const auto& [id, _] : results)
-                    if (gt_sets[q].count(id)) ++hits;
+                    if (gt_sets[q].count(id))
+                        ++hits;
             }
             auto end = std::chrono::high_resolution_clock::now();
-            double lat_us = std::chrono::duration<double, std::micro>(end - start).count() / num_queries;
+            double lat_us =
+                std::chrono::duration<double, std::micro>(end - start).count() / num_queries;
             double recall = 100.0 * hits / (num_queries * k);
             printf("%-6d | %-10zu | %10.1f%% | %10.1f\n", M, ef, recall, lat_us);
             fflush(stdout);
@@ -129,6 +145,7 @@ int main() {
         fflush(stdout);
     }
 
-    printf("\nConclusion: If M=32 recall > M=24 by >3%%, consider extending Config::for_corpus()\n");
+    printf(
+        "\nConclusion: If M=32 recall > M=24 by >3%%, consider extending Config::for_corpus()\n");
     return 0;
 }
diff --git a/benchmarks/hnsw_768d_quick.cpp b/benchmarks/hnsw_768d_quick.cpp
@@ -14,9 +14,14 @@ std::vector<float> gen_vec(size_t dim, std::mt19937& rng) {
     std::uniform_real_distribution<float> dist(-1.0f, 1.0f);
     std::vector<float> vec(dim);
     float norm = 0.0f;
-    for (auto& v : vec) { v = dist(rng); norm += v * v; }
+    for (auto& v : vec) {
+        v = dist(rng);
+        norm += v * v;
+    }
     norm = std::sqrt(norm);
-    for (auto& v : vec) { v /= norm; }
+    for (auto& v : vec) {
+        v /= norm;
+    }
     return vec;
 }
 
@@ -28,19 +33,24 @@ int main() {
 
     // Generate data once
     std::vector<std::vector<float>> vecs, qvecs;
-    for (size_t i = 0; i < corpus; ++i) vecs.push_back(gen_vec(dim, rng));
-    for (size_t i = 0; i < queries; ++i) qvecs.push_back(gen_vec(dim, rng));
+    for (size_t i = 0; i < corpus; ++i)
+        vecs.push_back(gen_vec(dim, rng));
+    for (size_t i = 0; i < queries; ++i)
+        qvecs.push_back(gen_vec(dim, rng));
 
-    for (auto [M, M_max, M_max_0] : {std::tuple{24,48,96}, std::tuple{32,64,128}}) {
+    for (auto [M, M_max, M_max_0] : {std::tuple{24, 48, 96}, std::tuple{32, 64, 128}}) {
         HNSWIndex<float, CosineMetric<float>>::Config cfg;
-        cfg.M = M; cfg.M_max = M_max; cfg.M_max_0 = M_max_0; cfg.ef_construction = 200;
+        cfg.M = M;
+        cfg.M_max = M_max;
+        cfg.M_max_0 = M_max_0;
+        cfg.ef_construction = 200;
         HNSWIndex<float, CosineMetric<float>> idx(cfg);
 
         auto t1 = std::chrono::high_resolution_clock::now();
         for (size_t i = 0; i < corpus; ++i)
             idx.insert(i, std::span<const float>{vecs[i]});
         auto t2 = std::chrono::high_resolution_clock::now();
-        double build_ms = std::chrono::duration<double, std::milli>(t2-t1).count();
+        double build_ms = std::chrono::duration<double, std::milli>(t2 - t1).count();
 
         printf("M=%d: build=%.0fms", M, build_ms);
 
@@ -49,7 +59,7 @@ int main() {
             for (size_t q = 0; q < queries; ++q)
                 idx.search(std::span<const float>{qvecs[q]}, k, ef);
             auto e = std::chrono::high_resolution_clock::now();
-            double lat_us = std::chrono::duration<double, std::micro>(e-s).count() / queries;
+            double lat_us = std::chrono::duration<double, std::micro>(e - s).count() / queries;
             printf(" | ef=%zu: %.0fus", ef, lat_us);
         }
         printf("\n");
diff --git a/benchmarks/hnsw_benchmark.cpp b/benchmarks/hnsw_benchmark.cpp
@@ -449,8 +449,7 @@ static void BM_HNSW_FP16_Drift(benchmark::State& state) {
                 if (it != f32_dist.end()) {
                     ++total_hits;
                     if (it->second > 0.0f) {
-                        ratio_sum += static_cast<double>(dist) /
-                                     static_cast<double>(it->second);
+                        ratio_sum += static_cast<double>(dist) / static_cast<double>(it->second);
                         ++ratio_count;
                     }
                 }
diff --git a/include/sqlite-vec-cpp/index/hnsw.hpp b/include/sqlite-vec-cpp/index/hnsw.hpp
@@ -56,7 +56,8 @@ template <concepts::VectorElement StorageT, typename MetricT> class HNSWIndex {
         size_t ef_construction = 200; ///< Exploration factor during construction (100-500)
         float ml_factor = 1.0f / std::log(2.0f); ///< Layer selection multiplier (1/ln(2))
         MetricT metric{};                        ///< Distance metric (operates on float spans)
-        bool clamp_negative_distances = true; ///< Clamp negative distances to 0 (safe for L2/cosine)
+        bool clamp_negative_distances =
+            true; ///< Clamp negative distances to 0 (safe for L2/cosine)
 
         /// Create config optimized for high recall on large corpora
         /// @param corpus_size Expected number of vectors
@@ -478,9 +479,8 @@ template <concepts::VectorElement StorageT, typename MetricT> class HNSWIndex {
 
                 {
                     std::unique_lock lock(nodes_mutex_);
-                    auto [it, inserted] =
-                        nodes_.emplace(ids_span[i],
-                                       NodeType(ids_span[i], vectors_span[i], layer, config_.M_max));
+                    auto [it, inserted] = nodes_.emplace(
+                        ids_span[i], NodeType(ids_span[i], vectors_span[i], layer, config_.M_max));
                     if (!inserted) {
                         return;
                     }
@@ -526,8 +526,8 @@ template <concepts::VectorElement StorageT, typename MetricT> class HNSWIndex {
                 }
 
                 for (size_t lc = layer;; --lc) {
-                    auto candidates = beam_search_layer_batch(vector_f32, current,
-                                                              config_.ef_construction, lc);
+                    auto candidates =
+                        beam_search_layer_batch(vector_f32, current, config_.ef_construction, lc);
 
                     size_t M = (lc == 0) ? config_.M_max_0 : config_.M;
                     size_t num_connections = std::min(M, candidates.size());
@@ -824,8 +824,8 @@ template <concepts::VectorElement StorageT, typename MetricT> class HNSWIndex {
             // Remove edges to deleted nodes at each layer
             for (size_t layer = 0; layer < node.edges.size(); ++layer) {
                 auto& layer_edges = node.edges[layer];
-                std::erase_if(
-                    layer_edges, [this](size_t neighbor) { return is_deleted_unlocked(neighbor); });
+                std::erase_if(layer_edges,
+                              [this](size_t neighbor) { return is_deleted_unlocked(neighbor); });
             }
         }
     }
@@ -904,9 +904,7 @@ template <concepts::VectorElement StorageT, typename MetricT> class HNSWIndex {
             return current;
         float current_dist = distance_query_node(query, *current_node);
 
-        auto passes_filter = [&](size_t id) {
-            return !is_deleted_unlocked(id);
-        };
+        auto passes_filter = [&](size_t id) { return !is_deleted_unlocked(id); };
         size_t best_active = passes_filter(current) ? current : static_cast<size_t>(-1);
         float best_active_dist =
             passes_filter(current) ? current_dist : std::numeric_limits<float>::max();
@@ -951,9 +949,9 @@ template <concepts::VectorElement StorageT, typename MetricT> class HNSWIndex {
         return (best_active != static_cast<size_t>(-1)) ? best_active : current;
     }
 
-    std::vector<std::pair<size_t, float>>
-    beam_search_layer_batch(std::span<const float> query, size_t entry_point, size_t ef,
-                            size_t layer) const {
+    std::vector<std::pair<size_t, float>> beam_search_layer_batch(std::span<const float> query,
+                                                                  size_t entry_point, size_t ef,
+                                                                  size_t layer) const {
         auto cmp = [](const auto& a, const auto& b) { return a.first < b.first; };
         std::priority_queue<std::pair<float, size_t>, std::vector<std::pair<float, size_t>>,
                             decltype(cmp)>
@@ -978,9 +976,7 @@ template <concepts::VectorElement StorageT, typename MetricT> class HNSWIndex {
         }
         visited.visit(entry_dense);
 
-        auto passes_filter = [&](size_t id) {
-            return !is_deleted_unlocked(id);
-        };
+        auto passes_filter = [&](size_t id) { return !is_deleted_unlocked(id); };
 
         const float kDistanceEpsilon =
             config_.clamp_negative_distances ? -1e-5f : std::numeric_limits<float>::lowest();
@@ -1054,17 +1050,16 @@ template <concepts::VectorElement StorageT, typename MetricT> class HNSWIndex {
                                       neighbor_dist < top_candidates.top().first;
 
                 if (should_explore) {
-                    float scored =
-                        config_.clamp_negative_distances ? std::max(0.0f, neighbor_dist)
-                                                        : neighbor_dist;
+                    float scored = config_.clamp_negative_distances ? std::max(0.0f, neighbor_dist)
+                                                                    : neighbor_dist;
                     candidates.emplace(scored, neighbor);
                 }
 
                 if (passes_filter(neighbor)) {
                     if (top_candidates.size() < ef || neighbor_dist < top_candidates.top().first) {
-                        float scored =
-                            config_.clamp_negative_distances ? std::max(0.0f, neighbor_dist)
-                                                            : neighbor_dist;
+                        float scored = config_.clamp_negative_distances
+                                           ? std::max(0.0f, neighbor_dist)
+                                           : neighbor_dist;
                         top_candidates.emplace(scored, neighbor);
                         if (top_candidates.size() > ef) {
                             top_candidates.pop();
@@ -1088,7 +1083,9 @@ template <concepts::VectorElement StorageT, typename MetricT> class HNSWIndex {
         return result;
     }
 
-    void prune_connections_batch(size_t node_id, size_t layer) { prune_connections(node_id, layer); }
+    void prune_connections_batch(size_t node_id, size_t layer) {
+        prune_connections(node_id, layer);
+    }
 
     /// Greedy search (read-only, called under shared lock)
     size_t greedy_search_layer_locked(std::span<const float> query, size_t entry_point,
diff --git a/include/sqlite-vec-cpp/index/hnsw_node.hpp b/include/sqlite-vec-cpp/index/hnsw_node.hpp
@@ -49,7 +49,7 @@ template <concepts::VectorElement T> struct HNSWNode {
         std::lock_guard<std::mutex> lock(edge_mutex_);
         if (layer >= edges.size())
             return {};
-        return edges[layer];  // Return copy to avoid data race after lock release
+        return edges[layer]; // Return copy to avoid data race after lock release
     }
 
     /// Add bidirectional edge at layer (thread-safe)
diff --git a/tests/test_distances.cpp b/tests/test_distances.cpp
@@ -2,12 +2,12 @@
 #include <cmath>
 #include <iostream>
 #include <vector>
-#include <sqlite-vec-cpp/sqlite_vec.hpp>
-#include <sqlite-vec-cpp/distances/l2.hpp>
 #include <sqlite-vec-cpp/distances/cosine.hpp>
 #include <sqlite-vec-cpp/distances/inner_product.hpp>
+#include <sqlite-vec-cpp/distances/l2.hpp>
 #include <sqlite-vec-cpp/simd/avx.hpp>
 #include <sqlite-vec-cpp/simd/neon.hpp>
+#include <sqlite-vec-cpp/sqlite_vec.hpp>
 
 using namespace sqlite_vec_cpp;
 using namespace sqlite_vec_cpp::distances;
@@ -218,8 +218,8 @@ void test_simd_consistency() {
         inner_product_distance_float(std::span<const float>(a), std::span<const float>(b));
 
 #ifdef SQLITE_VEC_ENABLE_AVX
-    float l2_avx = simd::l2_distance_float_avx(std::span<const float>(a),
-                                               std::span<const float>(b));
+    float l2_avx =
+        simd::l2_distance_float_avx(std::span<const float>(a), std::span<const float>(b));
     float cosine_avx =
         simd::cosine_distance_float_avx(std::span<const float>(a), std::span<const float>(b));
     float ip_avx =
@@ -230,8 +230,8 @@ void test_simd_consistency() {
 #endif
 
 #ifdef SQLITE_VEC_ENABLE_NEON
-    float l2_neon = simd::l2_distance_float_neon(std::span<const float>(a),
-                                                 std::span<const float>(b));
+    float l2_neon =
+        simd::l2_distance_float_neon(std::span<const float>(a), std::span<const float>(b));
     float cosine_neon =
         simd::cosine_distance_float_neon(std::span<const float>(a), std::span<const float>(b));
     float ip_neon =

Original file line number	Diff line number	Diff line change
`@@ -90,9 +90,8 @@ static void BM_HNSW_Search_Filter_Bitset(benchmark::State& state) {`
`90`	`90`
`91`	`91`	`for (auto _ : state) {`
`92`	`92`	`for (const auto& q : data.queries) {`
`93`		`- auto results =`
`94`		`- data.index.search_with_filter(std::span<const float>{q}, k, ef,`
`95`		`- [&](size_t id) { return data.allowed[id] != 0; });`
	`93`	`+ auto results = data.index.search_with_filter(`
	`94`	`+ std::span<const float>{q}, k, ef, [&](size_t id) { return data.allowed[id] != 0; });`
`96`	`95`	`benchmark::DoNotOptimize(results);`
`97`	`96`	`}`
`98`	`97`	`}`
`@@ -113,9 +112,10 @@ static void BM_HNSW_Search_Filter_Set(benchmark::State& state) {`
`113`	`112`
`114`	`113`	`for (auto _ : state) {`
`115`	`114`	`for (const auto& q : data.queries) {`
`116`		`- auto results = data.index.search_with_filter(`
`117`		`- std::span<const float>{q}, k, ef,`
`118`		`- [&](size_t id) { return data.allowed_set.contains(id); });`
	`115`	`+ auto results =`
	`116`	`+ data.index.search_with_filter(std::span<const float>{q}, k, ef, [&](size_t id) {`
	`117`	`+ return data.allowed_set.contains(id);`
	`118`	`+ });`
`119`	`119`	`benchmark::DoNotOptimize(results);`
`120`	`120`	`}`
`121`	`121`	`}`
Original file line number	Diff line number	Diff line change
`@@ -449,8 +449,7 @@ static void BM_HNSW_FP16_Drift(benchmark::State& state) {`
`449`	`449`	`if (it != f32_dist.end()) {`
`450`	`450`	`++total_hits;`
`451`	`451`	`if (it->second > 0.0f) {`
`452`		`- ratio_sum += static_cast<double>(dist) /`
`453`		`- static_cast<double>(it->second);`
	`452`	`+ ratio_sum += static_cast<double>(dist) / static_cast<double>(it->second);`
`454`	`453`	`++ratio_count;`
`455`	`454`	`}`
`456`	`455`	`}`
Original file line number	Diff line number	Diff line change
`@@ -49,7 +49,7 @@ template <concepts::VectorElement T> struct HNSWNode {`
`49`	`49`	`std::lock_guard<std::mutex> lock(edge_mutex_);`
`50`	`50`	`if (layer >= edges.size())`
`51`	`51`	`return {};`
`52`		`- return edges[layer];  // Return copy to avoid data race after lock release`
	`52`	`+ return edges[layer]; // Return copy to avoid data race after lock release`
`53`	`53`	`}`
`54`	`54`
`55`	`55`	`/// Add bidirectional edge at layer (thread-safe)`