chore(ci): remove paru-bin submodule and config to fix checkout --recurse-submodules

This commit is contained in:
Andy Lee
2025-08-25 16:08:16 -07:00
parent 75c8aeee5f
commit ef4c69d128
4 changed files with 10 additions and 20 deletions

2
.gitmodules vendored
View File

@@ -14,3 +14,5 @@
[submodule "packages/leann-backend-hnsw/third_party/libzmq"]
path = packages/leann-backend-hnsw/third_party/libzmq
url = https://github.com/zeromq/libzmq.git
# Ensure CI can update the paru-bin submodule; it is used only for Arch packaging and is not required for builds.

View File

@@ -9,12 +9,12 @@ aws s3 sync s3://powerrag-diskann-rpj-wiki-20250824-224037-194d640c/diskann_rpj_
- Machine-specific; results measured locally with the current repo.
DiskANN (NQ queries, search-only)
- Command: `uv run benchmarks/bm25_diskann_baselines/run_diskann.py`
- Command: `uv run --script benchmarks/bm25_diskann_baselines/run_diskann.py`
- Settings: `recompute_embeddings=False`, embeddings precomputed (excluded from timing), batching off, caching off (`cache_mechanism=2`, `num_nodes_to_cache=0`)
- Result: avg 0.019339 s/query, QPS 51.71 (p50 ~0.018936 s, p95 ~0.023573 s)
BM25
- Command: `uv run --script ./benchmarks/run_bm25.py`
- Command: `uv run --script benchmarks/bm25_diskann_baselines/run_bm25.py`
- Settings: `k=10`, `k1=0.9`, `b=0.4`, queries=100
- Result: avg 0.026976 s/query, QPS 37.07 (p50 0.024729 s, p90 0.042158 s, p95 0.047099 s, p99 0.053520 s)

Before

Width:  |  Height:  |  Size: 1.2 KiB

After

Width:  |  Height:  |  Size: 1.2 KiB

View File

@@ -1,19 +1,8 @@
#!/usr/bin/env python3
"""
Run DiskANN with real NQ queries (search-only timing).
Steps:
- Load queries from nq_open.jsonl
- Compute embeddings (facebook/contriever-msmarco) once upfront
- Search via DiskANN (no recompute, no batching), measure per-query latency
Example:
python benchmarks/bm25_diskann_baselines/run_diskann.py \
--index-dir benchmarks/data/indices/diskann_rpj_wiki \
--index-prefix ann \
--queries-file benchmarks/data/queries/nq_open.jsonl \
--num-queries 200 --top-k 10 --complexity 120 --threads 1 --beam-width 1
"""
# /// script
# dependencies = [
# "leann-backend-diskann"
# ]
# ///
import argparse
import json
@@ -47,7 +36,7 @@ def main() -> None:
ap.add_argument("--queries-file", default="benchmarks/data/queries/nq_open.jsonl")
ap.add_argument("--num-queries", type=int, default=200)
ap.add_argument("--top-k", type=int, default=10)
ap.add_argument("--complexity", type=int, default=120)
ap.add_argument("--complexity", type=int, default=62)
ap.add_argument("--threads", type=int, default=1)
ap.add_argument("--beam-width", type=int, default=1)
ap.add_argument("--cache-mechanism", type=int, default=2)

Submodule paru-bin deleted from 92a55429af