Compare commits

..

7 Commits

Author SHA1 Message Date
Andy Lee
3dc130760a fix: restore macOS 15 build matrix and correct test path
- Add back macOS 15 configurations for Python 3.9-3.13
- Fix pytest path from test/ to tests/ (correct directory name)

macOS 15 support had accidentally been dropped from the matrix, and
pytest was pointing at the wrong directory name.
2025-08-12 12:50:33 -07:00
Andy Lee
2761067b7b fix: correct macOS deployment targets based on Homebrew library requirements
The key insight is that Homebrew libraries on each macOS version are
compiled for that specific version:
- macOS 13: Libraries require macOS 13.0 minimum
- macOS 14: Libraries require macOS 14.0 minimum
- macOS 15: Libraries require macOS 15.0 minimum

We cannot build wheels that target macOS versions older than those
required by the bundled Homebrew libraries. This means:
- macOS 13 runners: Build for macOS 13.0+ (HNSW) and 13.3+ (DiskANN)
- macOS 14 runners: Build for macOS 14.0+
- macOS 15 runners: Build for macOS 15.0+

This ensures delocate-wheel succeeds by matching deployment targets
with the actual minimum versions required by system libraries.
2025-08-12 12:34:56 -07:00
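A quick way to confirm the constraint this commit describes is to read the load commands of the Homebrew dylib a wheel will bundle; a minimal sketch (the libomp path is illustrative — check whichever libraries your backend actually links):

```bash
# LC_BUILD_VERSION's "minos" field is the library's minimum macOS version;
# on a macos-14 runner Homebrew's libomp typically reports 14.0.
# (Older toolchains emit LC_VERSION_MIN_MACOSX instead.)
otool -l "$(brew --prefix libomp)/lib/libomp.dylib" | grep -A4 LC_BUILD_VERSION
```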
Andy Lee
5f57f4763b fix: add macOS 15 support to deployment target configuration
The issue extends to macOS 15 runners where Homebrew libraries are built
for macOS 15. We must handle all runner versions explicitly:

- macOS 13 runners: Can build for macOS 11.0 (HNSW) and 13.3 (DiskANN)
- macOS 14 runners: Must build for macOS 14.0 (system libraries)
- macOS 15 runners: Must build for macOS 15.0 (system libraries)

This ensures wheels are properly tagged for their actual minimum
supported macOS version, matching the bundled libraries.
2025-08-12 11:48:06 -07:00
Andy Lee
9e01e69038 fix: match deployment target with runner OS for library compatibility
The issue is that Homebrew libraries on macOS 14 runners are built for
macOS 14 and cannot be downgraded. We must use different deployment
targets based on the runner OS:

- macOS 13 runners: Can build for macOS 11.0 (HNSW) and 13.3 (DiskANN)
- macOS 14 runners: Must build for macOS 14.0 (due to system libraries)

This ensures delocate-wheel succeeds by matching the deployment target
with the actual minimum version required by bundled libraries.
2025-08-12 11:30:23 -07:00
Andy Lee
d336f3dbf6 fix: use macOS 13.3 for DiskANN backend as required by LAPACK
DiskANN requires macOS 13.3+ for the sgesdd_ LAPACK function, so we must
use 13.3 as the deployment target, not 13.0.
2025-08-12 10:59:48 -07:00
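To see the symbol dependency this commit refers to, you can list the unresolved symbols of the built extension; a sketch, with a hypothetical module path (adjust to the actual .so the build produces):

```bash
# sgesdd_ (LAPACK divide-and-conquer SVD) should show up as an undefined
# symbol, resolved by Accelerate at load time — which, per this commit,
# needs macOS 13.3+.
nm -u packages/leann-backend-diskann/build/_diskannpy.so | grep -i sgesdd
```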
Andy Lee
acf3034171 fix: ensure wheels are compatible with older macOS versions
- Set MACOSX_DEPLOYMENT_TARGET=11.0 for HNSW backend (broad compatibility)
- Set MACOSX_DEPLOYMENT_TARGET=13.0 for DiskANN backend (required for LAPACK)
- Add --require-target-macos-version to delocate-wheel commands
- This fixes CI failures on macos-13 runners while maintaining M4 Mac support

Fixes the issue where wheels built on macos-14 runners were incorrectly
tagged as macosx_14_0, preventing installation on macos-13 runners.
2025-08-12 10:58:35 -07:00
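The mis-tagging failure mode described here is easy to reproduce locally: pip skips any wheel whose macosx platform tag exceeds the host version. A sketch of the check (wheel filename hypothetical):

```bash
# On a macos-13 host this prints only macosx_13_* and older tags, so a
# leann_backend_hnsw-...-macosx_14_0_arm64.whl would be rejected as
# "not a supported wheel on this platform".
pip debug --verbose | grep macosx
```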
Andy Lee
04623b6be0 feat: add macOS 15 support for M4 Mac compatibility
- Add macos-15 CI builds for Python 3.9-3.13
- Update MACOSX_DEPLOYMENT_TARGET from 11.0/13.3 to 14.0 for broader compatibility
- Addresses issue #34 with Mac M4 wheel compatibility

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>
2025-08-12 00:06:19 -07:00
6 changed files with 267 additions and 409 deletions

View File

@@ -64,6 +64,16 @@ jobs:
           python: '3.12'
         - os: macos-14
           python: '3.13'
+        - os: macos-15
+          python: '3.9'
+        - os: macos-15
+          python: '3.10'
+        - os: macos-15
+          python: '3.11'
+        - os: macos-15
+          python: '3.12'
+        - os: macos-15
+          python: '3.13'
         - os: macos-13
           python: '3.9'
         - os: macos-13
@@ -147,7 +157,14 @@ jobs:
           # Use system clang for better compatibility
           export CC=clang
           export CXX=clang++
-          export MACOSX_DEPLOYMENT_TARGET=11.0
+          # Homebrew libraries on each macOS version require matching minimum version
+          if [[ "${{ matrix.os }}" == "macos-13" ]]; then
+            export MACOSX_DEPLOYMENT_TARGET=13.0
+          elif [[ "${{ matrix.os }}" == "macos-14" ]]; then
+            export MACOSX_DEPLOYMENT_TARGET=14.0
+          elif [[ "${{ matrix.os }}" == "macos-15" ]]; then
+            export MACOSX_DEPLOYMENT_TARGET=15.0
+          fi
           uv build --wheel --python ${{ matrix.python }} --find-links ${GITHUB_WORKSPACE}/packages/leann-core/dist
         else
           uv build --wheel --python ${{ matrix.python }} --find-links ${GITHUB_WORKSPACE}/packages/leann-core/dist
@@ -161,7 +178,14 @@ jobs:
           export CC=clang
           export CXX=clang++
           # DiskANN requires macOS 13.3+ for sgesdd_ LAPACK function
-          export MACOSX_DEPLOYMENT_TARGET=13.3
+          # But Homebrew libraries on each macOS version require matching minimum version
+          if [[ "${{ matrix.os }}" == "macos-13" ]]; then
+            export MACOSX_DEPLOYMENT_TARGET=13.3
+          elif [[ "${{ matrix.os }}" == "macos-14" ]]; then
+            export MACOSX_DEPLOYMENT_TARGET=14.0
+          elif [[ "${{ matrix.os }}" == "macos-15" ]]; then
+            export MACOSX_DEPLOYMENT_TARGET=15.0
+          fi
           uv build --wheel --python ${{ matrix.python }} --find-links ${GITHUB_WORKSPACE}/packages/leann-core/dist
         else
           uv build --wheel --python ${{ matrix.python }} --find-links ${GITHUB_WORKSPACE}/packages/leann-core/dist
@@ -197,10 +221,24 @@ jobs:
     - name: Repair wheels (macOS)
       if: runner.os == 'macOS'
       run: |
+        # Determine deployment target based on runner OS
+        # Must match the Homebrew libraries for each macOS version
+        if [[ "${{ matrix.os }}" == "macos-13" ]]; then
+          HNSW_TARGET="13.0"
+          DISKANN_TARGET="13.3"
+        elif [[ "${{ matrix.os }}" == "macos-14" ]]; then
+          HNSW_TARGET="14.0"
+          DISKANN_TARGET="14.0"
+        elif [[ "${{ matrix.os }}" == "macos-15" ]]; then
+          HNSW_TARGET="15.0"
+          DISKANN_TARGET="15.0"
+        fi
         # Repair HNSW wheel
         cd packages/leann-backend-hnsw
         if [ -d dist ]; then
-          delocate-wheel -w dist_repaired -v dist/*.whl
+          export MACOSX_DEPLOYMENT_TARGET=$HNSW_TARGET
+          delocate-wheel -w dist_repaired -v --require-target-macos-version $HNSW_TARGET dist/*.whl
           rm -rf dist
           mv dist_repaired dist
         fi
@@ -209,7 +247,8 @@ jobs:
         # Repair DiskANN wheel
         cd packages/leann-backend-diskann
         if [ -d dist ]; then
-          delocate-wheel -w dist_repaired -v dist/*.whl
+          export MACOSX_DEPLOYMENT_TARGET=$DISKANN_TARGET
+          delocate-wheel -w dist_repaired -v --require-target-macos-version $DISKANN_TARGET dist/*.whl
           rm -rf dist
           mv dist_repaired dist
         fi
@@ -249,8 +288,8 @@ jobs:
         # Activate virtual environment
         source .venv/bin/activate || source .venv/Scripts/activate
-        # Run all tests
-        pytest tests/
+        # Run tests
+        pytest -v tests/
     - name: Run sanity checks (optional)
       run: |
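After a repair step like the one above, it is worth sanity-checking that the vendored libraries and the wheel tag agree; a hedged sketch (wheel and dylib paths illustrative):

```bash
# Show which dylibs delocate copied into the wheel
delocate-listdeps dist/*.whl

# Unpack the wheel and inspect a vendored dylib's declared minimum version
unzip -o dist/*.whl -d /tmp/wheel_check
otool -l /tmp/wheel_check/*/.dylibs/*.dylib | grep -B1 -A4 LC_BUILD_VERSION
```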

View File

@@ -468,7 +468,7 @@ leann --help
 ### Usage Examples

 ```bash
-# build from a specific directory, and my_docs is the index name(Here you can also build from multiple dict or multiple files)
+# build from a specific directory, and my_docs is the index name
 leann build my-docs --docs ./your_documents

 # Search your documents

View File

@@ -13,7 +13,7 @@ if(APPLE)
   else()
     message(FATAL_ERROR "Could not find libomp installation. Please install with: brew install libomp")
   endif()
   set(OpenMP_C_FLAGS "-Xpreprocessor -fopenmp -I${HOMEBREW_PREFIX}/opt/libomp/include")
   set(OpenMP_CXX_FLAGS "-Xpreprocessor -fopenmp -I${HOMEBREW_PREFIX}/opt/libomp/include")
   set(OpenMP_C_LIB_NAMES "omp")
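The same flags work outside CMake; compiling a standalone OpenMP program against Homebrew's libomp with Apple clang looks like this (a minimal sketch, assuming `brew install libomp` and a hypothetical `omp_demo.c`):

```bash
clang -Xpreprocessor -fopenmp \
  -I"$(brew --prefix libomp)/include" \
  -L"$(brew --prefix libomp)/lib" -lomp \
  omp_demo.c -o omp_demo
```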

View File

@@ -5,7 +5,6 @@ from typing import Union

 from llama_index.core import SimpleDirectoryReader
 from llama_index.core.node_parser import SentenceSplitter
-from tqdm import tqdm

 from .api import LeannBuilder, LeannChat, LeannSearcher
@@ -76,14 +75,11 @@
             formatter_class=argparse.RawDescriptionHelpFormatter,
             epilog="""
 Examples:
-  leann build my-docs --docs ./documents          # Build index from directory
-  leann build my-code --docs ./src ./tests ./config  # Build index from multiple directories
-  leann build my-files --docs ./file1.py ./file2.txt ./docs/  # Build index from files and directories
-  leann build my-mixed --docs ./readme.md ./src/ ./config.json  # Build index from mixed files/dirs
-  leann build my-ppts --docs ./ --file-types .pptx,.pdf  # Index only PowerPoint and PDF files
-  leann search my-docs "query"                    # Search in my-docs index
-  leann ask my-docs "question"                    # Ask my-docs index
-  leann list                                      # List all stored indexes
+  leann build my-docs --docs ./documents          # Build index named my-docs
+  leann build my-ppts --docs ./ --file-types .pptx,.pdf  # Index only PowerPoint and PDF files
+  leann search my-docs "query"                    # Search in my-docs index
+  leann ask my-docs "question"                    # Ask my-docs index
+  leann list                                      # List all stored indexes
 """,
         )
@@ -95,11 +91,7 @@ Examples:
             "index_name", nargs="?", help="Index name (default: current directory name)"
         )
         build_parser.add_argument(
-            "--docs",
-            type=str,
-            nargs="+",
-            default=["."],
-            help="Documents directories and/or files (default: current directory)",
+            "--docs", type=str, default=".", help="Documents directory (default: current directory)"
         )
         build_parser.add_argument(
             "--backend", type=str, default="hnsw", choices=["hnsw", "diskann"]
@@ -243,32 +235,6 @@ Examples:
         """Check if a file should be excluded using gitignore parser."""
         return gitignore_matches(str(relative_path))

-    def _is_git_submodule(self, path: Path) -> bool:
-        """Check if a path is a git submodule."""
-        try:
-            # Find the git repo root
-            current_dir = Path.cwd()
-            while current_dir != current_dir.parent:
-                if (current_dir / ".git").exists():
-                    gitmodules_path = current_dir / ".gitmodules"
-                    if gitmodules_path.exists():
-                        # Read .gitmodules to check if this path is a submodule
-                        gitmodules_content = gitmodules_path.read_text()
-                        # Convert path to relative to git root
-                        try:
-                            relative_path = path.resolve().relative_to(current_dir)
-                            # Check if this path appears in .gitmodules
-                            return f"path = {relative_path}" in gitmodules_content
-                        except ValueError:
-                            # Path is not under git root
-                            return False
-                    break
-                current_dir = current_dir.parent
-            return False
-        except Exception:
-            # If anything goes wrong, assume it's not a submodule
-            return False
-
     def list_indexes(self):
         print("Stored LEANN indexes:")
@@ -298,9 +264,7 @@ Examples:
                 valid_projects.append(current_path)

         if not valid_projects:
-            print(
-                "No indexes found. Use 'leann build <name> --docs <dir> [<dir2> ...]' to create one."
-            )
+            print("No indexes found. Use 'leann build <name> --docs <dir>' to create one.")
             return

         total_indexes = 0
@@ -347,88 +311,56 @@ Examples:
         print(f'  leann search {example_name} "your query"')
         print(f"  leann ask {example_name} --interactive")

-    def load_documents(
-        self, docs_paths: Union[str, list], custom_file_types: Union[str, None] = None
-    ):
-        # Handle both single path (string) and multiple paths (list) for backward compatibility
-        if isinstance(docs_paths, str):
-            docs_paths = [docs_paths]
-
-        # Separate files and directories
-        files = []
-        directories = []
-        for path in docs_paths:
-            path_obj = Path(path)
-            if path_obj.is_file():
-                files.append(str(path_obj))
-            elif path_obj.is_dir():
-                # Check if this is a git submodule - if so, skip it
-                if self._is_git_submodule(path_obj):
-                    print(f"⚠️ Skipping git submodule: {path}")
-                    continue
-                directories.append(str(path_obj))
-            else:
-                print(f"⚠️ Warning: Path '{path}' does not exist, skipping...")
-                continue
-
-        # Print summary of what we're processing
-        total_items = len(files) + len(directories)
-        items_desc = []
-        if files:
-            items_desc.append(f"{len(files)} file{'s' if len(files) > 1 else ''}")
-        if directories:
-            items_desc.append(
-                f"{len(directories)} director{'ies' if len(directories) > 1 else 'y'}"
-            )
-        print(f"Loading documents from {' and '.join(items_desc)} ({total_items} total):")
-        if files:
-            print(f"  📄 Files: {', '.join([Path(f).name for f in files])}")
-        if directories:
-            print(f"  📁 Directories: {', '.join(directories)}")
+    def load_documents(self, docs_dir: str, custom_file_types: Union[str, None] = None):
+        print(f"Loading documents from {docs_dir}...")

         if custom_file_types:
             print(f"Using custom file types: {custom_file_types}")

-        all_documents = []
-
-        # First, process individual files if any
-        if files:
-            print(f"\n🔄 Processing {len(files)} individual file{'s' if len(files) > 1 else ''}...")
-            # Load individual files using SimpleDirectoryReader with input_files
-            # Note: We skip gitignore filtering for explicitly specified files
-            try:
-                # Group files by their parent directory for efficient loading
-                from collections import defaultdict
-
-                files_by_dir = defaultdict(list)
-                for file_path in files:
-                    parent_dir = str(Path(file_path).parent)
-                    files_by_dir[parent_dir].append(file_path)
-
-                # Load files from each parent directory
-                for parent_dir, file_list in files_by_dir.items():
-                    print(
-                        f"  Loading {len(file_list)} file{'s' if len(file_list) > 1 else ''} from {parent_dir}"
-                    )
-                    try:
-                        file_docs = SimpleDirectoryReader(
-                            parent_dir,
-                            input_files=file_list,
-                            filename_as_id=True,
-                        ).load_data()
-                        all_documents.extend(file_docs)
-                        print(
-                            f"  ✅ Loaded {len(file_docs)} document{'s' if len(file_docs) > 1 else ''}"
-                        )
-                    except Exception as e:
-                        print(f"Warning: Could not load files from {parent_dir}: {e}")
-            except Exception as e:
-                print(f"❌ Error processing individual files: {e}")
-
-        # Define file extensions to process
+        # Build gitignore parser
+        gitignore_matches = self._build_gitignore_parser(docs_dir)
+
+        # Try to use better PDF parsers first, but only if PDFs are requested
+        documents = []
+        docs_path = Path(docs_dir)
+
+        # Check if we should process PDFs
+        should_process_pdfs = custom_file_types is None or ".pdf" in custom_file_types
+
+        if should_process_pdfs:
+            for file_path in docs_path.rglob("*.pdf"):
+                # Check if file matches any exclude pattern
+                relative_path = file_path.relative_to(docs_path)
+                if self._should_exclude_file(relative_path, gitignore_matches):
+                    continue
+
+                print(f"Processing PDF: {file_path}")
+
+                # Try PyMuPDF first (best quality)
+                text = extract_pdf_text_with_pymupdf(str(file_path))
+                if text is None:
+                    # Try pdfplumber
+                    text = extract_pdf_text_with_pdfplumber(str(file_path))
+
+                if text:
+                    # Create a simple document structure
+                    from llama_index.core import Document
+
+                    doc = Document(text=text, metadata={"source": str(file_path)})
+                    documents.append(doc)
+                else:
+                    # Fallback to default reader
+                    print(f"Using default reader for {file_path}")
+                    try:
+                        default_docs = SimpleDirectoryReader(
+                            str(file_path.parent),
+                            filename_as_id=True,
+                            required_exts=[file_path.suffix],
+                        ).load_data()
+                        documents.extend(default_docs)
+                    except Exception as e:
+                        print(f"Warning: Could not process {file_path}: {e}")
+
+        # Load other file types with default reader
         if custom_file_types:
             # Parse custom file types from comma-separated string
             code_extensions = [ext.strip() for ext in custom_file_types.split(",") if ext.strip()]
@@ -490,106 +422,41 @@ Examples:
                 ".py",
                 ".jl",
             ]

-        # Process each directory
-        if directories:
-            print(
-                f"\n🔄 Processing {len(directories)} director{'ies' if len(directories) > 1 else 'y'}..."
-            )
-
-            for docs_dir in directories:
-                print(f"Processing directory: {docs_dir}")
-                # Build gitignore parser for each directory
-                gitignore_matches = self._build_gitignore_parser(docs_dir)
-
-                # Try to use better PDF parsers first, but only if PDFs are requested
-                documents = []
-                docs_path = Path(docs_dir)
-
-                # Check if we should process PDFs
-                should_process_pdfs = custom_file_types is None or ".pdf" in custom_file_types
-
-                if should_process_pdfs:
-                    for file_path in docs_path.rglob("*.pdf"):
-                        # Check if file matches any exclude pattern
-                        try:
-                            relative_path = file_path.relative_to(docs_path)
-                            if self._should_exclude_file(relative_path, gitignore_matches):
-                                continue
-                        except ValueError:
-                            # Skip files that can't be made relative to docs_path
-                            print(f"⚠️ Skipping file outside directory scope: {file_path}")
-                            continue
-
-                        print(f"Processing PDF: {file_path}")
-
-                        # Try PyMuPDF first (best quality)
-                        text = extract_pdf_text_with_pymupdf(str(file_path))
-                        if text is None:
-                            # Try pdfplumber
-                            text = extract_pdf_text_with_pdfplumber(str(file_path))
-
-                        if text:
-                            # Create a simple document structure
-                            from llama_index.core import Document
-
-                            doc = Document(text=text, metadata={"source": str(file_path)})
-                            documents.append(doc)
-                        else:
-                            # Fallback to default reader
-                            print(f"Using default reader for {file_path}")
-                            try:
-                                default_docs = SimpleDirectoryReader(
-                                    str(file_path.parent),
-                                    filename_as_id=True,
-                                    required_exts=[file_path.suffix],
-                                ).load_data()
-                                documents.extend(default_docs)
-                            except Exception as e:
-                                print(f"Warning: Could not process {file_path}: {e}")
-
-                # Load other file types with default reader
-                try:
-                    # Create a custom file filter function using our PathSpec
-                    def file_filter(
-                        file_path: str, docs_dir=docs_dir, gitignore_matches=gitignore_matches
-                    ) -> bool:
-                        """Return True if file should be included (not excluded)"""
-                        try:
-                            docs_path_obj = Path(docs_dir)
-                            file_path_obj = Path(file_path)
-                            relative_path = file_path_obj.relative_to(docs_path_obj)
-                            return not self._should_exclude_file(relative_path, gitignore_matches)
-                        except (ValueError, OSError):
-                            return True  # Include files that can't be processed
-
-                    other_docs = SimpleDirectoryReader(
-                        docs_dir,
-                        recursive=True,
-                        encoding="utf-8",
-                        required_exts=code_extensions,
-                        file_extractor={},  # Use default extractors
-                        filename_as_id=True,
-                    ).load_data(show_progress=True)
-
-                    # Filter documents after loading based on gitignore rules
-                    filtered_docs = []
-                    for doc in other_docs:
-                        file_path = doc.metadata.get("file_path", "")
-                        if file_filter(file_path):
-                            filtered_docs.append(doc)
-                    documents.extend(filtered_docs)
-                except ValueError as e:
-                    if "No files found" in str(e):
-                        print(f"No additional files found for other supported types in {docs_dir}.")
-                    else:
-                        raise e
-
-                all_documents.extend(documents)
-                print(f"Loaded {len(documents)} documents from {docs_dir}")
-
-        documents = all_documents
+        # Try to load other file types, but don't fail if none are found
+        try:
+            # Create a custom file filter function using our PathSpec
+            def file_filter(file_path: str) -> bool:
+                """Return True if file should be included (not excluded)"""
+                try:
+                    docs_path_obj = Path(docs_dir)
+                    file_path_obj = Path(file_path)
+                    relative_path = file_path_obj.relative_to(docs_path_obj)
+                    return not self._should_exclude_file(relative_path, gitignore_matches)
+                except (ValueError, OSError):
+                    return True  # Include files that can't be processed
+
+            other_docs = SimpleDirectoryReader(
+                docs_dir,
+                recursive=True,
+                encoding="utf-8",
+                required_exts=code_extensions,
+                file_extractor={},  # Use default extractors
+                filename_as_id=True,
+            ).load_data(show_progress=True)
+
+            # Filter documents after loading based on gitignore rules
+            filtered_docs = []
+            for doc in other_docs:
+                file_path = doc.metadata.get("file_path", "")
+                if file_filter(file_path):
+                    filtered_docs.append(doc)
+            documents.extend(filtered_docs)
+        except ValueError as e:
+            if "No files found" in str(e):
+                print("No additional files found for other supported types.")
+            else:
+                raise e

         all_texts = []
@@ -640,9 +507,7 @@ Examples:
             ".jl",
         }

-        print("start chunking documents")
-        # Add progress bar for document chunking
-        for doc in tqdm(documents, desc="Chunking documents", unit="doc"):
+        for doc in documents:
             # Check if this is a code file based on source path
             source_path = doc.metadata.get("source", "")
             is_code_file = any(source_path.endswith(ext) for ext in code_file_exts)
@@ -658,7 +523,7 @@ Examples:
         return all_texts

     async def build_index(self, args):
-        docs_paths = args.docs
+        docs_dir = args.docs

         # Use current directory name if index_name not provided
         if args.index_name:
             index_name = args.index_name
@@ -669,25 +534,13 @@ Examples:
         index_dir = self.indexes_dir / index_name
         index_path = self.get_index_path(index_name)

-        # Display all paths being indexed with file/directory distinction
-        files = [p for p in docs_paths if Path(p).is_file()]
-        directories = [p for p in docs_paths if Path(p).is_dir()]
-
-        print(f"📂 Indexing {len(docs_paths)} path{'s' if len(docs_paths) > 1 else ''}:")
-        if files:
-            print(f"  📄 Files ({len(files)}):")
-            for i, file_path in enumerate(files, 1):
-                print(f"    {i}. {Path(file_path).resolve()}")
-        if directories:
-            print(f"  📁 Directories ({len(directories)}):")
-            for i, dir_path in enumerate(directories, 1):
-                print(f"    {i}. {Path(dir_path).resolve()}")
+        print(f"📂 Indexing: {Path(docs_dir).resolve()}")

         if index_dir.exists() and not args.force:
             print(f"Index '{index_name}' already exists. Use --force to rebuild.")
             return

-        all_texts = self.load_documents(docs_paths, args.file_types)
+        all_texts = self.load_documents(docs_dir, args.file_types)
         if not all_texts:
             print("No documents found")
             return
@@ -723,7 +576,7 @@ Examples:
         if not self.index_exists(index_name):
             print(
-                f"Index '{index_name}' not found. Use 'leann build {index_name} --docs <dir> [<dir2> ...]' to create it."
+                f"Index '{index_name}' not found. Use 'leann build {index_name} --docs <dir>' to create it."
             )
             return
@@ -750,7 +603,7 @@ Examples:
         if not self.index_exists(index_name):
             print(
-                f"Index '{index_name}' not found. Use 'leann build {index_name} --docs <dir> [<dir2> ...]' to create it."
+                f"Index '{index_name}' not found. Use 'leann build {index_name} --docs <dir>' to create it."
            )
            return
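The gitignore filtering that `_build_gitignore_parser` and `file_filter` implement can be approximated from the shell, which is handy for predicting what the CLI will index; a sketch (assumes the docs directory lives inside a git repository):

```bash
# Print the files under ./docs that .gitignore rules would keep;
# `git check-ignore -q` exits 0 exactly when a path is ignored.
find docs -type f | while read -r f; do
  git check-ignore -q "$f" || echo "$f"
done
```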

View File

@@ -6,6 +6,7 @@ Preserves all optimization parameters to ensure performance

 import logging
 import os
+from concurrent.futures import ThreadPoolExecutor, as_completed
 from typing import Any

 import numpy as np
@@ -373,9 +374,7 @@
     texts: list[str], model_name: str, is_build: bool = False, host: str = "http://localhost:11434"
 ) -> np.ndarray:
     """
-    Compute embeddings using Ollama API with simplified batch processing.
-
-    Uses batch size of 32 for MPS/CPU and 128 for CUDA to optimize performance.
+    Compute embeddings using Ollama API.

     Args:
         texts: List of texts to compute embeddings for
@@ -439,19 +438,12 @@
             if any(emb in base_name for emb in ["embed", "bge", "minilm", "e5"]):
                 embedding_models.append(model)

-        # Check if model exists (handle versioned names) and resolve to full name
-        resolved_model_name = None
-        for name in model_names:
-            # Exact match
-            if model_name == name:
-                resolved_model_name = name
-                break
-            # Match without version tag (use the versioned name)
-            elif model_name == name.split(":")[0]:
-                resolved_model_name = name
-                break
-
-        if not resolved_model_name:
+        # Check if model exists (handle versioned names)
+        model_found = any(
+            model_name == name.split(":")[0] or model_name == name for name in model_names
+        )
+
+        if not model_found:
             error_msg = f"❌ Model '{model_name}' not found in local Ollama.\n\n"

             # Suggest pulling the model
@@ -473,11 +465,6 @@
             error_msg += "\n📚 Browse more: https://ollama.com/library"
             raise ValueError(error_msg)

-        # Use the resolved model name for all subsequent operations
-        if resolved_model_name != model_name:
-            logger.info(f"Resolved model name '{model_name}' to '{resolved_model_name}'")
-            model_name = resolved_model_name
-
         # Verify the model supports embeddings by testing it
         try:
             test_response = requests.post(
@@ -498,147 +485,162 @@
         except requests.exceptions.RequestException as e:
             logger.warning(f"Could not verify model existence: {e}")

-    # Determine batch size based on device availability
-    # Check for CUDA/MPS availability using torch if available
-    batch_size = 32  # Default for MPS/CPU
-    try:
-        import torch
-
-        if torch.cuda.is_available():
-            batch_size = 128  # CUDA gets larger batch size
-        elif hasattr(torch.backends, "mps") and torch.backends.mps.is_available():
-            batch_size = 32  # MPS gets smaller batch size
-    except ImportError:
-        # If torch is not available, use conservative batch size
-        batch_size = 32
-
-    logger.info(f"Using batch size: {batch_size}")
-
-    def get_batch_embeddings(batch_texts):
-        """Get embeddings for a batch of texts."""
-        all_embeddings = []
-        failed_indices = []
-
-        for i, text in enumerate(batch_texts):
-            max_retries = 3
-            retry_count = 0
-
-            # Truncate very long texts to avoid API issues
-            truncated_text = text[:8000] if len(text) > 8000 else text
-
-            while retry_count < max_retries:
-                try:
-                    response = requests.post(
-                        f"{host}/api/embeddings",
-                        json={"model": model_name, "prompt": truncated_text},
-                        timeout=30,
-                    )
-                    response.raise_for_status()
-
-                    result = response.json()
-                    embedding = result.get("embedding")
-
-                    if embedding is None:
-                        raise ValueError(f"No embedding returned for text {i}")
-                    if not isinstance(embedding, list) or len(embedding) == 0:
-                        raise ValueError(f"Invalid embedding format for text {i}")
-
-                    all_embeddings.append(embedding)
-                    break
-
-                except requests.exceptions.Timeout:
-                    retry_count += 1
-                    if retry_count >= max_retries:
-                        logger.warning(f"Timeout for text {i} after {max_retries} retries")
-                        failed_indices.append(i)
-                        all_embeddings.append(None)
-                        break
-                except Exception as e:
-                    retry_count += 1
-                    if retry_count >= max_retries:
-                        logger.error(f"Failed to get embedding for text {i}: {e}")
-                        failed_indices.append(i)
-                        all_embeddings.append(None)
-                        break
-
-        return all_embeddings, failed_indices
-
-    # Process texts in batches
-    all_embeddings = []
-    all_failed_indices = []
-
-    # Setup progress bar if needed
-    show_progress = is_build or len(texts) > 10
-    try:
-        if show_progress:
-            from tqdm import tqdm
-    except ImportError:
-        show_progress = False
-
-    # Process batches
-    num_batches = (len(texts) + batch_size - 1) // batch_size
-    if show_progress:
-        batch_iterator = tqdm(range(num_batches), desc="Computing Ollama embeddings")
-    else:
-        batch_iterator = range(num_batches)
-
-    for batch_idx in batch_iterator:
-        start_idx = batch_idx * batch_size
-        end_idx = min(start_idx + batch_size, len(texts))
-        batch_texts = texts[start_idx:end_idx]
-
-        batch_embeddings, batch_failed = get_batch_embeddings(batch_texts)
-
-        # Adjust failed indices to global indices
-        global_failed = [start_idx + idx for idx in batch_failed]
-        all_failed_indices.extend(global_failed)
-        all_embeddings.extend(batch_embeddings)
+    # Process embeddings with optimized concurrent processing
+    import requests
+
+    def get_single_embedding(text_idx_tuple):
+        """Helper function to get embedding for a single text."""
+        text, idx = text_idx_tuple
+        max_retries = 3
+        retry_count = 0
+
+        # Truncate very long texts to avoid API issues
+        truncated_text = text[:8000] if len(text) > 8000 else text
+
+        while retry_count < max_retries:
+            try:
+                response = requests.post(
+                    f"{host}/api/embeddings",
+                    json={"model": model_name, "prompt": truncated_text},
+                    timeout=30,
+                )
+                response.raise_for_status()
+
+                result = response.json()
+                embedding = result.get("embedding")
+
+                if embedding is None:
+                    raise ValueError(f"No embedding returned for text {idx}")
+
+                return idx, embedding
+
+            except requests.exceptions.Timeout:
+                retry_count += 1
+                if retry_count >= max_retries:
+                    logger.warning(f"Timeout for text {idx} after {max_retries} retries")
+                    return idx, None
+            except Exception as e:
+                if retry_count >= max_retries - 1:
+                    logger.error(f"Failed to get embedding for text {idx}: {e}")
+                    return idx, None
+                retry_count += 1
+
+        return idx, None
+
+    # Determine if we should use concurrent processing
+    use_concurrent = (
+        len(texts) > 5 and not is_build
+    )  # Don't use concurrent in build mode to avoid overwhelming
+    max_workers = min(4, len(texts))  # Limit concurrent requests to avoid overwhelming Ollama
+
+    all_embeddings = [None] * len(texts)  # Pre-allocate list to maintain order
+    failed_indices = []
+
+    if use_concurrent:
+        logger.info(
+            f"Using concurrent processing with {max_workers} workers for {len(texts)} texts"
+        )
+        with ThreadPoolExecutor(max_workers=max_workers) as executor:
+            # Submit all tasks
+            future_to_idx = {
+                executor.submit(get_single_embedding, (text, idx)): idx
+                for idx, text in enumerate(texts)
+            }
+
+            # Add progress bar for concurrent processing
+            try:
+                if is_build or len(texts) > 10:
+                    from tqdm import tqdm
+
+                    futures_iterator = tqdm(
+                        as_completed(future_to_idx),
+                        total=len(texts),
+                        desc="Computing Ollama embeddings",
+                    )
+                else:
+                    futures_iterator = as_completed(future_to_idx)
+            except ImportError:
+                futures_iterator = as_completed(future_to_idx)
+
+            # Collect results as they complete
+            for future in futures_iterator:
+                try:
+                    idx, embedding = future.result()
+                    if embedding is not None:
+                        all_embeddings[idx] = embedding
+                    else:
+                        failed_indices.append(idx)
+                except Exception as e:
+                    idx = future_to_idx[future]
+                    logger.error(f"Exception for text {idx}: {e}")
+                    failed_indices.append(idx)
+    else:
+        # Sequential processing with progress bar
+        show_progress = is_build or len(texts) > 10
+        try:
+            if show_progress:
+                from tqdm import tqdm
+
+                iterator = tqdm(
+                    enumerate(texts), total=len(texts), desc="Computing Ollama embeddings"
+                )
+            else:
+                iterator = enumerate(texts)
+        except ImportError:
+            iterator = enumerate(texts)
+
+        for idx, text in iterator:
+            result_idx, embedding = get_single_embedding((text, idx))
+            if embedding is not None:
+                all_embeddings[idx] = embedding
+            else:
+                failed_indices.append(idx)

     # Handle failed embeddings
-    if all_failed_indices:
-        if len(all_failed_indices) == len(texts):
+    if failed_indices:
+        if len(failed_indices) == len(texts):
             raise RuntimeError("Failed to compute any embeddings")
-        logger.warning(
-            f"Failed to compute embeddings for {len(all_failed_indices)}/{len(texts)} texts"
-        )
+        logger.warning(f"Failed to compute embeddings for {len(failed_indices)}/{len(texts)} texts")

         # Use zero embeddings as fallback for failed ones
         valid_embedding = next((e for e in all_embeddings if e is not None), None)
         if valid_embedding:
             embedding_dim = len(valid_embedding)
-            for i, embedding in enumerate(all_embeddings):
-                if embedding is None:
-                    all_embeddings[i] = [0.0] * embedding_dim
+            for idx in failed_indices:
+                all_embeddings[idx] = [0.0] * embedding_dim

-    # Remove None values
+    # Remove None values and convert to numpy array
     all_embeddings = [e for e in all_embeddings if e is not None]
-    if not all_embeddings:
-        raise RuntimeError("No valid embeddings were computed")
-
-    # Validate embedding dimensions
-    expected_dim = len(all_embeddings[0])
-    inconsistent_dims = []
-    for i, embedding in enumerate(all_embeddings):
-        if len(embedding) != expected_dim:
-            inconsistent_dims.append((i, len(embedding)))
-
-    if inconsistent_dims:
-        error_msg = f"Ollama returned inconsistent embedding dimensions. Expected {expected_dim}, but got:\n"
-        for idx, dim in inconsistent_dims[:10]:  # Show first 10 inconsistent ones
-            error_msg += f"  - Text {idx}: {dim} dimensions\n"
-        if len(inconsistent_dims) > 10:
-            error_msg += f"  ... and {len(inconsistent_dims) - 10} more\n"
-        error_msg += f"\nThis is likely an Ollama API bug with model '{model_name}'. Please try:\n"
-        error_msg += "1. Restart Ollama service: 'ollama serve'\n"
-        error_msg += f"2. Re-pull the model: 'ollama pull {model_name}'\n"
-        error_msg += (
-            "3. Use sentence-transformers instead: --embedding-mode sentence-transformers\n"
-        )
-        error_msg += "4. Report this issue to Ollama: https://github.com/ollama/ollama/issues"
-        raise ValueError(error_msg)
+    # Validate embedding dimensions before creating numpy array
+    if all_embeddings:
+        expected_dim = len(all_embeddings[0])
+        inconsistent_dims = []
+        for i, embedding in enumerate(all_embeddings):
+            if len(embedding) != expected_dim:
+                inconsistent_dims.append((i, len(embedding)))
+
+        if inconsistent_dims:
+            error_msg = f"Ollama returned inconsistent embedding dimensions. Expected {expected_dim}, but got:\n"
+            for idx, dim in inconsistent_dims[:10]:  # Show first 10 inconsistent ones
+                error_msg += f"  - Text {idx}: {dim} dimensions\n"
+            if len(inconsistent_dims) > 10:
+                error_msg += f"  ... and {len(inconsistent_dims) - 10} more\n"
+            error_msg += (
+                f"\nThis is likely an Ollama API bug with model '{model_name}'. Please try:\n"
+            )
+            error_msg += "1. Restart Ollama service: 'ollama serve'\n"
+            error_msg += f"2. Re-pull the model: 'ollama pull {model_name}'\n"
+            error_msg += (
+                "3. Use sentence-transformers instead: --embedding-mode sentence-transformers\n"
+            )
+            error_msg += "4. Report this issue to Ollama: https://github.com/ollama/ollama/issues"
+            raise ValueError(error_msg)

     # Convert to numpy array and normalize
     embeddings = np.array(all_embeddings, dtype=np.float32)
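Both the batch implementation on the `-` side and the concurrent implementation on the `+` side issue the same per-text request; for reference, each call is equivalent to the following (model name illustrative):

```bash
curl -s http://localhost:11434/api/embeddings \
  -d '{"model": "nomic-embed-text", "prompt": "hello world"}'
# -> {"embedding": [0.12, -0.03, ...]}
```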

View File

@@ -45,42 +45,6 @@ leann build my-project --docs ./
 claude
 ```

-## 🚀 Advanced Usage Examples
-
-### Index Entire Git Repository
-```bash
-# Index all tracked files in your git repository, note right now we will skip submodules, but we can add it back easily if you want
-leann build my-repo --docs $(git ls-files) --embedding-mode sentence-transformers --embedding-model all-MiniLM-L6-v2 --backend hnsw
-
-# Index only specific file types from git
-leann build my-python-code --docs $(git ls-files "*.py") --embedding-mode sentence-transformers --embedding-model all-MiniLM-L6-v2 --backend hnsw
-```
-
-### Multiple Directories and Files
-```bash
-# Index multiple directories
-leann build my-codebase --docs ./src ./tests ./docs ./config --embedding-mode sentence-transformers --embedding-model all-MiniLM-L6-v2 --backend hnsw
-
-# Mix files and directories
-leann build my-project --docs ./README.md ./src/ ./package.json ./docs/ --embedding-mode sentence-transformers --embedding-model all-MiniLM-L6-v2 --backend hnsw
-
-# Specific files only
-leann build my-configs --docs ./tsconfig.json ./package.json ./webpack.config.js --embedding-mode sentence-transformers --embedding-model all-MiniLM-L6-v2 --backend hnsw
-```
-
-### Advanced Git Integration
-```bash
-# Index recently modified files
-leann build recent-changes --docs $(git diff --name-only HEAD~10..HEAD) --embedding-mode sentence-transformers --embedding-model all-MiniLM-L6-v2 --backend hnsw
-
-# Index files matching pattern
-leann build frontend --docs $(git ls-files "*.tsx" "*.ts" "*.jsx" "*.js") --embedding-mode sentence-transformers --embedding-model all-MiniLM-L6-v2 --backend hnsw
-
-# Index documentation and config files
-leann build docs-and-configs --docs $(git ls-files "*.md" "*.yml" "*.yaml" "*.json" "*.toml") --embedding-mode sentence-transformers --embedding-model all-MiniLM-L6-v2 --backend hnsw
-```
-
 **Try this in Claude Code:**
 ```
 Help me understand this codebase. List available indexes and search for authentication patterns.