vespa-engine · thomasht86 · Dec 1, 2025 · Oct 22, 2025 · Oct 22, 2025 · Oct 22, 2025
diff --git a/examples/README.md b/examples/README.md
@@ -0,0 +1,104 @@
+# NanoBEIR Evaluation Example
+
+This example demonstrates how to use the `vespa.nanobeir` module to easily configure and run NanoBEIR evaluations with different embedding models.
+
+## Overview
+
+The `vespa.nanobeir` module provides utilities to simplify the creation of Vespa applications for information retrieval evaluation. It handles the complexity of configuring different embedding models with varying dimensions, tokenizers, and binary vs. float embeddings.
+
+## Key Features
+
+- **Model-centric configuration**: All model-specific parameters (dimension, tokenizer, binarization) are encapsulated in a `ModelConfig` object
+- **Automatic field type selection**: The embedding field type is automatically set to `tensor<float>` or `tensor<int8>` based on whether embeddings are binarized
+- **Automatic indexing configuration**: For binarized embeddings, `pack_bits` is automatically added to the indexing statement
+- **Distance metric selection**: Uses hamming distance for binarized embeddings and cosine similarity (angular distance) for float embeddings
+- **Predefined models**: Includes configurations for common models like e5-small-v2, e5-base-v2, snowflake-arctic-embed, and bge-m3
+
+## Usage
+
+### Basic Example
+
+```python
+from vespa.nanobeir import get_model_config, create_evaluation_package
+
+# Get a predefined model configuration
+config = get_model_config("e5-small-v2")
+
+# Create a complete application package
+package = create_evaluation_package(config, app_name="myeval")
+
+# Deploy to Vespa Cloud or local Docker
+# ... (deployment code)
+```
+
+### Custom Model Configuration
+
+```python
+from vespa.nanobeir import ModelConfig, create_embedder_component, create_embedding_field
+
+# Define a custom model
+config = ModelConfig(
+    model_id="my-custom-model",
+    embedding_dim=512,
+    tokenizer_id="bert-base-uncased",
+    binarized=False,
+)
+
+# Create individual components
+embedder = create_embedder_component(config)
+embedding_field = create_embedding_field(config)
+```
+
+### Binary Embeddings
+
+```python
+from vespa.nanobeir import ModelConfig
+
+# Configure for binary embeddings
+config = ModelConfig(
+    model_id="bge-m3",
+    embedding_dim=1024,  # Dimension before bit packing (1024 bits -> 128 int8 values)
+    binarized=True,
+)
+
+# The resulting field will be tensor<int8>(x[128]) with pack_bits in indexing
+# The ranking profile will use hamming distance
+```
+
+## Running the Example
+
+```bash
+# From the repository root
+uv run python examples/nanobeir_evaluation_example.py
+```
+
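+This will demonstrate:
+1. Creating single-model packages from a predefined name (e5-small-v2, nomic-ai-modernbert) and from a custom `ModelConfig`
+2. Creating multi-model packages (e5-small-v2 + e5-base-v2, and a predefined model mixed with a custom one)
+3. Building an embedder component and embedding field directly from a URL-based custom configuration
+4. Listing all available predefined models (including the binary `bge-m3-binary`)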
+
+## Available Predefined Models
+
+- `e5-small-v2`: 384-dimensional float embeddings
+- `e5-base-v2`: 768-dimensional float embeddings
+- `snowflake-arctic-embed-xs`: 384-dimensional float embeddings
+- `snowflake-arctic-embed-s`: 384-dimensional float embeddings
+- `snowflake-arctic-embed-m`: 768-dimensional float embeddings
+- `bge-m3-binary`: 1024-dimensional binary embeddings (packed to 128 int8 values)
+
+## Next Steps
+
+After creating an application package:
+
+1. **Deploy to Vespa**: Use `VespaCloud` or `VespaDocker` to deploy your application
+2. **Feed documents**: Load the NanoBEIR dataset and feed documents to Vespa
+3. **Run evaluation**: Use `VespaEvaluator` or `VespaMatchEvaluator` to evaluate retrieval quality
+4. **Compare models**: Run the same evaluation with different model configurations to compare performance
+
+## Related Documentation
+
+- [vespa.nanobeir API Reference](../vespa/nanobeir.py)
+- [vespa.evaluation API Reference](../vespa/evaluation.py)
+- [Vespa Documentation - Embeddings](https://docs.vespa.ai/en/embedding.html)
+- [Vespa Documentation - Binary Quantization](https://docs.vespa.ai/en/embedding.html#binary-quantization)
diff --git a/examples/nanobeir_evaluation_example.py b/examples/nanobeir_evaluation_example.py
@@ -0,0 +1,196 @@
+#!/usr/bin/env python3
+"""
+Example script demonstrating NanoBEIR evaluation with different models.
+
+This script shows how to easily switch between different embedding models
+for evaluation, handling differences in embedding dimensions, tokenizers,
+and binary vs. float embeddings.
+"""
+
+from vespa.nanobeir import (
+    ModelConfig,
+    get_model_config,
+    create_embedder_component,
+    create_embedding_field,
+    create_evaluation_package,
+)
+
+
+def main():
+    """
+    Main function demonstrating evaluation setup with different models.
+    """
+    print("NanoBEIR Evaluation Example")
+    print("=" * 60)
+
+    # Example 1: Single predefined model, passed to create_evaluation_package by name (e5-small-v2)
+    print("\n1. Single model: e5-small-v2 (float embeddings, 384 dim)")
+    print("-" * 60)
+    package_e5_small = create_evaluation_package(
+        "e5-small-v2",
+        app_name="nanobeirsmall",
+    )
+    config_e5_small = get_model_config("e5-small-v2")  # looked up separately only to print the model's settings
+    print(f"   Model: {config_e5_small.model_id}")
+    print(f"   Embedding dim: {config_e5_small.embedding_dim}")
+    print(f"   Binarized: {config_e5_small.binarized}")
+    print(f"   Component ID: {config_e5_small.component_id}")
+    embedding_field = package_e5_small.schema.document.fields[2]  # NOTE(review): assumes the embedding field is the third document field — confirm against create_evaluation_package
+    print(f"   Schema embedding field name: {embedding_field.name}")
+    print(f"   Schema embedding field type: {embedding_field.type}")
+    print(f"   Number of components: {len(package_e5_small.components)}")
+    print(f"   Number of rank profiles: {len(package_e5_small.schema.rank_profiles)}")
+    profile_names = [
+        p.name if hasattr(p, "name") else str(p)  # use .name when the item has one, otherwise its string form
+        for p in package_e5_small.schema.rank_profiles
+    ]
+    print(f"   Rank profile names: {profile_names}")
+
+    # Example 2: Single model described by a hand-built ModelConfig instead of a predefined name
+    print("\n2. Single model with custom config (512 dim)")
+    print("-" * 60)
+    custom_config = ModelConfig(
+        model_id="custom-embedding-model",
+        embedding_dim=512,
+        tokenizer_id="bert-base-uncased",
+        binarized=False,
+    )
+    package_custom = create_evaluation_package(
+        custom_config,
+        app_name="nanobeircustom",
+    )
+    print(f"   Model: {custom_config.model_id}")
+    print(f"   Tokenizer: {custom_config.tokenizer_id}")
+    print(f"   Embedding dim: {custom_config.embedding_dim}")
+    embedding_field = package_custom.schema.document.fields[2]  # NOTE(review): same positional assumption as in Example 1 — confirm
+    print(f"   Schema embedding field name: {embedding_field.name}")
+    print(f"   Schema embedding field type: {embedding_field.type}")
+
+    # Example 3: Multiple models in one package (e5-small-v2 and e5-base-v2), passed as a list of names
+    print("\n3. Multiple models: e5-small-v2 (384 dim) + e5-base-v2 (768 dim)")
+    print("-" * 60)
+    package_multi = create_evaluation_package(
+        ["e5-small-v2", "e5-base-v2"],
+        app_name="nanobeirmulti",
+    )
+    print("   Number of models: 2")  # literal count; matches the two names passed above
+    print(f"   Number of components: {len(package_multi.components)}")
+    print(f"   Component IDs: {[c.id for c in package_multi.components]}")
+    embedding_fields = [
+        f
+        for f in package_multi.schema.document.fields
+        if f.name.startswith("embedding")  # select embedding fields by name prefix rather than by position
+    ]
+    print(f"   Number of embedding fields: {len(embedding_fields)}")
+    print(f"   Embedding field names: {[f.name for f in embedding_fields]}")
+    print(f"   Embedding field types: {[f.type for f in embedding_fields]}")
+    print(f"   Number of rank profiles: {len(package_multi.schema.rank_profiles)}")
+    profile_names_multi = [
+        p.name if hasattr(p, "name") else str(p)  # same name-or-string fallback as in Example 1
+        for p in package_multi.schema.rank_profiles
+    ]
+    print(f"   Rank profile names: {profile_names_multi}")
+
+    # Example 4: Multiple models given as a mixed list (predefined name + custom ModelConfig)
+    print("\n4. Multiple models: e5-small-v2 + custom model (mixed configs)")
+    print("-" * 60)
+    custom_mixed = ModelConfig(
+        model_id="my-custom-embedder",
+        embedding_dim=256,
+        binarized=False,
+    )
+    package_mixed = create_evaluation_package(
+        ["e5-small-v2", custom_mixed],
+        app_name="nanobeirmixed",
+    )
+    print(f"   Number of components: {len(package_mixed.components)}")
+    print(f"   Component IDs: {[c.id for c in package_mixed.components]}")
+    embedding_fields_mixed = [
+        f
+        for f in package_mixed.schema.document.fields
+        if f.name.startswith("embedding")  # same name-prefix selection as in Example 3
+    ]
+    print(f"   Embedding field names: {[f.name for f in embedding_fields_mixed]}")
+    print(f"   Embedding field types: {[f.type for f in embedding_fields_mixed]}")
+
+    # Example 5: Predefined ModernBERT model; prints its max_tokens, transformer_output and prepend settings
+    print("\n5. Single model: nomic-ai-modernbert (ModernBERT-based, 768 dim)")
+    print("-" * 60)
+    config_modernbert = get_model_config("nomic-ai-modernbert")
+    package_modernbert = create_evaluation_package(
+        "nomic-ai-modernbert",
+        app_name="nanobeirmodern",
+    )
+    print(f"   Model: {config_modernbert.model_id}")
+    print(f"   Embedding dim: {config_modernbert.embedding_dim}")
+    print(f"   Max tokens: {config_modernbert.max_tokens}")
+    print(f"   Transformer output: {config_modernbert.transformer_output}")
+    print(f"   Query prepend: {config_modernbert.query_prepend}")
+    print(f"   Document prepend: {config_modernbert.document_prepend}")
+    embedding_field = package_modernbert.schema.document.fields[2]  # NOTE(review): same positional assumption as in Example 1 — confirm
+    print(f"   Schema embedding field name: {embedding_field.name}")
+    print(f"   Schema embedding field type: {embedding_field.type}")
+    print(f"   Distance metric: {embedding_field.ann.distance_metric}")
+
+    # Example 6: List every entry of COMMON_MODELS with its dimension and a "(binary)" marker when binarized
+    print("\n6. Available predefined models:")
+    print("-" * 60)
+    from vespa.nanobeir import COMMON_MODELS  # function-local import; only this example uses COMMON_MODELS
+
+    for model_name, config in COMMON_MODELS.items():
+        binary_str = " (binary)" if config.binarized else ""
+        print(f"   - {model_name}: {config.embedding_dim} dim{binary_str}")
+
+    # Example 7: URL-based ModelConfig; builds the embedder component and embedding field directly, without a full package
+    print("\n7. Advanced configuration: URL-based model with custom parameters")
+    print("-" * 60)
+    gte_config = ModelConfig(
+        model_id="gte-multilingual-base",
+        embedding_dim=768,
+        component_id="gte_multilingual",
+        model_url="https://huggingface.co/onnx-community/gte-multilingual-base/resolve/main/onnx/model_quantized.onnx",
+        tokenizer_url="https://huggingface.co/onnx-community/gte-multilingual-base/resolve/main/tokenizer.json",
+        transformer_output="token_embeddings",
+        max_tokens=8192,
+        query_prepend="Represent this sentence for searching relevant passages: ",
+        document_prepend="passage: ",
+    )
+
+    embedder = create_embedder_component(gte_config)
+    embedding_field = create_embedding_field(gte_config)
+
+    print(f"   Model: {gte_config.model_id}")
+    print(f"   Embedding dim: {gte_config.embedding_dim}")
+    print(f"   Component ID: {embedder.id}")
+    print(f"   Max tokens: {gte_config.max_tokens}")
+    print(f"   Transformer output: {gte_config.transformer_output}")
+    print(f"   Query prepend: {gte_config.query_prepend[:50]}...")  # show only the first 50 characters of the prepend text
+    print(f"   Document prepend: {gte_config.document_prepend}")
+    print(f"   Number of parameters: {len(embedder.parameters)}")
+    print(f"   Schema embedding field type: {embedding_field.type}")
+
+    print("\n" + "=" * 60)
+    print("Example complete!")
+    print("\nNext steps:")  # everything from here on is static summary text
+    print("1. Deploy the package to Vespa Cloud or local Docker")
+    print("2. Load NanoBEIR dataset and feed documents")
+    print("3. Run evaluation using VespaEvaluator or VespaMatchEvaluator")
+    print("4. Compare results across different models")
+    print("\nAdvanced features demonstrated:")
+    print("- Using predefined model configurations")
+    print("- Creating custom model configurations")
+    print("- Single model setup with simple function call")
+    print("- Multiple model setup with automatic field/component naming")
+    print("- Mixed model configurations (predefined + custom)")
+    print("- Binary vs. float embeddings")  # NOTE(review): no example above sets binarized=True — confirm this bullet is intended
+    print("- URL-based model loading")
+    print("- Additional embedder parameters (transformer-output, max-tokens, prepend)")
+    print("\nKey benefits of multi-model support:")
+    print("- Evaluate multiple models in single deployment")
+    print("- Compare model performance side-by-side")
+    print("- Automatic conflict resolution (fields/components named uniquely)")
+    print("- Each model gets its own set of rank profiles")
+
+
+if __name__ == "__main__":  # run the demo only when executed as a script, not when imported
+    main()