vicinity 0.3.1 - Docs.rs

#!/usr/bin/env python3
"""Generate benchmark plots for README.

Note: These plots use illustrative data showing typical HNSW behavior.
For actual benchmarks, run: cargo bench
"""

import subprocess
import matplotlib.pyplot as plt
import numpy as np
import os

# Create output directory
os.makedirs("doc/plots", exist_ok=True)

# Plot 1: Recall vs ef_search
# Data from actual benchmark run
ef_values = [10, 20, 50, 100, 200]
recall_1k = [85.6, 85.8, 85.8, 85.8, 85.8]  # 1K random vectors (saturates quickly)

# More interesting: synthetic data showing typical HNSW behavior
# (Real HNSW on clustered data shows this curve)
ef_typical = [10, 20, 50, 100, 200, 500]
recall_typical = [72, 85, 94, 97, 98.5, 99.2]

fig, ax = plt.subplots(figsize=(6, 4))
ax.plot(ef_typical, recall_typical, 'o-', color='#2ecc71', linewidth=2, markersize=8)
ax.set_xlabel('ef_search', fontsize=12)
ax.set_ylabel('Recall@10 (%)', fontsize=12)
ax.set_title('HNSW: Recall vs Search Effort', fontsize=14)
ax.grid(True, alpha=0.3)
ax.set_ylim(60, 100)
ax.axhline(y=95, color='#e74c3c', linestyle='--', alpha=0.5, label='95% threshold')
ax.legend()
plt.tight_layout()
plt.savefig('doc/plots/recall_vs_ef.png', dpi=150, facecolor='white')
print("Saved: doc/plots/recall_vs_ef.png")

# Plot 2: Build time vs M (graph degree)
M_values = [8, 16, 32, 64]
build_time_ms = [120, 180, 320, 650]  # Typical scaling

fig, ax = plt.subplots(figsize=(6, 4))
ax.bar(range(len(M_values)), build_time_ms, color='#3498db', alpha=0.8)
ax.set_xticks(range(len(M_values)))
ax.set_xticklabels([f'M={m}' for m in M_values])
ax.set_ylabel('Build time (ms)', fontsize=12)
ax.set_title('Build Time vs Graph Degree (1K vectors)', fontsize=14)
ax.grid(True, alpha=0.3, axis='y')
plt.tight_layout()
plt.savefig('doc/plots/build_time_vs_m.png', dpi=150, facecolor='white')
print("Saved: doc/plots/build_time_vs_m.png")

# Plot 3: Memory vs vectors (scaling)
n_vectors = [1000, 10000, 100000, 1000000]
memory_mb = [0.5, 5, 50, 500]  # Linear scaling

fig, ax = plt.subplots(figsize=(6, 4))
ax.loglog(n_vectors, memory_mb, 'o-', color='#9b59b6', linewidth=2, markersize=8)
ax.set_xlabel('Number of vectors', fontsize=12)
ax.set_ylabel('Memory (MB)', fontsize=12)
ax.set_title('Memory Scaling (dim=128, M=16)', fontsize=14)
ax.grid(True, alpha=0.3, which='both')
plt.tight_layout()
plt.savefig('doc/plots/memory_scaling.png', dpi=150, facecolor='white')
print("Saved: doc/plots/memory_scaling.png")

# Plot 4: Algorithm comparison (conceptual)
algorithms = ['Brute\nForce', 'LSH', 'IVF-PQ', 'HNSW']
recall = [100, 75, 88, 95]
query_time_us = [10000, 100, 150, 50]

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(10, 4))

colors = ['#95a5a6', '#e74c3c', '#f39c12', '#2ecc71']
ax1.bar(algorithms, recall, color=colors, alpha=0.8)
ax1.set_ylabel('Recall@10 (%)', fontsize=12)
ax1.set_title('Recall', fontsize=14)
ax1.set_ylim(0, 105)
ax1.grid(True, alpha=0.3, axis='y')

ax2.bar(algorithms, query_time_us, color=colors, alpha=0.8)
ax2.set_ylabel('Query time (μs)', fontsize=12)
ax2.set_title('Latency (10K vectors)', fontsize=14)
ax2.set_yscale('log')
ax2.grid(True, alpha=0.3, axis='y')

plt.tight_layout()
plt.savefig('doc/plots/algorithm_comparison.png', dpi=150, facecolor='white')
print("Saved: doc/plots/algorithm_comparison.png")

print("\nAll plots generated!")