const { existsSync, mkdirSync } = require('fs');
const { join } = require('path');
const { homedir } = require('os');
const CODEGRAPH_DIR = join(homedir(), '.codegraph');
const MODELS_DIR = join(CODEGRAPH_DIR, 'models');
const MODEL_ID = 'nomic-ai/nomic-embed-text-v1.5';
async function downloadModel() {
if (!existsSync(CODEGRAPH_DIR)) {
mkdirSync(CODEGRAPH_DIR, { recursive: true });
}
if (!existsSync(MODELS_DIR)) {
mkdirSync(MODELS_DIR, { recursive: true });
}
const modelCachePath = join(MODELS_DIR, MODEL_ID.replace('/', '/'));
if (existsSync(modelCachePath)) {
console.log('Embedding model already downloaded.');
return;
}
console.log('Downloading embedding model (~130MB)...');
console.log('This is a one-time download for semantic code search.\n');
try {
const { pipeline, env } = await import('@xenova/transformers');
env.cacheDir = MODELS_DIR;
await pipeline('feature-extraction', MODEL_ID, {
progress_callback: (progress) => {
if (progress.status === 'progress' && progress.file && progress.progress !== undefined) {
const fileName = progress.file.split('/').pop();
const percent = Math.round(progress.progress);
process.stdout.write(`\rDownloading ${fileName}... ${percent}% `);
} else if (progress.status === 'done') {
process.stdout.write('\n');
}
},
});
console.log('\nEmbedding model ready!');
} catch (error) {
console.log('\nNote: Could not download embedding model.');
console.log('Semantic search will download it on first use.');
if (process.env.DEBUG) {
console.error(error);
}
}
}
downloadModel().catch(() => {
process.exit(0);
});