feat: remove API worker and batch size configurations; update CodexLens settings for v2

2026-03-19 18:58:47 +08:00 · 2026-03-17 20:44:26 +08:00
parent f37189dc64
commit ef2c5a58e1
11 changed files with 313 additions and 142 deletions
--- a/ccw/frontend/src/components/codexlens/OverviewTab.test.tsx
+++ b/ccw/frontend/src/components/codexlens/OverviewTab.test.tsx
@@ -20,8 +20,6 @@ const mockStatus: CodexLensVenvStatus = {
 const mockConfig: CodexLensConfig = {
  index_dir: '~/.codexlens/indexes',
  index_count: 100,
  api_max_workers: 4,
  api_batch_size: 8,
 };
 // Mock window.alert
@@ -243,8 +241,6 @@ describe('OverviewTab', () => {
      const emptyConfig: CodexLensConfig = {
        index_dir: '',
        index_count: 0,
        api_max_workers: 4,
        api_batch_size: 8,
      };
      render(
--- a/ccw/frontend/src/components/codexlens/SettingsTab.test.tsx
+++ b/ccw/frontend/src/components/codexlens/SettingsTab.test.tsx
@@ -54,8 +54,6 @@ import {
 const mockConfig: CodexLensConfig = {
  index_dir: '~/.codexlens/indexes',
  index_count: 100,
  api_max_workers: 4,
  api_batch_size: 8,
 };
 const mockEnv: Record<string, string> = {
@@ -75,8 +73,6 @@ function setupDefaultMocks() {
    config: mockConfig,
    indexDir: mockConfig.index_dir,
    indexCount: 100,
    apiMaxWorkers: 4,
    apiBatchSize: 8,
    isLoading: false,
    error: null,
    refetch: vi.fn(),
@@ -298,8 +294,6 @@ describe('SettingsTab', () => {
        config: mockConfig,
        indexDir: mockConfig.index_dir,
        indexCount: 100,
        apiMaxWorkers: 4,
        apiBatchSize: 8,
        isLoading: true,
        error: null,
        refetch: vi.fn(),
--- a/ccw/frontend/src/components/codexlens/SettingsTab.tsx
+++ b/ccw/frontend/src/components/codexlens/SettingsTab.tsx
@@ -1,8 +1,8 @@
 // ========================================
 // CodexLens Settings Tab
 // ========================================
-// Structured form for CodexLens env configuration
+// Structured form for CodexLens v2 env configuration
-// Renders 5 groups: embedding, reranker, concurrency, cascade, chunking
+// Renders 4 groups: embedding, reranker, search, indexing
 // Plus a general config section (index_dir)
 import { useState, useEffect, useCallback, useMemo } from 'react';
@@ -33,12 +33,10 @@ export function SettingsTab({ enabled = true }: SettingsTabProps) {
  const { formatMessage } = useIntl();
  const { success, error: showError } = useNotifications();
-  // Fetch current config (index_dir, workers, batch_size)
+  // Fetch current config (index_dir, index_count)
  const {
    config,
    indexCount,
    apiMaxWorkers,
    apiBatchSize,
    isLoading: isLoadingConfig,
    refetch: refetchConfig,
  } = useCodexLensConfig({ enabled });
@@ -199,25 +197,13 @@ export function SettingsTab({ enabled = true }: SettingsTabProps) {
    <div className="space-y-6">
      {/* Current Info Card */}
      <Card className="p-4 bg-muted/30">
-        <div className="grid grid-cols-1 md:grid-cols-3 gap-4 text-sm">
+        <div className="text-sm">
          <div>
            <span className="text-muted-foreground">
              {formatMessage({ id: 'codexlens.settings.currentCount' })}
            </span>
            <p className="text-foreground font-medium">{indexCount}</p>
          </div>
          <div>
            <span className="text-muted-foreground">
              {formatMessage({ id: 'codexlens.settings.currentWorkers' })}
            </span>
            <p className="text-foreground font-medium">{apiMaxWorkers}</p>
          </div>
          <div>
            <span className="text-muted-foreground">
              {formatMessage({ id: 'codexlens.settings.currentBatchSize' })}
            </span>
            <p className="text-foreground font-medium">{apiBatchSize}</p>
          </div>
        </div>
      </Card>
--- a/ccw/frontend/src/hooks/useCodexLens.test.tsx
+++ b/ccw/frontend/src/hooks/useCodexLens.test.tsx
@@ -65,8 +65,6 @@ const mockDashboardData = {
  config: {
    index_dir: '~/.codexlens/indexes',
    index_count: 100,
    api_max_workers: 4,
    api_batch_size: 8,
  },
  semantic: { available: true },
 };
@@ -165,8 +163,6 @@ describe('useCodexLens Hook', () => {
      const mockConfig = {
        index_dir: '~/.codexlens/indexes',
        index_count: 100,
        api_max_workers: 4,
        api_batch_size: 8,
      };
      vi.mocked(api.fetchCodexLensConfig).mockResolvedValue(mockConfig);
@@ -177,8 +173,6 @@ describe('useCodexLens Hook', () => {
      expect(api.fetchCodexLensConfig).toHaveBeenCalledOnce();
      expect(result.current.indexDir).toBe('~/.codexlens/indexes');
      expect(result.current.indexCount).toBe(100);
      expect(result.current.apiMaxWorkers).toBe(4);
      expect(result.current.apiBatchSize).toBe(8);
    });
  });
@@ -253,14 +247,10 @@ describe('useCodexLens Hook', () => {
      const updateResult = await result.current.updateConfig({
        index_dir: '~/.codexlens/indexes',
        api_max_workers: 8,
        api_batch_size: 16,
      });
      expect(api.updateCodexLensConfig).toHaveBeenCalledWith({
        index_dir: '~/.codexlens/indexes',
        api_max_workers: 8,
        api_batch_size: 16,
      });
      expect(updateResult.success).toBe(true);
      expect(updateResult.message).toBe('Config updated');
--- a/ccw/frontend/src/hooks/useCodexLens.ts
+++ b/ccw/frontend/src/hooks/useCodexLens.ts
@@ -259,8 +259,6 @@ export interface UseCodexLensConfigReturn {
  config: CodexLensConfig | undefined;
  indexDir: string;
  indexCount: number;
  apiMaxWorkers: number;
  apiBatchSize: number;
  isLoading: boolean;
  error: Error | null;
  refetch: () => Promise<void>;
@@ -288,8 +286,6 @@ export function useCodexLensConfig(options: UseCodexLensConfigOptions = {}): Use
    config: query.data,
    indexDir: query.data?.index_dir ?? '~/.codexlens/indexes',
    indexCount: query.data?.index_count ?? 0,
    apiMaxWorkers: query.data?.api_max_workers ?? 4,
    apiBatchSize: query.data?.api_batch_size ?? 8,
    isLoading: query.isLoading,
    error: query.error,
    refetch,
@@ -530,7 +526,7 @@ export function useCodexLensIgnorePatterns(options: UseCodexLensIgnorePatternsOp
 // ========== Mutation Hooks ==========
 export interface UseUpdateCodexLensConfigReturn {
-  updateConfig: (config: { index_dir: string; api_max_workers?: number; api_batch_size?: number }) => Promise<{ success: boolean; message?: string }>;
+  updateConfig: (config: { index_dir: string }) => Promise<{ success: boolean; message?: string }>;
  isUpdating: boolean;
  error: Error | null;
 }
--- a/ccw/frontend/src/lib/api.ts
+++ b/ccw/frontend/src/lib/api.ts
@@ -5273,8 +5273,6 @@ export interface CodexLensStatusData {
 export interface CodexLensConfig {
  index_dir: string;
  index_count: number;
  api_max_workers: number;
  api_batch_size: number;
 }
 /**
@@ -5530,8 +5528,6 @@ export async function fetchCodexLensConfig(): Promise<CodexLensConfig> {
 */
 export async function updateCodexLensConfig(config: {
  index_dir: string;
  api_max_workers?: number;
  api_batch_size?: number;
 }): Promise<{ success: boolean; message?: string; error?: string }> {
  return fetchApi('/api/codexlens/config', {
    method: 'POST',
--- a/ccw/frontend/src/pages/CodexLensManagerPage.test.tsx
+++ b/ccw/frontend/src/pages/CodexLensManagerPage.test.tsx
@@ -63,8 +63,6 @@ const mockDashboardData = {
  config: {
    index_dir: '~/.codexlens/indexes',
    index_count: 100,
    api_max_workers: 4,
    api_batch_size: 8,
  },
  semantic: { available: true },
 };
--- a/ccw/src/core/routes/codexlens/config-handlers.ts
+++ b/ccw/src/core/routes/codexlens/config-handlers.ts
@@ -11,7 +11,13 @@ import {
  executeCodexLens,
  isIndexingInProgress,
  uninstallCodexLens,
  useCodexLensV2,
 } from '../../../tools/codex-lens.js';
 import {
  executeV2ListModels,
  executeV2DownloadModel,
  executeV2DeleteModel,
 } from '../../../tools/smart-search.js';
 import type { RouteContext } from '../types.js';
 import { EXEC_TIMEOUTS } from '../../../utils/exec-constants.js';
 import { extractJSON } from './utils.js';
@@ -268,7 +274,7 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
  if (pathname === '/api/codexlens/config' && req.method === 'GET') {
    try {
      const venvStatus = await checkVenvStatus();
-      let responseData = { index_dir: '~/.codexlens/indexes', index_count: 0, api_max_workers: 4, api_batch_size: 8 };
+      let responseData = { index_dir: '~/.codexlens/indexes', index_count: 0 };
      // If not installed, return default config without executing CodexLens
      if (!venvStatus.ready) {
@@ -290,13 +296,6 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
          if (config.success && config.result) {
            // CLI returns index_dir (not index_root)
            responseData.index_dir = config.result.index_dir || config.result.index_root || responseData.index_dir;
            // Extract API settings
            if (config.result.api_max_workers !== undefined) {
              responseData.api_max_workers = config.result.api_max_workers;
            }
            if (config.result.api_batch_size !== undefined) {
              responseData.api_batch_size = config.result.api_batch_size;
            }
          }
        } catch (e: unknown) {
          console.error('[CodexLens] Failed to parse config:', e instanceof Error ? e.message : String(e));
@@ -340,10 +339,8 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
  // API: CodexLens Config - POST (Set configuration)
  if (pathname === '/api/codexlens/config' && req.method === 'POST') {
    handlePostRequest(req, res, async (body: unknown) => {
-      const { index_dir, api_max_workers, api_batch_size } = body as {
+      const { index_dir } = body as {
        index_dir?: unknown;
        api_max_workers?: unknown;
        api_batch_size?: unknown;
      };
      if (!index_dir) {
@@ -377,20 +374,6 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
        return { success: false, error: 'Invalid path: path traversal not allowed', status: 400 };
      }
      // Validate api settings
      if (api_max_workers !== undefined) {
        const workers = Number(api_max_workers);
        if (isNaN(workers) || workers < 1 || workers > 32) {
          return { success: false, error: 'api_max_workers must be between 1 and 32', status: 400 };
        }
      }
      if (api_batch_size !== undefined) {
        const batch = Number(api_batch_size);
        if (isNaN(batch) || batch < 1 || batch > 64) {
          return { success: false, error: 'api_batch_size must be between 1 and 64', status: 400 };
        }
      }
      try {
        // Set index_dir
        const result = await executeCodexLens(['config', 'set', 'index_dir', indexDirStr, '--json']);
@@ -398,14 +381,6 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
          return { success: false, error: result.error || 'Failed to update index_dir', status: 500 };
        }
        // Set API settings if provided
        if (api_max_workers !== undefined) {
          await executeCodexLens(['config', 'set', 'api_max_workers', String(api_max_workers), '--json']);
        }
        if (api_batch_size !== undefined) {
          await executeCodexLens(['config', 'set', 'api_batch_size', String(api_batch_size), '--json']);
        }
        return { success: true, message: 'Configuration updated successfully' };
      } catch (err: unknown) {
        return { success: false, error: err instanceof Error ? err.message : String(err), status: 500 };
@@ -568,6 +543,22 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
  // API: CodexLens Model List (list available embedding AND reranker models)
  if (pathname === '/api/codexlens/models' && req.method === 'GET') {
    try {
      // v2 bridge: single list-models command returns all models with type
      if (useCodexLensV2()) {
        const result = await executeV2ListModels();
        if (result.success && result.status) {
          // v2 bridge returns array directly as status
          const models = Array.isArray(result.status) ? result.status : [];
          res.writeHead(200, { 'Content-Type': 'application/json' });
          res.end(JSON.stringify({ success: true, result: { models } }));
        } else {
          res.writeHead(500, { 'Content-Type': 'application/json' });
          res.end(JSON.stringify({ success: false, error: result.error || 'Failed to list models' }));
        }
        return true;
      }
      // v1 fallback: fetch embedding and reranker models separately
      // Check if CodexLens is installed first (without auto-installing)
      const venvStatus = await checkVenvStatus();
      if (!venvStatus.ready) {
@@ -625,10 +616,27 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
  // API: CodexLens Model Download (download embedding or reranker model by profile)
  if (pathname === '/api/codexlens/models/download' && req.method === 'POST') {
    handlePostRequest(req, res, async (body) => {
-      const { profile, model_type } = body as { profile?: unknown; model_type?: unknown };
+      const { profile, model_type, model_name } = body as { profile?: unknown; model_type?: unknown; model_name?: unknown };
      // v2 bridge: accepts model_name (HF name) directly; v1 uses profile names
      const resolvedProfile = typeof profile === 'string' && profile.trim().length > 0 ? profile.trim() : undefined;
      const resolvedModelName = typeof model_name === 'string' && model_name.trim().length > 0 ? model_name.trim() : undefined;
      const resolvedModelType = typeof model_type === 'string' ? model_type.trim() : undefined;
      // v2 bridge: download by model name
      if (useCodexLensV2()) {
        const nameToDownload = resolvedModelName || resolvedProfile;
        if (!nameToDownload) {
          return { success: false, error: 'model_name or profile is required', status: 400 };
        }
        const result = await executeV2DownloadModel(nameToDownload);
        if (result.success) {
          const data = (result.status && typeof result.status === 'object') ? result.status as Record<string, unknown> : {};
          return { success: true, ...data };
        }
        return { success: false, error: result.error, status: 500 };
      }
      // v1 fallback
      if (!resolvedProfile) {
        return { success: false, error: 'profile is required', status: 400 };
      }
@@ -705,6 +713,17 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
        return { success: false, error: 'Invalid model_name format. Expected: org/model-name', status: 400 };
      }
      // v2 bridge: download-model handles any HF model name directly
      if (useCodexLensV2()) {
        const result = await executeV2DownloadModel(resolvedModelName);
        if (result.success) {
          const data = (result.status && typeof result.status === 'object') ? result.status as Record<string, unknown> : {};
          return { success: true, ...data };
        }
        return { success: false, error: result.error, status: 500 };
      }
      // v1 fallback
      try {
        const result = await executeCodexLens([
          'model-download-custom', resolvedModelName,
@@ -732,10 +751,26 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
  // API: CodexLens Model Delete (delete embedding or reranker model by profile)
  if (pathname === '/api/codexlens/models/delete' && req.method === 'POST') {
    handlePostRequest(req, res, async (body) => {
-      const { profile, model_type } = body as { profile?: unknown; model_type?: unknown };
+      const { profile, model_type, model_name } = body as { profile?: unknown; model_type?: unknown; model_name?: unknown };
      const resolvedProfile = typeof profile === 'string' && profile.trim().length > 0 ? profile.trim() : undefined;
      const resolvedModelName = typeof model_name === 'string' && model_name.trim().length > 0 ? model_name.trim() : undefined;
      const resolvedModelType = typeof model_type === 'string' ? model_type.trim() : undefined;
      // v2 bridge: delete by model name
      if (useCodexLensV2()) {
        const nameToDelete = resolvedModelName || resolvedProfile;
        if (!nameToDelete) {
          return { success: false, error: 'model_name or profile is required', status: 400 };
        }
        const result = await executeV2DeleteModel(nameToDelete);
        if (result.success) {
          const data = (result.status && typeof result.status === 'object') ? result.status as Record<string, unknown> : {};
          return { success: true, ...data };
        }
        return { success: false, error: result.error, status: 500 };
      }
      // v1 fallback
      if (!resolvedProfile) {
        return { success: false, error: 'profile is required', status: 400 };
      }
@@ -1077,8 +1112,8 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
            const trimmed = line.trim();
            // Preserve comment lines that aren't our headers
            if (trimmed.startsWith('#') && !trimmed.includes('Managed by CCW')) {
-              if (!trimmed.includes('Reranker API') && !trimmed.includes('Embedding API') &&
+              if (!trimmed.includes('Reranker Configuration') && !trimmed.includes('Embedding Configuration') &&
-                  !trimmed.includes('LiteLLM Config') && !trimmed.includes('CodexLens Settings') &&
+                  !trimmed.includes('Search Pipeline') && !trimmed.includes('Indexing Settings') &&
                  !trimmed.includes('Other Settings') && !trimmed.includes('CodexLens Environment')) {
                existingComments.push(line);
              }
@@ -1116,9 +1151,20 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
        // Merge: update known keys from payload, preserve unknown keys
        const knownKeys = new Set([
-          'RERANKER_API_KEY', 'RERANKER_API_BASE', 'RERANKER_MODEL',
+          // v2 embedding
-          'EMBEDDING_API_KEY', 'EMBEDDING_API_BASE', 'EMBEDDING_MODEL',
+          'CODEXLENS_EMBEDDING_BACKEND', 'CODEXLENS_EMBEDDING_MODEL', 'CODEXLENS_USE_GPU',
-          'LITELLM_API_KEY', 'LITELLM_API_BASE', 'LITELLM_MODEL'
+          'CODEXLENS_EMBED_BATCH_SIZE', 'CODEXLENS_EMBED_API_URL', 'CODEXLENS_EMBED_API_KEY',
          'CODEXLENS_EMBED_API_MODEL', 'CODEXLENS_EMBED_API_ENDPOINTS', 'CODEXLENS_EMBED_DIM',
          'CODEXLENS_EMBED_API_CONCURRENCY', 'CODEXLENS_EMBED_API_MAX_TOKENS',
          // v2 reranker
          'CODEXLENS_RERANKER_BACKEND', 'CODEXLENS_RERANKER_MODEL', 'CODEXLENS_RERANKER_TOP_K',
          'CODEXLENS_RERANKER_BATCH_SIZE', 'CODEXLENS_RERANKER_API_URL',
          'CODEXLENS_RERANKER_API_KEY', 'CODEXLENS_RERANKER_API_MODEL',
          // v2 search pipeline
          'CODEXLENS_BINARY_TOP_K', 'CODEXLENS_ANN_TOP_K', 'CODEXLENS_FTS_TOP_K', 'CODEXLENS_FUSION_K',
          // v2 indexing
          'CODEXLENS_CODE_AWARE_CHUNKING', 'CODEXLENS_INDEX_WORKERS', 'CODEXLENS_MAX_FILE_SIZE',
          'CODEXLENS_HNSW_EF', 'CODEXLENS_HNSW_M',
        ]);
        // Apply updates from payload
@@ -1143,12 +1189,12 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
          lines.push(...existingComments, '');
        }
-        // Group by prefix
+        // Group by semantic category (v2 env var naming)
        const groups: Record<string, string[]> = {
          'EMBED': [],
          'RERANKER': [],
-          'EMBEDDING': [],
+          'SEARCH': [],
-          'LITELLM': [],
+          'INDEX': [],
          'CODEXLENS': [],
          'OTHER': []
        };
@@ -1161,29 +1207,29 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
            .replace(/\n/g, '\\n')   // Escape newlines
            .replace(/\r/g, '\\r');  // Escape carriage returns
          const line = `${key}="${escapedValue}"`;
-          if (key.startsWith('RERANKER_')) groups['RERANKER'].push(line);
+          if (key.includes('EMBED') || key === 'CODEXLENS_USE_GPU') groups['EMBED'].push(line);
-          else if (key.startsWith('EMBEDDING_')) groups['EMBEDDING'].push(line);
+          else if (key.includes('RERANKER')) groups['RERANKER'].push(line);
-          else if (key.startsWith('LITELLM_')) groups['LITELLM'].push(line);
+          else if (key.includes('BINARY_TOP_K') || key.includes('ANN_TOP_K') || key.includes('FTS_TOP_K') || key.includes('FUSION_K')) groups['SEARCH'].push(line);
-          else if (key.startsWith('CODEXLENS_')) groups['CODEXLENS'].push(line);
+          else if (key.includes('INDEX') || key.includes('HNSW') || key.includes('MAX_FILE_SIZE') || key.includes('CODE_AWARE')) groups['INDEX'].push(line);
          else groups['OTHER'].push(line);
        }
        // Add grouped content
        if (groups['EMBED'].length) {
          lines.push('# Embedding Configuration');
          lines.push(...groups['EMBED'], '');
        }
        if (groups['RERANKER'].length) {
-          lines.push('# Reranker API Configuration');
+          lines.push('# Reranker Configuration');
          lines.push(...groups['RERANKER'], '');
        }
-        if (groups['EMBEDDING'].length) {
+        if (groups['SEARCH'].length) {
-          lines.push('# Embedding API Configuration');
+          lines.push('# Search Pipeline');
-          lines.push(...groups['EMBEDDING'], '');
+          lines.push(...groups['SEARCH'], '');
        }
-        if (groups['LITELLM'].length) {
+        if (groups['INDEX'].length) {
-          lines.push('# LiteLLM Configuration');
+          lines.push('# Indexing Settings');
-          lines.push(...groups['LITELLM'], '');
+          lines.push(...groups['INDEX'], '');
        }
        if (groups['CODEXLENS'].length) {
          lines.push('# CodexLens Settings');
          lines.push(...groups['CODEXLENS'], '');
        }
        if (groups['OTHER'].length) {
          lines.push('# Other Settings');
@@ -1199,48 +1245,43 @@ export async function handleCodexLensConfigRoutes(ctx: RouteContext): Promise<bo
          const settingsContent = await readFile(settingsPath, 'utf-8');
          settings = JSON.parse(settingsContent);
        } catch {
-          // File doesn't exist, create default structure
+          // File doesn't exist, create default structure (v2 sections)
-          settings = { embedding: {}, reranker: {}, api: {}, cascade: {}, staged: {}, llm: {}, parsing: {}, indexing: {} };
+          settings = { embedding: {}, reranker: {}, search: {}, indexing: {} };
        }
-        // Map env vars to settings.json structure
+        // Map env vars to settings.json structure (v2 schema)
        const envToSettings: Record<string, { path: string[], transform?: (v: string) => any }> = {
          // Embedding
          'CODEXLENS_EMBEDDING_BACKEND': { path: ['embedding', 'backend'] },
          'CODEXLENS_EMBEDDING_MODEL': { path: ['embedding', 'model'] },
-          'CODEXLENS_USE_GPU': { path: ['embedding', 'use_gpu'], transform: v => v === 'true' },
+          'CODEXLENS_USE_GPU': { path: ['embedding', 'device'] },
-          'CODEXLENS_AUTO_EMBED_MISSING': { path: ['embedding', 'auto_embed_missing'], transform: v => v === 'true' },
+          'CODEXLENS_EMBED_BATCH_SIZE': { path: ['embedding', 'batch_size'], transform: v => parseInt(v, 10) },
-          'CODEXLENS_EMBEDDING_STRATEGY': { path: ['embedding', 'strategy'] },
+          'CODEXLENS_EMBED_API_URL': { path: ['embedding', 'api_url'] },
-          'CODEXLENS_EMBEDDING_COOLDOWN': { path: ['embedding', 'cooldown'], transform: v => parseFloat(v) },
+          'CODEXLENS_EMBED_API_KEY': { path: ['embedding', 'api_key'] },
          'CODEXLENS_EMBED_API_MODEL': { path: ['embedding', 'api_model'] },
          'CODEXLENS_EMBED_API_ENDPOINTS': { path: ['embedding', 'api_endpoints'] },
          'CODEXLENS_EMBED_DIM': { path: ['embedding', 'dim'], transform: v => parseInt(v, 10) },
          'CODEXLENS_EMBED_API_CONCURRENCY': { path: ['embedding', 'api_concurrency'], transform: v => parseInt(v, 10) },
          'CODEXLENS_EMBED_API_MAX_TOKENS': { path: ['embedding', 'api_max_tokens_per_batch'], transform: v => parseInt(v, 10) },
          // Reranker
          'CODEXLENS_RERANKER_BACKEND': { path: ['reranker', 'backend'] },
          'CODEXLENS_RERANKER_MODEL': { path: ['reranker', 'model'] },
          'CODEXLENS_RERANKER_ENABLED': { path: ['reranker', 'enabled'], transform: v => v === 'true' },
          'CODEXLENS_RERANKER_TOP_K': { path: ['reranker', 'top_k'], transform: v => parseInt(v, 10) },
-          'CODEXLENS_API_MAX_WORKERS': { path: ['api', 'max_workers'], transform: v => parseInt(v, 10) },
+          'CODEXLENS_RERANKER_BATCH_SIZE': { path: ['reranker', 'batch_size'], transform: v => parseInt(v, 10) },
-          'CODEXLENS_API_BATCH_SIZE': { path: ['api', 'batch_size'], transform: v => parseInt(v, 10) },
+          'CODEXLENS_RERANKER_API_URL': { path: ['reranker', 'api_url'] },
-          'CODEXLENS_API_BATCH_SIZE_DYNAMIC': { path: ['api', 'batch_size_dynamic'], transform: v => v === 'true' },
+          'CODEXLENS_RERANKER_API_KEY': { path: ['reranker', 'api_key'] },
-          'CODEXLENS_API_BATCH_SIZE_UTILIZATION': { path: ['api', 'batch_size_utilization_factor'], transform: v => parseFloat(v) },
+          'CODEXLENS_RERANKER_API_MODEL': { path: ['reranker', 'api_model'] },
-          'CODEXLENS_API_BATCH_SIZE_MAX': { path: ['api', 'batch_size_max'], transform: v => parseInt(v, 10) },
+          // Search pipeline
-          'CODEXLENS_CHARS_PER_TOKEN': { path: ['api', 'chars_per_token_estimate'], transform: v => parseInt(v, 10) },
+          'CODEXLENS_BINARY_TOP_K': { path: ['search', 'binary_top_k'], transform: v => parseInt(v, 10) },
-          'CODEXLENS_CASCADE_STRATEGY': { path: ['cascade', 'strategy'] },
+          'CODEXLENS_ANN_TOP_K': { path: ['search', 'ann_top_k'], transform: v => parseInt(v, 10) },
-          'CODEXLENS_CASCADE_COARSE_K': { path: ['cascade', 'coarse_k'], transform: v => parseInt(v, 10) },
+          'CODEXLENS_FTS_TOP_K': { path: ['search', 'fts_top_k'], transform: v => parseInt(v, 10) },
-          'CODEXLENS_CASCADE_FINE_K': { path: ['cascade', 'fine_k'], transform: v => parseInt(v, 10) },
+          'CODEXLENS_FUSION_K': { path: ['search', 'fusion_k'], transform: v => parseInt(v, 10) },
-          'CODEXLENS_STAGED_STAGE2_MODE': { path: ['staged', 'stage2_mode'] },
+          // Indexing
-          'CODEXLENS_STAGED_CLUSTERING_STRATEGY': { path: ['staged', 'clustering_strategy'] },
+          'CODEXLENS_CODE_AWARE_CHUNKING': { path: ['indexing', 'code_aware_chunking'], transform: v => v === 'true' },
-          'CODEXLENS_STAGED_CLUSTERING_MIN_SIZE': { path: ['staged', 'clustering_min_size'], transform: v => parseInt(v, 10) },
+          'CODEXLENS_INDEX_WORKERS': { path: ['indexing', 'workers'], transform: v => parseInt(v, 10) },
-          'CODEXLENS_ENABLE_STAGED_RERANK': { path: ['staged', 'enable_rerank'], transform: v => v === 'true' },
+          'CODEXLENS_MAX_FILE_SIZE': { path: ['indexing', 'max_file_size_bytes'], transform: v => parseInt(v, 10) },
-          'CODEXLENS_LLM_ENABLED': { path: ['llm', 'enabled'], transform: v => v === 'true' },
+          'CODEXLENS_HNSW_EF': { path: ['indexing', 'hnsw_ef'], transform: v => parseInt(v, 10) },
-          'CODEXLENS_LLM_BATCH_SIZE': { path: ['llm', 'batch_size'], transform: v => parseInt(v, 10) },
+          'CODEXLENS_HNSW_M': { path: ['indexing', 'hnsw_M'], transform: v => parseInt(v, 10) },
          'CODEXLENS_USE_ASTGREP': { path: ['parsing', 'use_astgrep'], transform: v => v === 'true' },
          'CODEXLENS_STATIC_GRAPH_ENABLED': { path: ['indexing', 'static_graph_enabled'], transform: v => v === 'true' },
          'CODEXLENS_STATIC_GRAPH_RELATIONSHIP_TYPES': {
            path: ['indexing', 'static_graph_relationship_types'],
            transform: v => v
              .split(',')
              .map((t) => t.trim())
              .filter((t) => t.length > 0),
          },
          'LITELLM_EMBEDDING_MODEL': { path: ['embedding', 'model'] },
          'LITELLM_RERANKER_MODEL': { path: ['reranker', 'model'] }
        };
        // Apply env vars to settings
--- a/ccw/src/tools/smart-search.ts
+++ b/ccw/src/tools/smart-search.ts
@@ -2356,6 +2356,28 @@ async function executeV2BridgeCommand(
  });
 }
 /**
 * List known models via v2 bridge (list-models subcommand).
 * Returns JSON array of {name, type, installed, cache_path}.
 */
 export async function executeV2ListModels(): Promise<SearchResult> {
  return executeV2BridgeCommand('list-models', []);
 }
 /**
 * Download a single model by name via v2 bridge (download-model subcommand).
 */
 export async function executeV2DownloadModel(modelName: string): Promise<SearchResult> {
  return executeV2BridgeCommand('download-model', [modelName], { timeout: 600000 });
 }
 /**
 * Delete a model from cache via v2 bridge (delete-model subcommand).
 */
 export async function executeV2DeleteModel(modelName: string): Promise<SearchResult> {
  return executeV2BridgeCommand('delete-model', [modelName]);
 }
 /**
 * Action: init (v2) - Initialize index and sync files.
 */
--- a/codex-lens-v2/src/codexlens_search/bridge.py
+++ b/codex-lens-v2/src/codexlens_search/bridge.py
@@ -386,6 +386,47 @@ def cmd_download_models(args: argparse.Namespace) -> None:
    })
 def cmd_list_models(args: argparse.Namespace) -> None:
    """List known embed/reranker models with cache status."""
    from codexlens_search import model_manager
    config = _create_config(args)
    models = model_manager.list_known_models(config)
    _json_output(models)
 def cmd_download_model(args: argparse.Namespace) -> None:
    """Download a single model by name."""
    from codexlens_search import model_manager
    config = _create_config(args)
    model_name = args.model_name
    model_manager.ensure_model(model_name, config)
    cached = model_manager._model_is_cached(
        model_name, model_manager._resolve_cache_dir(config)
    )
    _json_output({
        "status": "downloaded" if cached else "failed",
        "model": model_name,
    })
 def cmd_delete_model(args: argparse.Namespace) -> None:
    """Delete a model from cache."""
    from codexlens_search import model_manager
    config = _create_config(args)
    model_name = args.model_name
    deleted = model_manager.delete_model(model_name, config)
    _json_output({
        "status": "deleted" if deleted else "not_found",
        "model": model_name,
    })
 def cmd_status(args: argparse.Namespace) -> None:
    """Report index statistics."""
    from codexlens_search.indexing.metadata import MetadataStore
@@ -490,6 +531,17 @@ def _build_parser() -> argparse.ArgumentParser:
    p_dl = sub.add_parser("download-models", help="Download embed + reranker models")
    p_dl.add_argument("--embed-model", help="Override embed model name")
    # list-models
    sub.add_parser("list-models", help="List known models with cache status")
    # download-model (single model by name)
    p_dl_single = sub.add_parser("download-model", help="Download a single model by name")
    p_dl_single.add_argument("model_name", help="HuggingFace model name (e.g. BAAI/bge-small-en-v1.5)")
    # delete-model
    p_del = sub.add_parser("delete-model", help="Delete a model from cache")
    p_del.add_argument("model_name", help="HuggingFace model name to delete")
    # status
    sub.add_parser("status", help="Report index statistics")
@@ -528,6 +580,9 @@ def main() -> None:
        "sync": cmd_sync,
        "watch": cmd_watch,
        "download-models": cmd_download_models,
        "list-models": cmd_list_models,
        "download-model": cmd_download_model,
        "delete-model": cmd_delete_model,
        "status": cmd_status,
    }
--- a/codex-lens-v2/src/codexlens_search/model_manager.py
+++ b/codex-lens-v2/src/codexlens_search/model_manager.py
@@ -137,6 +137,103 @@ def _ensure_model_onnx(model_dir: Path) -> None:
            return
 def list_known_models(config: Config) -> list[dict]:
    """Return info for known embed/reranker models with cache status.
    Checks config defaults plus common alternative models.
    Returns list of dicts with keys: name, type, installed, cache_path.
    """
    cache_dir = _resolve_cache_dir(config)
    base = cache_dir or _default_fastembed_cache()
    # Known embedding models
    embed_models = [
        config.embed_model,
        "BAAI/bge-small-en-v1.5",
        "BAAI/bge-base-en-v1.5",
        "BAAI/bge-large-en-v1.5",
        "sentence-transformers/all-MiniLM-L6-v2",
    ]
    # Known reranker models
    reranker_models = [
        config.reranker_model,
        "Xenova/ms-marco-MiniLM-L-6-v2",
        "BAAI/bge-reranker-base",
        "BAAI/bge-reranker-v2-m3",
    ]
    seen: set[str] = set()
    results: list[dict] = []
    for name in embed_models:
        if name in seen:
            continue
        seen.add(name)
        cache_path = _find_model_cache_path(name, base)
        results.append({
            "name": name,
            "type": "embedding",
            "installed": cache_path is not None,
            "cache_path": cache_path,
        })
    for name in reranker_models:
        if name in seen:
            continue
        seen.add(name)
        cache_path = _find_model_cache_path(name, base)
        results.append({
            "name": name,
            "type": "reranker",
            "installed": cache_path is not None,
            "cache_path": cache_path,
        })
    return results
 def delete_model(model_name: str, config: Config) -> bool:
    """Remove a model from the HF/fastembed cache.
    Returns True if deleted, False if not found.
    """
    import shutil
    cache_dir = _resolve_cache_dir(config)
    base = cache_dir or _default_fastembed_cache()
    cache_path = _find_model_cache_path(model_name, base)
    if cache_path is None:
        log.warning("Model %s not found in cache", model_name)
        return False
    shutil.rmtree(cache_path)
    log.info("Deleted model %s from %s", model_name, cache_path)
    return True
 def _find_model_cache_path(model_name: str, base: str) -> str | None:
    """Find the cache directory path for a model, or None if not cached."""
    base_path = Path(base)
    if not base_path.exists():
        return None
    # Exact match first
    safe_name = model_name.replace("/", "--")
    model_dir = base_path / f"models--{safe_name}"
    if _dir_has_onnx(model_dir):
        return str(model_dir)
    # Partial match: fastembed remaps some model names
    short_name = model_name.split("/")[-1].lower()
    for d in base_path.iterdir():
        if short_name in d.name.lower() and _dir_has_onnx(d):
            return str(d)
    return None
 def get_cache_kwargs(config: Config) -> dict:
    """Return kwargs to pass to fastembed constructors for cache_dir."""
    cache_dir = _resolve_cache_dir(config)