"""Integration tests for token metadata storage and retrieval."""
import pytest
import tempfile
from pathlib import Path
from codexlens.entities import Symbol, IndexedFile
from codexlens.storage.sqlite_store import SQLiteStore
from codexlens.storage.dir_index import DirIndexStore
from codexlens.storage.migration_manager import MigrationManager


class TestTokenMetadataStorage:
    """Tests for storing and retrieving token metadata."""

    def test_sqlite_store_saves_token_count(self):
        """Test that SQLiteStore saves token_count for symbols."""
        with tempfile.TemporaryDirectory() as tmpdir:
            db_path = Path(tmpdir) / "test.db"
            store = SQLiteStore(db_path)
            with store:
                # Create indexed file with symbols containing token counts
                symbols = [
                    Symbol(
                        name="func1",
                        kind="function",
                        range=(1, 5),
                        token_count=42,
                        symbol_type="function_definition"
                    ),
                    Symbol(
                        name="func2",
                        kind="function",
                        range=(7, 12),
                        token_count=73,
                        symbol_type="function_definition"
                    ),
                ]
                indexed_file = IndexedFile(
                    path=str(Path(tmpdir) / "test.py"),
                    language="python",
                    symbols=symbols
                )
                content = "def func1():\n pass\n\ndef func2():\n pass\n"
                store.add_file(indexed_file, content)

                # Retrieve symbols through the regular search path
                retrieved_symbols = store.search_symbols("func", limit=10)
                assert len(retrieved_symbols) == 2
                # Note: search_symbols does not return token_count, so the
                # length check above only confirms that both symbols were
                # persisted and are retrievable.
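
                # Minimal direct check (sketch): query the symbols table the
                # same way the accuracy tests below do, to confirm both symbols
                # were persisted with their basic fields.
                conn = store._get_connection()
                cursor = conn.execute("SELECT name, kind FROM symbols ORDER BY name")
                rows = cursor.fetchall()
                assert [row["name"] for row in rows] == ["func1", "func2"]
                assert all(row["kind"] == "function" for row in rows)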

    def test_dir_index_store_saves_token_count(self):
        """Test that DirIndexStore saves token_count for symbols."""
        with tempfile.TemporaryDirectory() as tmpdir:
            db_path = Path(tmpdir) / "_index.db"
            store = DirIndexStore(db_path)
            with store:
                symbols = [
                    Symbol(
                        name="calculate",
                        kind="function",
                        range=(1, 10),
                        token_count=128,
                        symbol_type="function_definition"
                    ),
                ]
                file_id = store.add_file(
                    name="math.py",
                    full_path=Path(tmpdir) / "math.py",
                    content="def calculate(x, y):\n return x + y\n",
                    language="python",
                    symbols=symbols
                )
                assert file_id > 0

                # Verify file was stored
                file_entry = store.get_file(Path(tmpdir) / "math.py")
                assert file_entry is not None
                assert file_entry.name == "math.py"

    def test_migration_adds_token_columns(self):
        """Test that migrations properly handle token_count and symbol_type columns.

        Note: Migration 002 adds these columns, but migration 005 removes them
        as they were identified as unused/redundant. New databases should not
        have these columns.
        """
        with tempfile.TemporaryDirectory() as tmpdir:
            db_path = Path(tmpdir) / "test.db"
            store = SQLiteStore(db_path)
            with store:
                # Apply migrations
                conn = store._get_connection()
                manager = MigrationManager(conn)
                manager.apply_migrations()

                # Verify columns do NOT exist after all migrations
                # (migration_005 removes token_count and symbol_type)
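                # PRAGMA table_info returns one row per column as
                # (cid, name, type, notnull, dflt_value, pk), so row[1] below
                # is the column name.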
cursor = conn.execute("PRAGMA table_info(symbols)")
columns = {row[1] for row in cursor.fetchall()}
# These columns should NOT be present after migration_005
assert "token_count" not in columns, "token_count should be removed by migration_005"
assert "symbol_type" not in columns, "symbol_type should be removed by migration_005"
# Index on symbol_type should also not exist
cursor = conn.execute(
"SELECT name FROM sqlite_master WHERE type='index' AND name='idx_symbols_type'"
)
index = cursor.fetchone()
assert index is None, "idx_symbols_type should not exist after migration_005"
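
                # Sanity-check sketch: the core symbol columns should survive
                # every migration (column names taken from the queries used
                # further down in this file).
                for col in ("name", "kind", "start_line", "end_line"):
                    assert col in columns, f"{col} should still exist after migrations"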

    def test_batch_insert_preserves_token_metadata(self):
        """Test that batch insert preserves token metadata."""
        with tempfile.TemporaryDirectory() as tmpdir:
            db_path = Path(tmpdir) / "test.db"
            store = SQLiteStore(db_path)
            with store:
                files_data = []
                for i in range(5):
                    symbols = [
                        Symbol(
                            name=f"func{i}",
                            kind="function",
                            range=(1, 3),
                            token_count=10 + i,
                            symbol_type="function_definition"
                        ),
                    ]
                    indexed_file = IndexedFile(
                        path=str(Path(tmpdir) / f"test{i}.py"),
                        language="python",
                        symbols=symbols
                    )
                    content = f"def func{i}():\n pass\n"
                    files_data.append((indexed_file, content))

                # Batch insert
                store.add_files(files_data)

                # Verify all files were stored
                stats = store.stats()
                assert stats["files"] == 5
                assert stats["symbols"] == 5

    def test_symbol_type_defaults_to_kind(self):
        """Test that symbol_type defaults to kind when not specified."""
        with tempfile.TemporaryDirectory() as tmpdir:
            db_path = Path(tmpdir) / "_index.db"
            store = DirIndexStore(db_path)
            with store:
                # Symbol without explicit symbol_type
                symbols = [
                    Symbol(
                        name="MyClass",
                        kind="class",
                        range=(1, 10),
                        token_count=200
                    ),
                ]
                store.add_file(
                    name="module.py",
                    full_path=Path(tmpdir) / "module.py",
                    content="class MyClass:\n pass\n",
                    language="python",
                    symbols=symbols
                )

                # Verify it was stored (symbol_type should default to 'class')
                file_entry = store.get_file(Path(tmpdir) / "module.py")
                assert file_entry is not None
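
                # Sketch: the symbol should also be retrievable by its declared
                # kind, which is the value symbol_type falls back to.
                class_symbols = store.search_symbols("MyClass", kind="class", limit=10)
                assert len(class_symbols) == 1
                assert class_symbols[0].name == "MyClass"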

    def test_null_token_count_allowed(self):
        """Test that NULL token_count is allowed for backward compatibility."""
        with tempfile.TemporaryDirectory() as tmpdir:
            db_path = Path(tmpdir) / "test.db"
            store = SQLiteStore(db_path)
            with store:
                # Symbol without token_count (None)
                symbols = [
                    Symbol(
                        name="legacy_func",
                        kind="function",
                        range=(1, 5)
                    ),
                ]
                indexed_file = IndexedFile(
                    path=str(Path(tmpdir) / "legacy.py"),
                    language="python",
                    symbols=symbols
                )
                content = "def legacy_func():\n pass\n"
                store.add_file(indexed_file, content)

                # Should not raise an error
                stats = store.stats()
                assert stats["symbols"] == 1

    def test_search_by_symbol_type(self):
        """Test searching/filtering symbols by symbol_type."""
        with tempfile.TemporaryDirectory() as tmpdir:
            db_path = Path(tmpdir) / "_index.db"
            store = DirIndexStore(db_path)
            with store:
                # Add symbols with different types
                symbols = [
                    Symbol(
                        name="MyClass",
                        kind="class",
                        range=(1, 10),
                        symbol_type="class_definition"
                    ),
                    Symbol(
                        name="my_function",
                        kind="function",
                        range=(12, 15),
                        symbol_type="function_definition"
                    ),
                    Symbol(
                        name="my_method",
                        kind="method",
                        range=(5, 8),
                        symbol_type="method_definition"
                    ),
                ]
                store.add_file(
                    name="code.py",
                    full_path=Path(tmpdir) / "code.py",
                    content="class MyClass:\n def my_method(self):\n pass\n\ndef my_function():\n pass\n",
                    language="python",
                    symbols=symbols
                )

                # Search for functions only
                function_symbols = store.search_symbols("my", kind="function", limit=10)
                assert len(function_symbols) == 1
                assert function_symbols[0].name == "my_function"

                # Search for methods only
                method_symbols = store.search_symbols("my", kind="method", limit=10)
                assert len(method_symbols) == 1
                assert method_symbols[0].name == "my_method"
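
                # And classes only (sketch mirroring the checks above; uses the
                # class name itself as the query to avoid assuming
                # case-insensitive matching).
                class_symbols = store.search_symbols("MyClass", kind="class", limit=10)
                assert len(class_symbols) == 1
                assert class_symbols[0].name == "MyClass"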


class TestTokenCountAccuracy:
    """Tests for symbol storage accuracy.

    Note: token_count and symbol_type columns were removed in migration_005
    as they were identified as unused/redundant. These tests now verify
    that symbols are stored correctly with their basic fields.
    """

    def test_stored_token_count_matches_original(self):
        """Test that symbols are stored correctly (token_count no longer stored).

        Note: token_count field was removed from schema. This test verifies
        that symbols are still stored correctly with basic fields.
        """
        with tempfile.TemporaryDirectory() as tmpdir:
            db_path = Path(tmpdir) / "test.db"
            store = SQLiteStore(db_path)
            with store:
                symbols = [
                    Symbol(
                        name="complex_func",
                        kind="function",
                        range=(1, 20),
                        token_count=256  # This field is accepted but not stored
                    ),
                ]
                indexed_file = IndexedFile(
                    path=str(Path(tmpdir) / "test.py"),
                    language="python",
                    symbols=symbols
                )
                content = "def complex_func():\n # Some complex logic\n pass\n"
                store.add_file(indexed_file, content)

                # Verify symbol is stored with basic fields
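                # Note: the row["..."] access below assumes the connection uses
                # a mapping row factory such as sqlite3.Row.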
                conn = store._get_connection()
                cursor = conn.execute(
                    "SELECT name, kind, start_line, end_line FROM symbols WHERE name = ?",
                    ("complex_func",)
                )
                row = cursor.fetchone()
                assert row is not None
                assert row["name"] == "complex_func"
                assert row["kind"] == "function"
                assert row["start_line"] == 1
                assert row["end_line"] == 20

    def test_100_percent_storage_accuracy(self):
        """Test that 100% of symbols are stored correctly.

        Note: token_count field was removed from schema. This test verifies
        that symbols are stored correctly with basic fields.
        """
        with tempfile.TemporaryDirectory() as tmpdir:
            db_path = Path(tmpdir) / "_index.db"
            store = DirIndexStore(db_path)
            with store:
                # Store symbols
                file_entries = []
                for i in range(100):
                    symbol_name = f"func{i}"
                    symbols = [
                        Symbol(
                            name=symbol_name,
                            kind="function",
                            range=(1, 2),
                            token_count=10 + i * 3  # Accepted but not stored
                        )
                    ]
                    file_path = Path(tmpdir) / f"file{i}.py"
                    file_entries.append((
                        f"file{i}.py",
                        file_path,
                        f"def {symbol_name}():\n pass\n",
                        "python",
                        symbols
                    ))

                count = store.add_files_batch(file_entries)
                assert count == 100

                # Verify all symbols are stored correctly
                conn = store._get_connection()
                cursor = conn.execute(
                    "SELECT name, kind, start_line, end_line FROM symbols ORDER BY name"
                )
                rows = cursor.fetchall()
                assert len(rows) == 100

                # Verify each symbol has correct basic fields
                for row in rows:
                    assert row["kind"] == "function"
                    assert row["start_line"] == 1
                    assert row["end_line"] == 2