Fix compress endpoint to use request.messages correctly

This commit is contained in:
Lukas Parsons 2026-03-22 22:47:49 -04:00
parent 9ad11f5be4
commit 5505d2b217

View file

@@ -19,7 +19,8 @@ from schemas import (
Convention as ConventionSchema,
MemoryBase,
Memory as MemorySchema,
-ContextBundle
+ContextBundle,
+CompressionRequest
)
from rag import build_context_bundle, clear_cache as clear_rag_cache
from compression import compress_conversation, count_tokens
@@ -442,7 +443,7 @@ async def compress_messages_endpoint(
ollama_model=config.compression.ollama_model,
ollama_url=config.compression.ollama_url
)
-original_tokens = sum(count_tokens(m.get("content", "")) for m in messages)
+original_tokens = sum(count_tokens(m.get("content", "")) for m in request.messages)
compressed_tokens = sum(count_tokens(m.get("content", "")) for m in compressed)
return {