Fix compress endpoint to use request.messages correctly

This commit is contained in:
Lukas Parsons 2026-03-22 22:47:49 -04:00
parent 9ad11f5be4
commit 5505d2b217

View file

@@ -19,7 +19,8 @@ from schemas import (
 Convention as ConventionSchema,
 MemoryBase,
 Memory as MemorySchema,
-ContextBundle
+ContextBundle,
+CompressionRequest
 )
 from rag import build_context_bundle, clear_cache as clear_rag_cache
 from compression import compress_conversation, count_tokens
@@ -442,7 +443,7 @@ async def compress_messages_endpoint(
 ollama_model=config.compression.ollama_model,
 ollama_url=config.compression.ollama_url
 )
-original_tokens = sum(count_tokens(m.get("content", "")) for m in messages)
+original_tokens = sum(count_tokens(m.get("content", "")) for m in request.messages)
 compressed_tokens = sum(count_tokens(m.get("content", "")) for m in compressed)
 return {