Fix compress endpoint to use request.messages correctly
This commit is contained in:
parent
9ad11f5be4
commit
5505d2b217
1 changed file with 3 additions and 2 deletions
5
main.py
5
main.py
|
|
@@ -19,7 +19,8 @@ from schemas import (
|
|||
Convention as ConventionSchema,
|
||||
MemoryBase,
|
||||
Memory as MemorySchema,
|
||||
- ContextBundle
|
||||
+ ContextBundle,
|
||||
+ CompressionRequest
|
||||
)
|
||||
from rag import build_context_bundle, clear_cache as clear_rag_cache
|
||||
from compression import compress_conversation, count_tokens
|
||||
|
|
@@ -442,7 +443,7 @@ async def compress_messages_endpoint(
|
|||
ollama_model=config.compression.ollama_model,
|
||||
ollama_url=config.compression.ollama_url
|
||||
)
|
||||
- original_tokens = sum(count_tokens(m.get("content", "")) for m in messages)
|
||||
+ original_tokens = sum(count_tokens(m.get("content", "")) for m in request.messages)
|
||||
compressed_tokens = sum(count_tokens(m.get("content", "")) for m in compressed)
|
||||
|
||||
return {
|
||||
|
|
|
|||
Loading…
Add table
Reference in a new issue