Fix compress endpoint to use request.messages correctly
This commit is contained in:
parent
9ad11f5be4
commit
5505d2b217
1 changed file with 3 additions and 2 deletions
5
main.py
5
main.py
|
|
@@ -19,7 +19,8 @@ from schemas import (
|
||||||
Convention as ConventionSchema,
|
Convention as ConventionSchema,
|
||||||
MemoryBase,
|
MemoryBase,
|
||||||
Memory as MemorySchema,
|
Memory as MemorySchema,
|
||||||
ContextBundle
|
ContextBundle,
|
||||||
|
CompressionRequest
|
||||||
)
|
)
|
||||||
from rag import build_context_bundle, clear_cache as clear_rag_cache
|
from rag import build_context_bundle, clear_cache as clear_rag_cache
|
||||||
from compression import compress_conversation, count_tokens
|
from compression import compress_conversation, count_tokens
|
||||||
|
|
@@ -442,7 +443,7 @@ async def compress_messages_endpoint(
|
||||||
ollama_model=config.compression.ollama_model,
|
ollama_model=config.compression.ollama_model,
|
||||||
ollama_url=config.compression.ollama_url
|
ollama_url=config.compression.ollama_url
|
||||||
)
|
)
|
||||||
original_tokens = sum(count_tokens(m.get("content", "")) for m in messages)
|
original_tokens = sum(count_tokens(m.get("content", "")) for m in request.messages)
|
||||||
compressed_tokens = sum(count_tokens(m.get("content", "")) for m in compressed)
|
compressed_tokens = sum(count_tokens(m.get("content", "")) for m in compressed)
|
||||||
|
|
||||||
return {
|
return {
|
||||||
|
|
|
||||||
Loading…
Add table
Reference in a new issue