ai-skills-api/config.yaml

38 lines
No EOL
1.4 KiB
YAML

# AI Skills API Configuration

# Server settings
# Host and port for the server.
host: "0.0.0.0"
port: 8675
# Database connection URL.
database_url: "sqlite+aiosqlite:///./ai.db"
# CORS origins. "*" is quoted because a bare * would start a YAML alias.
# Restrict this list in production.
cors_origins:
  - "*"
# RAG (Retrieval Augmented Generation) settings
# The keys below must stay indented under `rag:`. At column 0 they would be
# parsed as top-level keys and `rag` itself would be null.
rag:
  # How many items of each kind to include.
  max_skills: 3  # Number of skills to include in context
  max_conventions: 2  # Number of conventions to include
  max_snippets: 2  # Number of code snippets to include
  # Similarity cut-offs, each in the range 0-1.
  min_skill_score: 0.3  # Minimum similarity threshold for skills
  min_snippet_score: 0.25  # Minimum similarity for snippets
  embedding_model: "all-MiniLM-L6-v2"  # Sentence transformer model
# Compression settings
# The keys below must stay indented under `compression:`. At column 0,
# `enabled` would collide with any other top-level `enabled` key, and most
# parsers silently keep only the last duplicate.
compression:
  enabled: true
  # One of "extractive" (sumy), "ollama" (phi-3-mini), or "none".
  strategy: "ollama"
  keep_last_n: 3  # Number of recent exchanges to keep uncompressed
  max_tokens: 2000  # Target token budget for conversation history
  ollama_model: "phi3:mini"  # Only used if strategy is "ollama"
  # Ollama API endpoint (uses docker service name)
  ollama_url: "http://ollama:11434"
# Authentication (set and forget - simple API key)
# The keys below must stay indented under `auth:`. At column 0, `enabled`
# would be a top-level key and could silently override another section's
# `enabled` flag under last-wins duplicate handling.
auth:
  enabled: false  # Set to true to require API key on all endpoints
  # Placeholder value: change this if enabling auth.
  # NOTE(review): avoid committing a real key to version control; confirm
  # whether the service can read the key from the environment instead.
  api_key: "change-me-in-production"
  # NOTE(review): presumably the request header that carries the key;
  # confirm against the consumer.
  header_name: "X-API-Key"
# Logging configuration
# The keys below must stay indented under `logging:`. At column 0 they
# would be parsed as top-level keys and `logging` itself would be null.
logging:
  level: "INFO"
  format: "json"  # "json" for structured logs, "text" for human readable