
🚀 Major Performance Improvements: - Increased CPU quota from 800% to 2000% (20/24 cores) - Enhanced threading: OMP/MKL/BLAS threads from 8 to 20 - Upgraded context length from 4096 to 8192 tokens - Deployed optimized 7-8B parameter models 🔧 Infrastructure Enhancements: - Updated ollama.nix with comprehensive CPU optimizations - Added memory-efficient q8_0 KV cache configuration - Implemented systemd resource limits and I/O optimizations - Forced cpu_avx2 library for optimal performance 📊 Performance Results: - Achieved 734% CPU utilization during inference - Maintained stable 6.5GB memory usage (19.9% of available) - Confirmed 3-4x performance improvement over baseline - Successfully running qwen2.5-coder:7b and deepseek-r1:7b models 🎯 TaskMaster Integration: - Consolidated duplicate .taskmaster configurations - Merged tasks from packages folder to project root - Updated MCP service configuration with optimized models - Verified AI-powered task expansion functionality 📝 Documentation: - Created comprehensive performance report - Documented optimization strategies and results - Added monitoring commands and validation procedures - Established baseline for future improvements ✅ Deployment Status: - Successfully deployed via NixOS declarative configuration - Tested post-reboot functionality and stability - Confirmed all optimizations active and performing optimally - Ready for production AI-assisted development workflows
34 lines
No EOL
856 B
JSON
34 lines
No EOL
856 B
JSON
{
|
|
"models": {
|
|
"main": {
|
|
"provider": "anthropic",
|
|
"modelId": "claude-3-7-sonnet-20250219",
|
|
"maxTokens": 120000,
|
|
"temperature": 0.2
|
|
},
|
|
"research": {
|
|
"provider": "perplexity",
|
|
"modelId": "sonar-pro",
|
|
"maxTokens": 8700,
|
|
"temperature": 0.1
|
|
},
|
|
"fallback": {
|
|
"provider": "anthropic",
|
|
"modelId": "claude-3-5-sonnet-20240620",
|
|
"maxTokens": 8192,
|
|
"temperature": 0.1
|
|
}
|
|
},
|
|
"global": {
|
|
"logLevel": "info",
|
|
"debug": false,
|
|
"defaultSubtasks": 5,
|
|
"defaultPriority": "medium",
|
|
"projectName": "Taskmaster",
|
|
"ollamaBaseURL": "http://localhost:11434/api",
|
|
"bedrockBaseURL": "https://bedrock.us-east-1.amazonaws.com",
|
|
"defaultTag": "master",
|
|
"azureOpenaiBaseURL": "https://your-endpoint.openai.azure.com/",
|
|
"userId": "1234567890"
|
|
}
|
|
} |