secubox-openwrt/package/secubox/secubox-app-localai/files/etc/config/localai
CyberMind-FR 55914b8b3c feat(localai): Update to LocalAI v3.10.0
- Updated default version from v2.25.0 to v3.10.0
- Fixed binary URL format: local-ai-v3.10.0-linux-arm64
- Updated Docker image tag to v3.10.0-ffmpeg

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
2026-01-21 18:34:05 +01:00

58 lines
1.8 KiB
Plaintext

# Global settings for the LocalAI service (named section 'main').
config main 'main'
# '0' here means the package ships with the service switched off.
# Presumably the init script only starts LocalAI when this is '1' - verify.
option enabled '0'
# Address/port for the HTTP API.
# NOTE(review): '0.0.0.0' is the IPv4 wildcard address; if the service binds to it
# as-is, the API is reachable on every interface - confirm firewall rules for this port.
option api_port '8080'
option api_host '0.0.0.0'
# Storage locations; models_path sits inside data_path.
option data_path '/srv/localai'
option models_path '/srv/localai/models'
# Resource tuning values. How each one is applied (container limit, CLI flag, env var)
# is decided by the consuming scripts, which are not part of this file - TODO confirm.
option memory_limit '2g'
option threads '4'
option context_size '2048'
# Boolean-style toggles ('0' = off, '1' = on).
option debug '0'
option cors '1'
# Runtime: 'lxc', 'docker', 'podman', or 'auto' (auto-detect)
option runtime 'auto'
# LXC settings (for runtime=lxc)
config lxc 'lxc'
# Base directory for LXC containers (presumably the container rootfs is created below it - verify).
option path '/srv/lxc'
# LocalAI release tag to install. The docker section's image tag in this file is pinned
# to the same release; bump both together when upgrading.
option version 'v3.10.0'
# Docker/Podman settings (for runtime=docker or podman)
config docker 'docker'
# Container image reference (repository:tag). The tag carries the same release number
# as the 'version' option in the lxc section.
# NOTE(review): confirm this exact tag (with the '-ffmpeg' suffix) is published for this release.
option image 'localai/localai:v3.10.0-ffmpeg'
# Default model to load on startup
config model 'default'
# '1' = this model entry is active.
option enabled '1'
# Matches the 'name' option of the 'tinyllama' preset section in this file
# (presumably the lookup key used to resolve the download URL - verify).
option name 'tinyllama'
# Inference backend identifier passed on to LocalAI.
option backend 'llama-cpp'
# Model presets - GGUF files for the llama-cpp backend, plus one ONNX embeddings model (gte_small)
# Preset: TinyLlama 1.1B Chat v1.0, Q4_K_M GGUF file hosted on Hugging Face.
config preset 'tinyllama'
# Model name; identical to the section id and to the default model's 'name'.
option name 'tinyllama'
option url 'https://huggingface.co/TheBloke/TinyLlama-1.1B-Chat-v1.0-GGUF/resolve/main/tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf'
# Human-readable size string (presumably the approximate download size, for display - verify).
option size '669M'
option type 'text-generation'
option description 'TinyLlama 1.1B - Ultra-lightweight'
# Preset: Microsoft Phi-2, Q4_K_M GGUF file hosted on Hugging Face.
config preset 'phi2'
# Note: the model name ('phi-2') differs from the section id ('phi2'); UCI section
# names cannot contain '-'. Which of the two users must type is up to the consumer - TODO confirm.
option name 'phi-2'
option url 'https://huggingface.co/TheBloke/phi-2-GGUF/resolve/main/phi-2.Q4_K_M.gguf'
# Human-readable size string (presumably the approximate download size, for display - verify).
option size '1.6G'
option type 'text-generation'
option description 'Microsoft Phi-2 - Compact and efficient'
# Preset: Mistral 7B Instruct v0.2, Q4_K_M GGUF file hosted on Hugging Face.
config preset 'mistral'
# Note: the model name ('mistral-7b') differs from the section id ('mistral').
option name 'mistral-7b'
option url 'https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.2-GGUF/resolve/main/mistral-7b-instruct-v0.2.Q4_K_M.gguf'
# Human-readable size string (presumably the approximate download size, for display - verify).
# NOTE(review): this is larger than main.memory_limit ('2g') in this file - confirm the
# model can actually be loaded with the default limit.
option size '4.1G'
option type 'text-generation'
option description 'Mistral 7B Instruct - High quality assistant'
# Preset: GTE Small embeddings model. Unlike the other presets, the URL points at an
# ONNX file rather than a GGUF file.
# NOTE(review): confirm which backend is used for this preset; the default model section
# in this file selects 'llama-cpp'.
config preset 'gte_small'
# Note: the model name ('gte-small') differs from the section id ('gte_small'); UCI
# section names cannot contain '-'.
option name 'gte-small'
# NOTE(review): verify this URL resolves to a file in the repository before relying on it.
option url 'https://huggingface.co/Supabase/gte-small/resolve/main/model.onnx'
# Human-readable size string (presumably the approximate download size, for display - verify).
option size '67M'
# The only preset here whose type is not 'text-generation'.
option type 'embeddings'
option description 'GTE Small - Fast embeddings'