Files
EverOS/config.example.toml
tomtan 0910affc78
Some checks failed
CI / lint (push) Has been cancelled
CI / unit tests (push) Has been cancelled
CI / integration tests (push) Has been cancelled
CI / package build (push) Has been cancelled
Commit lint / pull request title (push) Has been cancelled
Commit lint / commit messages (push) Has been cancelled
Save local modifications for syncing
2026-06-10 10:05:52 +08:00

70 lines
2.4 KiB
TOML

# Example user-level config — copy to ~/.everos/config.toml.
#
#     cp config.example.toml ~/.everos/config.toml
#     $EDITOR ~/.everos/config.toml    # fill in api_key / base_url
#
# Override priority (low → high):
#
#     src/everos/config/default.toml
#   < ~/.everos/config.toml                    (THIS FILE)
#   < .env in the working directory
#   < EVEROS_<SECTION>__<KEY> process environment variables
#   < programmatic init args
#
# The location of this user-level file is configurable: set
# EVEROS_CONFIG_FILE=/path/to/your.toml to point at any location.
# A missing file is silently skipped (no error).
#
# Comment out anything you do not need — only the fields you set here
# override the shipped defaults; everything else falls back to
# src/everos/config/default.toml.
# ── LLM ───────────────────────────────────────────────
# OpenAI-protocol chat-completions endpoint used by the algo extractors.
# Any key removed or commented out in this table falls back to the value
# shipped in src/everos/config/default.toml.
[llm]
model = "gpt-4o-mini"
# Placeholder — replace with your real key before use. Process envs of the
# form EVEROS_<SECTION>__<KEY> take priority over this file (presumably
# EVEROS_LLM__API_KEY for this field — confirm the exact spelling).
api_key = "sk-..."
base_url = "https://api.openai.com/v1"
# Timeout in seconds; written as a float.
# NOTE(review): presumably applies per request — confirm against the client.
timeout_seconds = 180.0
# ── Multimodal LLM ───────────────────────────────────
# Independent vision/audio-capable chat-completions endpoint for parsing.
# Configured separately from [llm]: this table carries its own model,
# api_key and base_url.
[multimodal]
model = "google/gemini-3-flash-preview"
# Placeholder — replace with the key for the provider behind base_url.
api_key = "sk-..."
base_url = "https://openrouter.ai/api/v1"
# Timeout in seconds; written as a float.
timeout_seconds = 180.0
# NOTE(review): presumably downsizes images before they are sent to the
# vision model — confirm against the parsing code.
resize_images_for_vlm = true
# NOTE: this table spells the key `max_concurrency`, while [embedding] and
# [rerank] in this file use `max_concurrent`. Presumably each spelling
# matches what its section's loader expects — verify before renaming.
max_concurrency = 4
# ── Embedding ─────────────────────────────────────────
# Endpoint and model used for embeddings.
# NOTE(review): the base_url path ends in /v1/openai, which suggests an
# OpenAI-compatible API — confirm against the embedding client.
[embedding]
model = "Qwen/Qwen3-Embedding-4B"
# Placeholder — replace with your real key before use.
api_key = "..."
base_url = "https://api.deepinfra.com/v1/openai"
# Runtime knobs (defaults shown):
# These repeat the shipped defaults, so they only need to stay in this file
# if you intend to change them.
# Timeout in seconds; written as a float.
timeout_seconds = 30.0
max_retries = 3
# NOTE(review): presumably the number of inputs sent per request — confirm.
batch_size = 10
# NOTE(review): presumably the cap on in-flight requests — confirm.
max_concurrent = 5
# ── Rerank ────────────────────────────────────────────
# Endpoint and model used for reranking.
# Note that base_url here ends in /v1/inference, whereas [embedding] uses
# /v1/openai on the same host; the two are not interchangeable copies.
[rerank]
model = "Qwen/Qwen3-Reranker-4B"
# Placeholder — replace with your real key before use.
api_key = "..."
base_url = "https://api.deepinfra.com/v1/inference"
# Same four runtime knobs, with the same values, as in [embedding].
# NOTE(review): [embedding] labels its values "defaults shown"; presumably
# these are the shipped defaults too — confirm against default.toml.
# Timeout in seconds; written as a float.
timeout_seconds = 30.0
max_retries = 3
batch_size = 10
max_concurrent = 5
# ── Other tunables you may want to override here ──────
# [memory]
# root = "~/.everos"
# timezone = "Asia/Shanghai"
#
# [sqlite]
# busy_timeout_ms = 10000
#
# [lancedb]
# read_consistency_seconds = 5.0