-
Notifications
You must be signed in to change notification settings - Fork 21.2k
Expand file tree
/
Copy pathconfig.py
More file actions
5081 lines (4615 loc) · 211 KB
/
config.py
File metadata and controls
5081 lines (4615 loc) · 211 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
"""
Configuration management for Hermes Agent.
Config files are stored in ~/.hermes/ for easy access:
- ~/.hermes/config.yaml - All settings (model, toolsets, terminal, etc.)
- ~/.hermes/.env - API keys and secrets
This module provides:
- hermes config - Show current configuration
- hermes config edit - Open config in editor
- hermes config set - Set a specific value
- hermes config wizard - Re-run setup wizard
"""
import copy
import logging
import os
import platform
import re
import stat
import subprocess
import sys
import tempfile
from dataclasses import dataclass
from pathlib import Path
from typing import Dict, Any, Optional, List, Tuple
# Module-level logger; handlers/levels are expected to be configured by the application entrypoint.
logger = logging.getLogger(__name__)
# Platform flag — presumably gates POSIX-only chmod/umask behaviour elsewhere in this module; TODO confirm usage.
_IS_WINDOWS = platform.system() == "Windows"
# Valid POSIX-style env var name: letter/underscore first, then letters/digits/underscores.
_ENV_VAR_NAME_RE = re.compile(r"^[A-Za-z_][A-Za-z0-9_]*$")
# Last env-expanded config per path — consumers not visible in this chunk; verify against load_config().
_LAST_EXPANDED_CONFIG_BY_PATH: Dict[str, Any] = {}
# (path, mtime_ns, size) -> cached expanded config dict.
# load_config() returns a deepcopy of the cached value when the file
# hasn't changed since the last load, skipping yaml.safe_load +
# _deep_merge + _normalize_* + _expand_env_vars (~13 ms/call).
# save_config() + migrate_config() write via atomic_yaml_write which
# produces a fresh inode, so stat() sees a new mtime_ns and the next
# load repopulates automatically — no explicit invalidation hook.
_LOAD_CONFIG_CACHE: Dict[str, Tuple[int, int, Dict[str, Any]]] = {}
# (path, mtime_ns, size) -> cached raw yaml dict. Same pattern as
# _LOAD_CONFIG_CACHE but for read_raw_config() — used when callers want
# the user's on-disk values without defaults merged in.
_RAW_CONFIG_CACHE: Dict[str, Tuple[int, int, Dict[str, Any]]] = {}
# Env var names written to .env that aren't in OPTIONAL_ENV_VARS
# (managed by setup/provider flows directly).
# NOTE: grouped by messaging platform / subsystem; keep new keys with their group.
_EXTRA_ENV_KEYS = frozenset({
    "OPENAI_API_KEY", "OPENAI_BASE_URL",
    "ANTHROPIC_API_KEY", "ANTHROPIC_TOKEN",
    "DISCORD_HOME_CHANNEL", "DISCORD_HOME_CHANNEL_NAME",
    "TELEGRAM_HOME_CHANNEL", "TELEGRAM_HOME_CHANNEL_NAME",
    "SLACK_HOME_CHANNEL", "SLACK_HOME_CHANNEL_NAME",
    "SIGNAL_ACCOUNT", "SIGNAL_HTTP_URL",
    "SIGNAL_ALLOWED_USERS", "SIGNAL_GROUP_ALLOWED_USERS",
    "SIGNAL_HOME_CHANNEL", "SIGNAL_HOME_CHANNEL_NAME",
    "SMS_HOME_CHANNEL", "SMS_HOME_CHANNEL_NAME",
    "DINGTALK_CLIENT_ID", "DINGTALK_CLIENT_SECRET",
    "DINGTALK_HOME_CHANNEL", "DINGTALK_HOME_CHANNEL_NAME",
    "FEISHU_APP_ID", "FEISHU_APP_SECRET", "FEISHU_ENCRYPT_KEY", "FEISHU_VERIFICATION_TOKEN",
    "FEISHU_HOME_CHANNEL", "FEISHU_HOME_CHANNEL_NAME",
    "YUANBAO_HOME_CHANNEL", "YUANBAO_HOME_CHANNEL_NAME",
    "WECOM_BOT_ID", "WECOM_SECRET",
    "WECOM_CALLBACK_CORP_ID", "WECOM_CALLBACK_CORP_SECRET", "WECOM_CALLBACK_AGENT_ID",
    "WECOM_CALLBACK_TOKEN", "WECOM_CALLBACK_ENCODING_AES_KEY",
    "WECOM_CALLBACK_HOST", "WECOM_CALLBACK_PORT",
    "WECOM_HOME_CHANNEL", "WECOM_HOME_CHANNEL_NAME",
    "WEIXIN_ACCOUNT_ID", "WEIXIN_TOKEN", "WEIXIN_BASE_URL", "WEIXIN_CDN_BASE_URL",
    "WEIXIN_HOME_CHANNEL", "WEIXIN_HOME_CHANNEL_NAME", "WEIXIN_DM_POLICY", "WEIXIN_GROUP_POLICY",
    "WEIXIN_ALLOWED_USERS", "WEIXIN_GROUP_ALLOWED_USERS", "WEIXIN_ALLOW_ALL_USERS",
    "BLUEBUBBLES_SERVER_URL", "BLUEBUBBLES_PASSWORD",
    "BLUEBUBBLES_HOME_CHANNEL", "BLUEBUBBLES_HOME_CHANNEL_NAME",
    "QQ_APP_ID", "QQ_CLIENT_SECRET", "QQBOT_HOME_CHANNEL", "QQBOT_HOME_CHANNEL_NAME",
    "QQ_HOME_CHANNEL", "QQ_HOME_CHANNEL_NAME",  # legacy aliases (pre-rename, still read for back-compat)
    "QQ_ALLOWED_USERS", "QQ_GROUP_ALLOWED_USERS", "QQ_ALLOW_ALL_USERS", "QQ_MARKDOWN_SUPPORT",
    "QQ_STT_API_KEY", "QQ_STT_BASE_URL", "QQ_STT_MODEL",
    "IRC_SERVER", "IRC_PORT", "IRC_NICKNAME", "IRC_CHANNEL",
    "IRC_USE_TLS", "IRC_SERVER_PASSWORD", "IRC_NICKSERV_PASSWORD",
    "TERMINAL_ENV", "TERMINAL_SSH_KEY", "TERMINAL_SSH_PORT",
    "WHATSAPP_MODE", "WHATSAPP_ENABLED",
    "MATTERMOST_HOME_CHANNEL", "MATTERMOST_HOME_CHANNEL_NAME", "MATTERMOST_REPLY_MODE",
    "MATRIX_PASSWORD", "MATRIX_ENCRYPTION", "MATRIX_DEVICE_ID", "MATRIX_HOME_ROOM",
    "MATRIX_REQUIRE_MENTION", "MATRIX_FREE_RESPONSE_ROOMS", "MATRIX_AUTO_THREAD", "MATRIX_DM_AUTO_THREAD",
    "MATRIX_RECOVERY_KEY",
    # Langfuse observability plugin — optional tuning keys + standard SDK vars.
    # Activation is via plugins.enabled (opt-in through `hermes plugins enable
    # observability/langfuse` or `hermes tools → Langfuse`); credentials gate
    # the plugin at runtime.
    "HERMES_LANGFUSE_ENV",
    "HERMES_LANGFUSE_RELEASE",
    "HERMES_LANGFUSE_SAMPLE_RATE",
    "HERMES_LANGFUSE_MAX_CHARS",
    "HERMES_LANGFUSE_DEBUG",
    "LANGFUSE_PUBLIC_KEY",
    "LANGFUSE_SECRET_KEY",
    "LANGFUSE_BASE_URL",
})
import yaml
from hermes_cli.colors import Colors, color
from hermes_cli.default_soul import DEFAULT_SOUL_MD
# =============================================================================
# Managed mode (NixOS declarative config)
# =============================================================================
# Bare truthy spellings of HERMES_MANAGED that mean "managed by NixOS".
_MANAGED_TRUE_VALUES = ("true", "1", "yes")
# Canonical display names for known package-manager identifiers.
_MANAGED_SYSTEM_NAMES = {
    "brew": "Homebrew",
    "homebrew": "Homebrew",
    "nix": "NixOS",
    "nixos": "NixOS",
}

def get_managed_system() -> Optional[str]:
    """Return the package manager owning this install, if any.

    The HERMES_MANAGED env var wins: bare truthy values mean NixOS, known
    manager names map to their canonical spelling, and unknown values pass
    through verbatim. Without the env var, a ``.managed`` marker file in
    HERMES_HOME (dropped by the NixOS activation script) also means NixOS.
    Returns None when neither signal is present.
    """
    env_value = os.getenv("HERMES_MANAGED", "").strip()
    if not env_value:
        # Marker-file fallback so interactive shells (which don't inherit
        # the systemd unit's environment) still detect managed mode.
        return "NixOS" if (get_hermes_home() / ".managed").exists() else None
    key = env_value.lower()
    if key in _MANAGED_TRUE_VALUES:
        return "NixOS"
    return _MANAGED_SYSTEM_NAMES.get(key, env_value)
def is_managed() -> bool:
    """Check if Hermes is running in package-manager-managed mode.

    Two signals are consulted (via get_managed_system): the HERMES_MANAGED
    env var set by the systemd service, and the .managed marker file in
    HERMES_HOME written by the NixOS activation script so interactive
    shells also see it.
    """
    owner = get_managed_system()
    return owner is not None
def get_managed_update_command() -> Optional[str]:
    """Return the preferred upgrade command for a managed install.

    Returns None when the install is unmanaged or the manager is unknown.
    """
    # Dispatch on the canonical manager name; unknown/None falls through to None.
    upgrade_commands = {
        "Homebrew": "brew upgrade hermes-agent",
        "NixOS": "sudo nixos-rebuild switch",
    }
    return upgrade_commands.get(get_managed_system())
def recommended_update_command() -> str:
    """Return the best update command for the current installation."""
    managed_cmd = get_managed_update_command()
    if managed_cmd:
        return managed_cmd
    # Unmanaged installs update themselves through the built-in updater.
    return "hermes update"
def format_managed_message(action: str = "modify this Hermes installation") -> str:
    """Build a user-facing error for managed installs.

    Args:
        action: Verb phrase describing what was attempted; spliced into the
            "Cannot {action}: ..." lead sentence.

    Returns:
        A multi-line message naming the owning package manager and the
        correct upgrade/rebuild command for it.
    """
    managed_system = get_managed_system() or "a package manager"
    # Echo back what HERMES_MANAGED is set to so users can see where the
    # managed-mode detection came from.
    raw = os.getenv("HERMES_MANAGED", "").strip().lower()
    if managed_system == "NixOS":
        # Bare truthy spellings render as "true"; `raw or "true"` also covers
        # the marker-file case where the env var is empty.
        env_hint = "true" if raw in _MANAGED_TRUE_VALUES else raw or "true"
        return (
            f"Cannot {action}: this Hermes installation is managed by NixOS "
            f"(HERMES_MANAGED={env_hint}).\n"
            "Edit services.hermes-agent.settings in your configuration.nix and run:\n"
            " sudo nixos-rebuild switch"
        )
    if managed_system == "Homebrew":
        env_hint = raw or "homebrew"
        return (
            f"Cannot {action}: this Hermes installation is managed by Homebrew "
            f"(HERMES_MANAGED={env_hint}).\n"
            "Use:\n"
            " brew upgrade hermes-agent"
        )
    # Unknown/custom manager — generic guidance only.
    return (
        f"Cannot {action}: this Hermes installation is managed by {managed_system}.\n"
        "Use your package manager to upgrade or reinstall Hermes."
    )
def managed_error(action: str = "modify configuration"):
    """Print a user-friendly managed-mode error to stderr."""
    message = format_managed_message(action)
    print(message, file=sys.stderr)
# =============================================================================
# Container-aware CLI (NixOS container mode)
# =============================================================================
def get_container_exec_info() -> Optional[dict]:
    """Read container mode metadata from HERMES_HOME/.container-mode.

    Returns a dict with keys: backend, container_name, exec_user, hermes_bin
    or None if container mode is not active, we're already inside the
    container, or HERMES_DEV=1 is set.

    The .container-mode file is written by the NixOS activation script when
    container.enable = true. It tells the host CLI to exec into the container
    instead of running locally.
    """
    if os.environ.get("HERMES_DEV") == "1":
        return None
    from hermes_constants import is_container
    if is_container():
        return None
    marker_path = get_hermes_home() / ".container-mode"
    parsed = {}
    try:
        with open(marker_path, "r") as fh:
            for raw_line in fh:
                entry = raw_line.strip()
                # Skip comments and anything that isn't a KEY=VALUE pair.
                if entry.startswith("#") or "=" not in entry:
                    continue
                key, _, value = entry.partition("=")
                parsed[key.strip()] = value.strip()
    except FileNotFoundError:
        return None
    # All other exceptions (PermissionError, malformed data, etc.) propagate.
    defaults = {
        "backend": "docker",
        "container_name": "hermes-agent",
        "exec_user": "hermes",
        "hermes_bin": "/data/current-package/bin/hermes",
    }
    return {field: parsed.get(field, fallback) for field, fallback in defaults.items()}
# =============================================================================
# Config paths
# =============================================================================
# Re-export from hermes_constants — canonical definition lives there.
from hermes_constants import get_hermes_home # noqa: F811,E402
from utils import atomic_replace
def get_config_path() -> Path:
    """Get the main config file path."""
    # config.yaml lives directly under HERMES_HOME (~/.hermes by default).
    return get_hermes_home().joinpath("config.yaml")
def get_env_path() -> Path:
    """Get the .env file path (for API keys)."""
    # Secrets are kept out of config.yaml, in a sibling dotfile.
    return get_hermes_home().joinpath(".env")
def get_project_root() -> Path:
    """Get the project installation directory (two levels above this file)."""
    # parents[1] is exactly parent.parent; resolve() normalises symlinks last,
    # matching the original parent.parent.resolve() ordering.
    return Path(__file__).parents[1].resolve()
def _secure_dir(path):
    """Set directory to owner-only access (0700 by default). No-op on Windows.

    Skipped in managed mode — the NixOS module sets group-readable
    permissions (0750) so interactive users in the hermes group can
    share state with the gateway service.

    The mode can be overridden via the HERMES_HOME_MODE environment variable
    (e.g. HERMES_HOME_MODE=0701) for deployments where a web server (nginx,
    caddy, etc.) needs to traverse HERMES_HOME to reach a served
    subdirectory; the execute-only bit on a directory permits cd-through
    without exposing directory listings.
    """
    if is_managed():
        return
    mode = 0o700
    raw_mode = os.environ.get("HERMES_HOME_MODE", "").strip()
    if raw_mode:
        try:
            # Octal string, e.g. "0701" or "700".
            mode = int(raw_mode, 8)
        except ValueError:
            mode = 0o700
    try:
        os.chmod(path, mode)
    except (OSError, NotImplementedError):
        # Best-effort: unsupported filesystems / platforms are tolerated.
        pass
def _is_container() -> bool:
"""Detect if we're running inside a Docker/Podman/LXC container.
When Hermes runs in a container with volume-mounted config files, forcing
0o600 permissions breaks multi-process setups where the gateway and
dashboard run as different UIDs or the volume mount requires broader
permissions.
"""
# Explicit opt-out
if os.environ.get("HERMES_CONTAINER") or os.environ.get("HERMES_SKIP_CHMOD"):
return True
# Docker / Podman marker file
if os.path.exists("/.dockerenv"):
return True
# LXC / cgroup-based detection
try:
with open("/proc/1/cgroup", "r") as f:
cgroup_content = f.read()
if "docker" in cgroup_content or "lxc" in cgroup_content or "kubepods" in cgroup_content:
return True
except (OSError, IOError):
pass
return False
def _secure_file(path):
    """Set file to owner-only read/write (0600). No-op on Windows.

    Skipped in managed mode — the NixOS activation script sets
    group-readable permissions (0640) on config files.
    Skipped in containers — Docker/Podman volume mounts often need broader
    permissions. Set HERMES_SKIP_CHMOD=1 to force-skip on other systems.
    """
    if is_managed() or _is_container():
        return
    target = str(path)
    try:
        if not os.path.exists(target):
            return
        os.chmod(path, 0o600)
    except (OSError, NotImplementedError):
        # Best-effort: tolerate filesystems that reject chmod.
        pass
def _ensure_default_soul_md(home: Path) -> None:
    """Seed a default SOUL.md into HERMES_HOME if the user doesn't have one yet."""
    target = home / "SOUL.md"
    if target.exists():
        # Never clobber a user-customised SOUL.md.
        return
    target.write_text(DEFAULT_SOUL_MD, encoding="utf-8")
    _secure_file(target)
def ensure_hermes_home():
    """Ensure ~/.hermes directory structure exists with secure permissions.

    In managed mode (NixOS), dirs are created by the activation script with
    setgid + group-writable (2770). We skip mkdir and set umask(0o007) so
    any files created (e.g. SOUL.md) are group-writable (0660).
    """
    home = get_hermes_home()
    if is_managed():
        # Temporarily relax the umask so seeded files come out group-writable;
        # the finally block restores it even if verification raises.
        old_umask = os.umask(0o007)
        try:
            _ensure_hermes_home_managed(home)
        finally:
            os.umask(old_umask)
    else:
        home.mkdir(parents=True, exist_ok=True)
        _secure_dir(home)
        # Standard subdirectory layout; each dir is locked down individually.
        for subdir in ("cron", "sessions", "logs", "logs/curator", "memories"):
            d = home / subdir
            d.mkdir(parents=True, exist_ok=True)
            _secure_dir(d)
        _ensure_default_soul_md(home)
def _ensure_hermes_home_managed(home: Path):
"""Managed-mode variant: verify dirs exist (activation creates them), seed SOUL.md."""
if not home.is_dir():
raise RuntimeError(
f"HERMES_HOME {home} does not exist. "
"Run 'sudo nixos-rebuild switch' first."
)
for subdir in ("cron", "sessions", "logs", "memories"):
d = home / subdir
if not d.is_dir():
raise RuntimeError(
f"{d} does not exist. "
"Run 'sudo nixos-rebuild switch' first."
)
# Curator reports dir is a sub-path of logs/; create it if missing.
# In managed mode the activation script may not know about this subdir,
# so we mkdir it ourselves (it's inside an already-secured logs/ dir).
(home / "logs" / "curator").mkdir(parents=True, exist_ok=True)
# Inside umask(0o007) scope — SOUL.md will be created as 0660
_ensure_default_soul_md(home)
# =============================================================================
# Config loading/saving
# =============================================================================
DEFAULT_CONFIG = {
"model": "",
"providers": {},
"fallback_providers": [],
"credential_pool_strategies": {},
"toolsets": ["hermes-cli"],
"agent": {
"max_turns": 90,
# Inactivity timeout for gateway agent execution (seconds).
# The agent can run indefinitely as long as it's actively calling
# tools or receiving API responses. Only fires when the agent has
# been completely idle for this duration. 0 = unlimited.
"gateway_timeout": 1800,
# Graceful drain timeout for gateway stop/restart (seconds).
# The gateway stops accepting new work, waits for running agents
# to finish, then interrupts any remaining runs after the timeout.
# 0 = no drain, interrupt immediately.
#
# 180s is calibrated for realistic in-flight agent turns: a typical
# coding conversation mid-reasoning runs 60–150s per call, so a 60s
# budget routinely interrupted legitimate work on /restart. Raise
# further in config.yaml if you run very-long-reasoning models.
"restart_drain_timeout": 180,
# Max app-level retry attempts for API errors (connection drops,
# provider timeouts, 5xx, etc.) before the agent surfaces the
# failure. The OpenAI SDK already does its own low-level retries
# (max_retries=2 default) for transient network errors; this is
# the Hermes-level retry loop that wraps the whole call. Lower
# this to 1 if you use fallback providers and want fast failover
# on flaky primaries; raise it if you prefer to tolerate longer
# provider hiccups on a single provider.
"api_max_retries": 3,
"service_tier": "",
# Tool-use enforcement: injects system prompt guidance that tells the
# model to actually call tools instead of describing intended actions.
# Values: "auto" (default — applies to gpt/codex models), true/false
# (force on/off for all models), or a list of model-name substrings
# to match (e.g. ["gpt", "codex", "gemini", "qwen"]).
"tool_use_enforcement": "auto",
# Staged inactivity warning: send a warning to the user at this
# threshold before escalating to a full timeout. The warning fires
# once per run and does not interrupt the agent. 0 = disable warning.
"gateway_timeout_warning": 900,
# Periodic "still working" notification interval (seconds).
# Sends a status message every N seconds so the user knows the
# agent hasn't died during long tasks. 0 = disable notifications.
# Lower values mean faster feedback on slow tasks but more chat
# noise; 180s is a compromise that catches spinning weak-model runs
# (60+ tool iterations with tiny output) before users assume the
# bot is dead and /restart.
"gateway_notify_interval": 180,
# Freshness window for the gateway auto-continue note (seconds).
# After a gateway crash/restart/SIGTERM mid-run, the next user
# message gets a "[System note: your previous turn was
# interrupted — process the unfinished tool result(s) first]"
# prepended so the model picks up where it left off. That's the
# right behaviour while the interruption is fresh, but stale
# markers (transcript last touched hours or days ago) can revive
# an unrelated old task when the user's next message starts new
# work. This window is the max age of the last persisted
# transcript row for which we still inject the continue note.
# Default 3600s comfortably covers a long turn (gateway_timeout
# default is 1800s) plus runtime slack. Set to 0 to disable the
# gate and restore pre-fix behaviour (always inject).
"gateway_auto_continue_freshness": 3600,
# How user-attached images are presented to the main model on each turn.
# "auto" — attach natively when the active model reports
# supports_vision=True AND the user hasn't explicitly
# configured auxiliary.vision.provider. Otherwise fall
# back to text (vision_analyze pre-analysis).
# "native" — always attach natively; non-vision models will either
# error at the provider or get a last-chance text fallback
# (see run_agent._prepare_messages_for_api).
# "text" — always pre-analyze with vision_analyze and prepend the
# description as text; the main model never sees pixels.
# Affects gateway platforms, the TUI, and CLI /attach. vision_analyze
# remains available as a tool regardless of this setting — the routing
# only controls how inbound user images are presented.
"image_input_mode": "auto",
"disabled_toolsets": [],
},
"terminal": {
"backend": "local",
"modal_mode": "auto",
"cwd": ".", # Use current directory
"timeout": 180,
# Environment variables to pass through to sandboxed execution
# (terminal and execute_code). Skill-declared required_environment_variables
# are passed through automatically; this list is for non-skill use cases.
"env_passthrough": [],
# Extra files to source in the login shell when building the
# per-session environment snapshot. Use this when tools like nvm,
# pyenv, asdf, or custom PATH entries are registered by files that
# a bash login shell would skip — most commonly ``~/.bashrc``
# (bash doesn't source bashrc in non-interactive login mode) or
# zsh-specific files like ``~/.zshrc`` / ``~/.zprofile``.
# Paths support ``~`` / ``${VAR}``. Missing files are silently
# skipped. When empty, Hermes auto-sources ``~/.profile``,
# ``~/.bash_profile``, and ``~/.bashrc`` (in that order) if the
# snapshot shell is bash (this is the ``auto_source_bashrc``
# behaviour — disable with that key if you want strict login-only
# semantics).
"shell_init_files": [],
# When true (default), Hermes sources the user's shell rc files
# (``~/.profile``, ``~/.bash_profile``, ``~/.bashrc``) in the
# login shell used to build the environment snapshot. This
# captures PATH additions, shell functions, and aliases — which a
# plain ``bash -l -c`` would otherwise miss because bash skips
# bashrc in non-interactive login mode, and because a default
# Debian/Ubuntu ``~/.bashrc`` short-circuits on non-interactive
# sources. ``~/.profile`` and ``~/.bash_profile`` are tried first
# because ``n`` / ``nvm`` / ``asdf`` installers typically write
# their PATH exports there without an interactivity guard. Turn
# this off if your rc files misbehave when sourced
# non-interactively (e.g. one that hard-exits on TTY checks).
"auto_source_bashrc": True,
"docker_image": "nikolaik/python-nodejs:python3.11-nodejs20",
"docker_forward_env": [],
# Explicit environment variables to set inside Docker containers.
# Unlike docker_forward_env (which reads values from the host process),
# docker_env lets you specify exact key-value pairs — useful when Hermes
# runs as a systemd service without access to the user's shell environment.
# Example: {"SSH_AUTH_SOCK": "/run/user/1000/ssh-agent.sock"}
"docker_env": {},
"singularity_image": "docker://nikolaik/python-nodejs:python3.11-nodejs20",
"modal_image": "nikolaik/python-nodejs:python3.11-nodejs20",
"daytona_image": "nikolaik/python-nodejs:python3.11-nodejs20",
"vercel_runtime": "node24",
# Container resource limits (docker, singularity, modal, daytona, vercel_sandbox — ignored for local/ssh)
"container_cpu": 1,
"container_memory": 5120, # MB (default 5GB)
"container_disk": 51200, # MB (default 50GB)
"container_persistent": True, # Persist filesystem across sessions
# Docker volume mounts — share host directories with the container.
# Each entry is "host_path:container_path" (standard Docker -v syntax).
# Example:
# ["/home/user/projects:/workspace/projects",
# "/home/user/.hermes/cache/documents:/output"]
# For gateway MEDIA delivery, write inside Docker to /output/... and emit
# the host-visible path in MEDIA:, not the container path.
"docker_volumes": [],
# Explicit opt-in: mount the host cwd into /workspace for Docker sessions.
# Default off because passing host directories into a sandbox weakens isolation.
"docker_mount_cwd_to_workspace": False,
# Explicit opt-in: run the Docker container as the host user's uid:gid
# (via `--user`). When enabled, files written into bind-mounted dirs
# (docker_volumes, the persistent workspace, or the auto-mounted cwd)
# are owned by your host user instead of root, which avoids needing
# `sudo chown` after container runs. Default off to preserve behavior
# for images whose entrypoints expect to start as root (e.g. the
# bundled Hermes image, which drops to the `hermes` user via gosu).
# When on, SETUID/SETGID caps are omitted from the container since
# no privilege drop is needed.
"docker_run_as_host_user": False,
# Persistent shell — keep a long-lived bash shell across execute() calls
# so cwd/env vars/shell variables survive between commands.
# Enabled by default for non-local backends (SSH); local is always opt-in
# via TERMINAL_LOCAL_PERSISTENT env var.
"persistent_shell": True,
},
"web": {
"backend": "", # shared fallback — applies to both search and extract
"search_backend": "", # per-capability override for web_search (e.g. "searxng")
"extract_backend": "", # per-capability override for web_extract (e.g. "native")
},
"browser": {
"inactivity_timeout": 120,
"command_timeout": 30, # Timeout for browser commands in seconds (screenshot, navigate, etc.)
"record_sessions": False, # Auto-record browser sessions as WebM videos
"allow_private_urls": False, # Allow navigating to private/internal IPs (localhost, 192.168.x.x, etc.)
# Browser engine for local mode. Passed as ``--engine <value>`` to
# agent-browser v0.25.3+.
# "auto" — use Chrome (default, don't pass --engine at all)
# "lightpanda" — use Lightpanda (1.3-5.8x faster navigation, no screenshots)
# "chrome" — explicitly request Chrome
# Also settable via AGENT_BROWSER_ENGINE env var.
"engine": "auto",
"auto_local_for_private_urls": True, # When a cloud provider is set, auto-spawn local Chromium for LAN/localhost URLs instead of sending them to the cloud
"cdp_url": "", # Optional persistent CDP endpoint for attaching to an existing Chromium/Chrome
# CDP supervisor — dialog + frame detection via a persistent WebSocket.
# Active only when a CDP-capable backend is attached (Browserbase or
# local Chrome via /browser connect). See
# website/docs/developer-guide/browser-supervisor.md.
"dialog_policy": "must_respond", # must_respond | auto_dismiss | auto_accept
"dialog_timeout_s": 300, # Safety auto-dismiss after N seconds under must_respond
"camofox": {
# When true, Hermes sends a stable profile-scoped userId to Camofox
# so the server maps it to a persistent Firefox profile automatically.
# When false (default), each session gets a random userId (ephemeral).
"managed_persistence": False,
},
},
# Filesystem checkpoints — automatic snapshots before destructive file ops.
# When enabled, the agent takes a snapshot of the working directory once
# per conversation turn (on first write_file/patch call). Use /rollback
# to restore.
#
# Defaults changed in v2 (single shared shadow store, real pruning):
# - enabled: True -> False (opt-in; most users never use /rollback)
# - max_snapshots: 50 -> 20 (now actually enforced via ref rewrite)
# - auto_prune: False -> True (orphans/stale pruned automatically)
# Opt in via ``hermes chat --checkpoints`` or set enabled=True here.
"checkpoints": {
"enabled": False,
# Max checkpoints to keep per working directory. Pre-v2 this only
# limited the `/rollback` listing; v2 actually rewrites the ref and
# garbage-collects older commits.
"max_snapshots": 20,
# Hard ceiling on total ``~/.hermes/checkpoints/`` size (MB). When
# exceeded, the oldest checkpoint per project is dropped in a
# round-robin pass until total size falls under the cap.
# 0 disables the size cap.
"max_total_size_mb": 500,
# Skip any single file larger than this when staging a checkpoint.
# Prevents accidental snapshotting of datasets, model weights, and
# other large generated assets. 0 disables the filter.
"max_file_size_mb": 10,
# Auto-maintenance: hermes sweeps the checkpoint base at startup
# (at most once per ``min_interval_hours``) and:
# * deletes project entries whose workdir no longer exists (orphan)
# * deletes project entries whose last_touch is older than
# ``retention_days``
# * GCs the single shared store to reclaim unreachable objects
# * enforces ``max_total_size_mb`` across remaining projects
# * deletes ``legacy-*`` archives older than ``retention_days``
"auto_prune": True,
"retention_days": 7,
"delete_orphans": True,
"min_interval_hours": 24,
},
# Maximum characters returned by a single read_file call. Reads that
# exceed this are rejected with guidance to use offset+limit.
# 100K chars ≈ 25–35K tokens across typical tokenisers.
"file_read_max_chars": 100_000,
# Tool-output truncation thresholds. When terminal output or a
# single read_file page exceeds these limits, Hermes truncates the
# payload sent to the model (keeping head + tail for terminal,
# enforcing pagination for read_file). Tuning these trades context
# footprint against how much raw output the model can see in one
# shot. Ported from anomalyco/opencode PR #23770.
#
# - max_bytes: terminal_tool output cap, in chars
# (default 50_000 ≈ 12-15K tokens).
# - max_lines: read_file pagination cap — the maximum `limit`
# a single read_file call can request before
# being clamped (default 2000).
# - max_line_length: per-line cap applied when read_file emits a
# line-numbered view (default 2000 chars).
"tool_output": {
"max_bytes": 50_000,
"max_lines": 2000,
"max_line_length": 2000,
},
# Tool loop guardrails nudge models when they repeat failed or
# non-progressing tool calls. Soft warnings are always-on by default;
# hard stops are opt-in so interactive CLI/TUI sessions keep flowing.
"tool_loop_guardrails": {
"warnings_enabled": True,
"hard_stop_enabled": False,
"warn_after": {
"exact_failure": 2,
"same_tool_failure": 3,
"idempotent_no_progress": 2,
},
"hard_stop_after": {
"exact_failure": 5,
"same_tool_failure": 8,
"idempotent_no_progress": 5,
},
},
"compression": {
"enabled": True,
"threshold": 0.50, # compress when context usage exceeds this ratio
"target_ratio": 0.20, # fraction of threshold to preserve as recent tail
"protect_last_n": 20, # minimum recent messages to keep uncompressed
"hygiene_hard_message_limit": 400, # gateway session-hygiene force-compress threshold by message count
},
# Anthropic prompt caching (Claude via OpenRouter or native Anthropic API).
# cache_ttl must be "5m" or "1h" (Anthropic-supported tiers); other values are ignored.
"prompt_caching": {
"cache_ttl": "5m",
},
# OpenRouter-specific settings.
# response_cache: enable OpenRouter response caching (X-OpenRouter-Cache header).
# When enabled, identical requests return cached responses for free (zero billing).
# This is separate from Anthropic prompt caching and works alongside it.
# See: https://openrouter.ai/docs/guides/features/response-caching
# response_cache_ttl: how long cached responses remain valid, in seconds (1-86400).
# Default 300 (5 minutes). Only used when response_cache is enabled.
"openrouter": {
"response_cache": True,
"response_cache_ttl": 300,
},
# AWS Bedrock provider configuration.
# Only used when model.provider is "bedrock".
"bedrock": {
"region": "", # AWS region for Bedrock API calls (empty = AWS_REGION env var → us-east-1)
"discovery": {
"enabled": True, # Auto-discover models via ListFoundationModels
"provider_filter": [], # Only show models from these providers (e.g. ["anthropic", "amazon"])
"refresh_interval": 3600, # Cache discovery results for this many seconds
},
"guardrail": {
# Amazon Bedrock Guardrails — content filtering and safety policies.
# Create a guardrail in the Bedrock console, then set the ID and version here.
# See: https://docs.aws.amazon.com/bedrock/latest/userguide/guardrails.html
"guardrail_identifier": "", # e.g. "abc123def456"
"guardrail_version": "", # e.g. "1" or "DRAFT"
"stream_processing_mode": "async", # "sync" or "async"
"trace": "disabled", # "enabled", "disabled", or "enabled_full"
},
},
# Auxiliary model config — provider:model for each side task.
# Format: provider is the provider name, model is the model slug.
# "auto" for provider = auto-detect best available provider.
# Empty model = use provider's default auxiliary model.
# All tasks fall back to openrouter:google/gemini-3-flash-preview if
# the configured provider is unavailable.
"auxiliary": {
"vision": {
"provider": "auto", # auto | openrouter | nous | codex | custom
"model": "", # e.g. "google/gemini-2.5-flash", "gpt-4o"
"base_url": "", # direct OpenAI-compatible endpoint (takes precedence over provider)
"api_key": "", # API key for base_url (falls back to OPENAI_API_KEY)
"timeout": 120, # seconds — LLM API call timeout; vision payloads need generous timeout
"extra_body": {}, # OpenAI-compatible provider-specific request fields
"download_timeout": 30, # seconds — image HTTP download timeout; increase for slow connections
},
"web_extract": {
"provider": "auto",
"model": "",
"base_url": "",
"api_key": "",
"timeout": 360, # seconds (6min) — per-attempt LLM summarization timeout; increase for slow local models
"extra_body": {},
},
"compression": {
"provider": "auto",
"model": "",
"base_url": "",
"api_key": "",
            "timeout": 120,  # seconds — compression summarizes large contexts; increase for local models
"extra_body": {},
},
"session_search": {
"provider": "auto",
"model": "",
"base_url": "",
"api_key": "",
"timeout": 30,
"extra_body": {},
"max_concurrency": 3, # Clamp parallel summaries to avoid request-burst 429s on small providers
},
"skills_hub": {
"provider": "auto",
"model": "",
"base_url": "",
"api_key": "",
"timeout": 30,
"extra_body": {},
},
"approval": {
"provider": "auto",
"model": "", # fast/cheap model recommended (e.g. gemini-flash, haiku)
"base_url": "",
"api_key": "",
"timeout": 30,
"extra_body": {},
},
"mcp": {
"provider": "auto",
"model": "",
"base_url": "",
"api_key": "",
"timeout": 30,
"extra_body": {},
},
"title_generation": {
"provider": "auto",
"model": "",
"base_url": "",
"api_key": "",
"timeout": 30,
"extra_body": {},
},
# Triage specifier — flesh out a rough one-liner in the Kanban
# Triage column into a concrete spec, then promote it to ``todo``.
# Invoked by ``hermes kanban specify`` (single id or --all). Set a
# cheap, capable model here (gemini-flash works well); the main
# model is overkill for short spec expansion.
"triage_specifier": {
"provider": "auto",
"model": "",
"base_url": "",
"api_key": "",
"timeout": 120,
"extra_body": {},
},
# Curator — skill-usage review fork. Timeout is generous because the
# review pass can take several minutes on reasoning models (umbrella
# building over hundreds of candidate skills). "auto" = use main chat
# model; override via `hermes model` → auxiliary → Curator to route
# to a cheaper aux model (e.g. openrouter google/gemini-3-flash-preview).
"curator": {
"provider": "auto",
"model": "",
"base_url": "",
"api_key": "",
"timeout": 600,
"extra_body": {},
},
},
"display": {
"compact": False,
"personality": "kawaii",
"resume_display": "full",
"busy_input_mode": "interrupt", # interrupt | queue | steer
# When true, `hermes --tui` auto-resumes the most recent human-
# facing session on launch instead of forging a fresh one.
# Mirrors `hermes -c` muscle memory. Default off so existing
# users aren't surprised. HERMES_TUI_RESUME=<id> always wins.
"tui_auto_resume_recent": False,
"bell_on_complete": False,
"show_reasoning": False,
"streaming": False,
"final_response_markdown": "strip", # render | strip | raw
# Preserve recent classic CLI output across Ctrl+L, /redraw, and
# terminal resize full-screen clears. Disable if a terminal emulator
# behaves badly with replayed scrollback.
"persistent_output": True,
"persistent_output_max_lines": 200,
"inline_diffs": True, # Show inline diff previews for write actions (write_file, patch, skill_manage)
"show_cost": False, # Show $ cost in the status bar (off by default)
"skin": "default",
# UI language for static user-facing messages (approval prompts, a
# handful of gateway slash-command replies). Does NOT affect agent
# responses, log lines, tool outputs, or slash-command descriptions.
# Supported: en, zh, ja, de, es, fr, tr, uk. Unknown values fall back to en.
"language": "en",
# TUI busy indicator style: kaomoji (default), emoji, unicode (braille
# spinner), or ascii. Live-swappable via `/indicator <style>`.
"tui_status_indicator": "kaomoji",
"user_message_preview": { # CLI: how many submitted user-message lines to echo back in scrollback
"first_lines": 2,
"last_lines": 2,
},
"interim_assistant_messages": True, # Gateway: show natural mid-turn assistant status messages
"tool_progress_command": False, # Enable /verbose command in messaging gateway
"tool_progress_overrides": {}, # DEPRECATED — use display.platforms instead
"tool_preview_length": 0, # Max chars for tool call previews (0 = no limit, show full paths/commands)
# Auto-delete system-notice replies (e.g. "✨ New session started!",
# "♻ Restarting gateway…", "⚡ Stopped…") after N seconds on platforms
# that support message deletion (currently Telegram; other platforms
# ignore and leave the message in place). Only affects slash-command
# replies wrapped with gateway.platforms.base.EphemeralReply — agent
# responses and content messages are never touched. Default 0
# (disabled) preserves prior behavior.
"ephemeral_system_ttl": 0,
"platforms": {}, # Per-platform display overrides: {"telegram": {"tool_progress": "all"}, "slack": {"tool_progress": "off"}}
# Gateway runtime-metadata footer appended to the FINAL message of a turn
# (disabled by default to keep replies minimal). When enabled, renders
# e.g. `model · 68% · ~/projects/hermes`. Per-platform overrides go under
# display.platforms.<platform>.runtime_footer.
"runtime_footer": {
"enabled": False,
"fields": ["model", "context_pct", "cwd"], # Order shown; drop any to hide
},
"copy_shortcut": "auto", # "auto" (platform default) | "ctrl_c" | "ctrl_shift_c" | "disabled"
},
# Web dashboard settings
"dashboard": {
"theme": "default", # Dashboard visual theme: "default", "midnight", "ember", "mono", "cyberpunk", "rose"
},
# Privacy settings
"privacy": {
"redact_pii": False, # When True, hash user IDs and strip phone numbers from LLM context
},
# Text-to-speech configuration
# Each provider supports an optional `max_text_length:` override for the
# per-request input-character cap. Omit it to use the provider's documented
# limit (OpenAI 4096, xAI 15000, MiniMax 10000, ElevenLabs 5k-40k model-aware,
# Gemini 5000, Edge 5000, Mistral 4000, NeuTTS/KittenTTS 2000).
"tts": {
"provider": "edge", # "edge" (free) | "elevenlabs" (premium) | "openai" | "xai" | "minimax" | "mistral" | "gemini" | "neutts" (local) | "kittentts" (local) | "piper" (local)
"edge": {
"voice": "en-US-AriaNeural",
# Popular: AriaNeural, JennyNeural, AndrewNeural, BrianNeural, SoniaNeural
},
"elevenlabs": {
"voice_id": "pNInz6obpgDQGcFmaJgB", # Adam
"model_id": "eleven_multilingual_v2",
},
"openai": {
"model": "gpt-4o-mini-tts",
"voice": "alloy",
# Voices: alloy, echo, fable, onyx, nova, shimmer
},
"xai": {
"voice_id": "eve", # or custom voice ID — see https://docs.x.ai/developers/model-capabilities/audio/custom-voices
"language": "en",
"sample_rate": 24000,
"bit_rate": 128000,
},
"mistral": {
"model": "voxtral-mini-tts-2603",
"voice_id": "c69964a6-ab8b-4f8a-9465-ec0925096ec8", # Paul - Neutral
},
"neutts": {
"ref_audio": "", # Path to reference voice audio (empty = bundled default)
"ref_text": "", # Path to reference voice transcript (empty = bundled default)
"model": "neuphonic/neutts-air-q4-gguf", # HuggingFace model repo
"device": "cpu", # cpu, cuda, or mps
},
"piper": {
# Voice name (e.g. "en_US-lessac-medium") downloaded on first
# use, OR an absolute path to a pre-downloaded .onnx file.
# Full voice list: https://github.com/OHF-Voice/piper1-gpl/blob/main/docs/VOICES.md
"voice": "en_US-lessac-medium",
# "voices_dir": "", # Override voice cache dir; default = ~/.hermes/cache/piper-voices/
# "use_cuda": False, # Requires onnxruntime-gpu
# "length_scale": 1.0, # 2.0 = twice as slow
# "noise_scale": 0.667,
# "noise_w_scale": 0.8,
# "volume": 1.0,
# "normalize_audio": True,
},
},
"stt": {
"enabled": True,
"provider": "local", # "local" (free, faster-whisper) | "groq" | "openai" (Whisper API) | "mistral" (Voxtral Transcribe)
"local": {
"model": "base", # tiny, base, small, medium, large-v3
"language": "", # auto-detect by default; set to "en", "es", "fr", etc. to force
},
"openai": {
"model": "whisper-1", # whisper-1, gpt-4o-mini-transcribe, gpt-4o-transcribe
},
"mistral": {
"model": "voxtral-mini-latest", # voxtral-mini-latest, voxtral-mini-2602
},
},
"voice": {
"record_key": "ctrl+b",
"max_recording_seconds": 120,
"auto_tts": False,
"beep_enabled": True, # Play record start/stop beeps in CLI voice mode
"silence_threshold": 200, # RMS below this = silence (0-32767)
"silence_duration": 3.0, # Seconds of silence before auto-stop
},
"human_delay": {
"mode": "off",
"min_ms": 800,
"max_ms": 2500,
},
# Context engine -- controls how the context window is managed when
# approaching the model's token limit.
# "compressor" = built-in lossy summarization (default).
# Set to a plugin name to activate an alternative engine (e.g. "lcm"
# for Lossless Context Management). The engine must be installed as
# a plugin in plugins/context_engine/<name>/ or ~/.hermes/plugins/.
"context": {
"engine": "compressor",
},
# Persistent memory -- bounded curated memory injected into system prompt
"memory": {
"memory_enabled": True,
"user_profile_enabled": True,
"memory_char_limit": 2200, # ~800 tokens at 2.75 chars/token
"user_char_limit": 1375, # ~500 tokens at 2.75 chars/token
# External memory provider plugin (empty = built-in only).
# Set to a provider name to activate: "openviking", "mem0",
# "hindsight", "holographic", "retaindb", "byterover".
# Only ONE external provider is allowed at a time.
"provider": "",
},
# Subagent delegation — override the provider:model used by delegate_task
# so child agents can run on a different (cheaper/faster) provider and model.
# Uses the same runtime provider resolution as CLI/gateway startup, so all
# configured providers (OpenRouter, Nous, Z.ai, Kimi, etc.) are supported.
"delegation": {
"model": "", # e.g. "google/gemini-3-flash-preview" (empty = inherit parent model)
"provider": "", # e.g. "openrouter" (empty = inherit parent provider + credentials)
"base_url": "", # direct OpenAI-compatible endpoint for subagents
"api_key": "", # API key for delegation.base_url (falls back to OPENAI_API_KEY)
# When delegate_task narrows child toolsets explicitly, preserve any
# MCP toolsets the parent already has enabled. On by default so
# narrowing (e.g. toolsets=["web","browser"]) expresses "I want these
# extras" without silently stripping MCP tools the parent already has.
# Set to false for strict intersection.
"inherit_mcp_toolsets": True,
"max_iterations": 50, # per-subagent iteration cap (each subagent gets its own budget,
# independent of the parent's max_iterations)
"child_timeout_seconds": 600, # wall-clock timeout for each child agent (floor 30s,