Files
hermes-agent/environments/pwncollege_env/process_config.yaml
Hermes Agent a1f9961f51 feat: add disable_secret_redaction config for RL environments
Adds a new disable_secret_redaction field to HermesAgentEnvConfig that,
when enabled, sets HERMES_REDACT_SECRETS=false. This prevents the secret
redactor from mangling source code that contains password fields (e.g.
Flask apps in web-security challenges).

Follows the same pattern as disable_command_guards -> HERMES_YOLO_MODE.
2026-03-31 16:19:22 +00:00

55 lines
1.4 KiB
YAML

# Process-mode run configuration for the pwn.college environment.
#
# Layout: `env` holds the environment settings, `openai` is a list of
# inference-server entries, and `slurm` / `testing` are top-level switches.
# NOTE(review): nesting was reconstructed from key grouping; `health_check`
# is assumed to belong to the server entry and `slurm` / `testing` to the
# top level — confirm against the config schema.
env:
  # Breadth: total items to process (>= 842 challenges in dojo)
  total_steps: 850
  # Depth: completions per item (1 = max coverage speed)
  group_size: 1
  # Concurrency: match dojo max_instances (16 slots)
  eval_concurrency: 16
  max_agent_turns: 30
  max_token_length: 16384
  agent_temperature: 0.7
  enabled_toolsets:
    - terminal
    - file
    - pwncollege
  terminal_backend: ssh
  terminal_timeout: 120
  terminal_lifetime: 3600
  # Maps to HERMES_YOLO_MODE (per the change that introduced the flag below).
  disable_command_guards: true
  # Sets HERMES_REDACT_SECRETS=false so the secret redactor does not alter
  # source code containing password fields (e.g. Flask apps in web-security
  # challenges).
  disable_secret_redaction: true
  tool_call_parser: hermes

  # Dojo connection
  base_url: http://100.120.55.25:8080
  ssh_host: 100.120.55.25
  ssh_port: 2222
  ssh_key: ""

  # Challenge selection: both filters are null, i.e. no filtering.
  # NOTE(review): `challenge` is pinned to hello/hello, which looks at odds
  # with processing every challenge — confirm whether process mode ignores
  # this field or whether it should be cleared.
  challenge: hello/hello
  dojo_filter: null
  module_filter: null

  # Output
  data_path_to_save_groups: environments/pwncollege_env/eval_runs/process_all.jsonl
  data_dir_to_save_evals: environments/pwncollege_env/eval_runs/process_all
  ensure_scores_are_not_same: false
  include_messages: true
  use_wandb: false
  wandb_name: pwncollege-process

  # Not needed for process mode but required by config schema
  tokenizer_name: NousResearch/Hermes-3-Llama-3.1-8B
  rollout_server_url: http://localhost:8000

# Inference server(s) used for completions; a single OpenRouter entry.
openai:
  - timeout: 1200
    num_max_requests_at_once: 128
    model_name: xiaomi/mimo-v2-flash
    server_type: openai
    # Left empty here; do not commit a real key to version control.
    api_key: ""
    base_url: https://openrouter.ai/api/v1
    health_check: false

slurm: false
testing: false