# Mirror of https://github.com/microsoft/SkillOpt.git
# Synced 2026-07-03 14:02:58 +08:00
# 35 lines, 599 B, YAML
# Experiment configuration for the `spreadsheetbench` environment.
# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# section membership follows the original blank-line grouping — confirm
# against the upstream file.

# Parent config this file builds on (presumably keys below override it;
# verify against the config loader).
_base_: ../_base_/default.yaml

model:
  reasoning_effort: medium

train:
  train_size: 80
  batch_size: 40
  accumulation: 1

gradient:
  minibatch_size: 8
  merge_batch_size: 8

optimizer:
  learning_rate: 4

evaluation:
  # Both counts are zero here — presumably this disables selection/test
  # evaluation environments; TODO confirm.
  sel_env_num: 0
  test_env_num: 0

env:
  name: spreadsheetbench
  skill_init: skillopt/envs/spreadsheetbench/skills/initial.md
  split_mode: split_dir
  split_dir: data/spreadsheetbench_split
  # Explicit empty strings (not null).
  data_path: ""
  split_output_dir: ""
  data_root: data/spreadsheetbench_verified_400
  mode: multi
  max_turns: 30
  max_completion_tokens: 16384
  # Unit not stated in this file — presumably seconds; verify.
  exec_timeout: 600
  workers: 24