Files
roboimi/roboimi/vla/conf/config.yaml

51 lines
1.8 KiB
YAML
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
defaults:
- agent: resnet_transformer
- data: simpe_robot_dataset
- eval: eval
- _self_
# ====================
# 训练配置
# ====================
train:
# 基础训练参数
batch_size: 16 # 批次大小
lr: 1e-4 # 学习率
max_steps: 100000 # 最大训练步数
device: "cuda" # 设备: "cuda" 或 "cpu"
# 数据加载
num_workers: 12 # DataLoader 工作进程数(调试时设为 0
val_split: 0.0 # 验证集比例;默认使用全量数据训练
seed: 42 # 随机种子(用于数据划分)
# 日志和检查点
log_freq: 100 # 日志记录频率(步数)
save_freq: 2000 # 保存检查点频率(步数)
use_swanlab: false # 是否启用 SwanLab 标量日志
swanlab_project: "roboimi-vla" # SwanLab project 名称
swanlab_run_name: null # 可选的 SwanLab 运行名
rollout_val_freq_epochs: 50 # 每隔多少个 epoch 执行一次 rollout 验证
rollout_validate_on_checkpoint: false # 是否在保存 checkpoint 后立即运行 rollout 验证
rollout_num_episodes: 3 # rollout 验证的回合数
# 学习率调度器(带预热)
warmup_steps: 2000 # 预热步数Transformer建议更长
scheduler_type: "cosine" # 预热后的调度器: "constant" 或 "cosine"
min_lr: 1e-6 # 最小学习率(用于余弦退火)
# 优化器
weight_decay: 1e-5 # 权重衰减L2 正则化)
grad_clip: 1.0 # 梯度裁剪阈值
# 微调配置
pretrained_ckpt: null # 预训练 checkpoint 路径(用于微调),例如: "checkpoints/vla_model_step_8000.pt"
# ====================
# 实验配置
# ====================
experiment:
name: "vla_diffusion" # 实验名称
notes: "" # 实验备注
tags: [] # 实验标签