feat(inference): 添加动作平滑器

2026-02-03 10:32:09 +08:00
parent a977cc4f5e
commit c1ce560b32
2 changed files with 93 additions and 0 deletions
--- a/roboimi/demos/config.yaml
+++ b/roboimi/demos/config.yaml
@@ -38,6 +38,11 @@ episode_len:      # leave empty here by default
 camera_names: []  # leave empty here by default
 xml_dir:          # leave empty here by default
 # action smoothing settings (for GR00T)
 use_action_smoothing: true
 smooth_method: "ema"     # Options: "ema", "moving_avg", "lowpass", "none"
 smooth_alpha: 0.3        # Smoothing factor (0-1), smaller = smoother
 # transformer settings
 batch_size: 15                          
 state_dim: 16            
--- a/roboimi/demos/diana_eval.py
+++ b/roboimi/demos/diana_eval.py
@@ -12,6 +12,71 @@ from roboimi.envs.double_pos_ctrl_env import make_sim_env
 from roboimi.utils.act_ex_utils import sample_transfer_pose
 class ActionSmoother:
    """
    动作平滑器，支持多种平滑策略
    """
    def __init__(self, action_dim, method='ema', alpha=0.3, window_size=5):
        """
        Args:
            action_dim: 动作维度
            method: 平滑方法 ('ema', 'moving_avg', 'lowpass', 'none')
            alpha: EMA 平滑系数 (0-1)，越小越平滑
            window_size: 滑动窗口大小
        """
        self.action_dim = action_dim
        self.method = method
        self.alpha = alpha
        self.window_size = window_size
        self.history = []
        self.prev_action = None
    def smooth(self, action):
        """
        对动作进行平滑处理
        Args:
            action: 当前动作 [action_dim]
        Returns:
            smoothed_action: 平滑后的动作
        """
        if self.method == 'none':
            return action
        if self.method == 'ema':
            # 指数移动平均
            if self.prev_action is None:
                smoothed = action
            else:
                smoothed = self.alpha * action + (1 - self.alpha) * self.prev_action
            self.prev_action = smoothed
            return smoothed
        elif self.method == 'moving_avg':
            # 滑动平均
            self.history.append(action.copy())
            if len(self.history) > self.window_size:
                self.history.pop(0)
            return np.mean(self.history, axis=0)
        elif self.method == 'lowpass':
            # 一阶低通滤波器
            if self.prev_action is None:
                smoothed = action
            else:
                smoothed = self.prev_action + self.alpha * (action - self.prev_action)
            self.prev_action = smoothed
            return smoothed
        else:
            raise ValueError(f"Unknown smoothing method: {self.method}")
    def reset(self):
        """重置平滑器状态"""
        self.history = []
        self.prev_action = None
 #should be added into IOUtils
 def get_image(obs,camera_names):
@@ -57,6 +122,19 @@ def run_episode(config, policy, stats, save_episode,num_rollouts):
    pre_process = lambda s_qpos: (s_qpos - stats['qpos_mean']) / stats['qpos_std']
    post_process = lambda a: a * stats['action_std'] + stats['action_mean']
    box_pos = sample_transfer_pose()
    # 初始化动作平滑器
    action_dim = config['action_dim']
    use_smoothing = config.get('use_action_smoothing', False)
    smooth_method = config.get('smooth_method', 'ema')
    smooth_alpha = config.get('smooth_alpha', 0.3)
    if use_smoothing and config['policy_class'] == "GR00T":
        smoother = ActionSmoother(action_dim, method=smooth_method, alpha=smooth_alpha)
        print(f"Action smoothing enabled: method={smooth_method}, alpha={smooth_alpha}")
    else:
        smoother = None
    for rollout_id in range(num_rollouts):
        print("\nrollout_id===",rollout_id,"\n")
        image_list = []
@@ -64,6 +142,11 @@ def run_episode(config, policy, stats, save_episode,num_rollouts):
        query_frequency = config['policy_config'].get('num_queries', 1)
        print("query_freq =====",query_frequency)
        env.reset(box_pos)
        # 重置平滑器
        if smoother is not None:
            smoother.reset()
        with torch.inference_mode():
            for t in range(700):
                image_list.append(env._get_image_obs()['images'] if 'images' in env._get_image_obs() else {print("img error")})
@@ -83,6 +166,11 @@ def run_episode(config, policy, stats, save_episode,num_rollouts):
                action = post_process(raw_action)
                # 应用动作平滑（仅对 GR00T）
                if smoother is not None:
                    action = smoother.smooth(action)
                print("action == ",action)
                env.step_jnt(action)
                rewards.append(env.rew)