From 4bdd2475b00041b637b08aec75ffeb7cd6a5c430 Mon Sep 17 00:00:00 2001
From: Martino Russi <nopyeps@gmail.com>
Date: Thu, 27 Nov 2025 10:22:11 +0100
Subject: [PATCH] complete work

---
 .../robots/unitree_g1/arm_calibration.json    |   2 +-
 .../robots/unitree_g1/config_unitree_g1.py    |  22 +-
 src/lerobot/robots/unitree_g1/unitree_g1.py   | 694 +++++++++++++++++-
 3 files changed, 702 insertions(+), 16 deletions(-)

diff --git a/src/lerobot/robots/unitree_g1/arm_calibration.json b/src/lerobot/robots/unitree_g1/arm_calibration.json
index 55fdbfa6e..1220f992c 100644
--- a/src/lerobot/robots/unitree_g1/arm_calibration.json
+++ b/src/lerobot/robots/unitree_g1/arm_calibration.json
@@ -75,7 +75,7 @@
         "drive_mode": 0,
         "homing_offset": 0,
         "range_min": -2.2,
-        "range_max": 0.1
+        "range_max": 0.5
     },
     "kRightElbow.pos": {
         "id": 3,
diff --git a/src/lerobot/robots/unitree_g1/config_unitree_g1.py b/src/lerobot/robots/unitree_g1/config_unitree_g1.py
index a7d56b705..1d1e5633e 100644
--- a/src/lerobot/robots/unitree_g1/config_unitree_g1.py
+++ b/src/lerobot/robots/unitree_g1/config_unitree_g1.py
@@ -25,6 +25,7 @@ from ..config import RobotConfig
 @dataclass
 class UnitreeG1Config(RobotConfig):
    # id: str = "unitree_g1"
+    motion_mode: bool = False
     simulation_mode: bool = True
     kp_high = 40.0
     kd_high = 3.0
@@ -40,9 +41,12 @@ class UnitreeG1Config(RobotConfig):
     arm_velocity_limit = 100.0
     control_dt = 1.0 / 250.0
 
+    speed_gradual_max: bool = False
     gradual_start_time: float | None = None
     gradual_time: float | None = None
 
+    audio_client: bool = True
+
     freeze_body: bool = False
     gravity_compensation: bool = True
 
@@ -52,7 +56,7 @@ class UnitreeG1Config(RobotConfig):
     # This robot class ONLY uses sockets to communicate with a bridge on the Orin
     # Run 'python dds_to_socket.py' on the Orin first, then set this to the Orin's IP
     # Example: socket_host="192.168.123.164" (Orin's wlan0 IP)
-    socket_host: str | None = None# = "172.18.129.215"
+    socket_host: str | None = None # = "172.18.129.215"#
     socket_port: int | None = None
 
     # Locomotion control
@@ -60,12 +64,26 @@ class UnitreeG1Config(RobotConfig):
     #policy_path: str = "src/lerobot/robots/unitree_g1/assets/g1/locomotion/motion.pt"
     policy_path: str = "src/lerobot/robots/unitree_g1/assets/g1/locomotion/GR00T-WholeBodyControl-Walk.onnx"
     
+    # Motion imitation (dance_102, gangnam_style, etc)
+    motion_imitation_control: bool = False
+    motion_policy_path: str = "src/lerobot/robots/unitree_g1/assets/g1/mimic/gangnam_style/policy.onnx"  # Use policy
+    #motion_policy_path: str = None  # Set to None for direct playback mode (no policy)
+    motion_file_path: str = "src/lerobot/robots/unitree_g1/assets/g1/mimic/gangnam_style/G1_gangnam_style_V01.bvh_60hz.csv"
+    motion_fps: float = 60.0
+    motion_control_dt: float = 0.02
+
+    motion_joint_ids_map: list = field(default_factory=lambda: [0, 6, 12, 1, 7, 13, 2, 8, 14, 3, 9, 15, 22, 4, 10, 16, 23, 5, 11, 17, 24, 18, 25, 19, 26, 20, 27, 21, 28])
+    motion_stiffness: list = field(default_factory=lambda: [40.2, 99.1, 40.2, 99.1, 28.5, 28.5, 40.2, 99.1, 40.2, 99.1, 28.5, 28.5, 40.2, 28.5, 28.5, 14.3, 14.3, 14.3, 14.3, 14.3, 16.8, 16.8, 14.3, 14.3, 14.3, 14.3, 14.3, 16.8, 16.8])
+    motion_damping: list = field(default_factory=lambda: [2.56, 6.31, 2.56, 6.31, 1.81, 1.81, 2.56, 6.31, 2.56, 6.31, 1.81, 1.81, 2.56, 1.81, 1.81, 0.907, 0.907, 0.907, 0.907, 0.907, 1.07, 1.07, 0.907, 0.907, 0.907, 0.907, 0.907, 1.07, 1.07])
+    motion_default_joint_pos: list = field(default_factory=lambda: [-0.302, -0.319, 0.00124, 0.000442, 0.00489, 0.00191, 0.00929, 0.00796, 0.00546, 0.672, 0.67, 0.2, 0.202, -0.368, -0.355, 0.194, -0.196, -0.00644, 0.00976, 0.00258, -0.00029, 0.605, 0.596, 0.00818, 0.00322, 0.00293, -0.00339, -0.00955, -0.00715])
+    motion_action_scale: list = field(default_factory=lambda: [0.548, 0.548, 0.548, 0.351, 0.351, 0.439, 0.548, 0.548, 0.439, 0.351, 0.351, 0.439, 0.439, 0.439, 0.439, 0.439, 0.439, 0.439, 0.439, 0.439, 0.439, 0.439, 0.439, 0.439, 0.439, 0.0745, 0.0745, 0.0745, 0.0745])
+    
     # Locomotion parameters (from g1.yaml)
     locomotion_control_dt: float = 0.02
     
     leg_joint2motor_idx: list = field(default_factory=lambda: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11])
     locomotion_kps: list = field(default_factory=lambda: [150, 150, 150, 300, 40, 40, 150, 150, 150, 300, 40, 40])
-    locomotion_kds: list = field(default_factory=lambda: [2, 2, 2, 4, 2, 2, 2, 2, 2, 4, 2, 2])
+    locomotion_kds: list = field(default_factory=lambda: [6, 6, 6, 4, 2, 2, 6, 6, 6, 4, 2, 2])
     default_leg_angles: list = field(default_factory=lambda: [-0.1, 0.0, 0.0, 0.3, -0.2, 0.0, -0.1, 0.0, 0.0, 0.3, -0.2, 0.0])
 
     arm_waist_joint2motor_idx: list = field(default_factory=lambda: [12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28])
diff --git a/src/lerobot/robots/unitree_g1/unitree_g1.py b/src/lerobot/robots/unitree_g1/unitree_g1.py
index 79566b0a7..a8e9ec471 100644
--- a/src/lerobot/robots/unitree_g1/unitree_g1.py
+++ b/src/lerobot/robots/unitree_g1/unitree_g1.py
@@ -30,6 +30,7 @@ import onnxruntime as ort
 from unitree_sdk2py.idl.unitree_hg.msg.dds_ import LowCmd_ as hg_LowCmd, LowState_ as hg_LowState  # idl for g1, h1_2
 from unitree_sdk2py.idl.default import unitree_hg_msg_dds__LowCmd_
 from unitree_sdk2py.utils.crc import CRC
+from unitree_sdk2py.g1.audio.g1_audio_client import AudioClient
 from unitree_sdk2py.comm.motion_switcher.motion_switcher_client import (
     MotionSwitcherClient,
 )
@@ -45,6 +46,7 @@ import torch
 logger = logging.getLogger(__name__)
 
 kTopicLowCommand_Debug = "rt/lowcmd"
+kTopicLowCommand_Motion = "rt/arm_sdk"
 kTopicLowState = "rt/lowstate"
 
 G1_29_Num_Motors = 35
@@ -89,6 +91,8 @@ class DataBuffer:
         with self.lock:
             self.data = data
 
+#eventually observations should be everything: motor torques etc etc 
+#motor class for unitree? 
 class UnitreeG1(Robot):
 
     config_class = UnitreeG1Config
@@ -103,6 +107,7 @@ class UnitreeG1(Robot):
         self.cameras = make_cameras_from_configs(config.cameras)
         self.q_target = np.zeros(14)
         self.tauff_target = np.zeros(14)
+        self.motion_mode = config.motion_mode
         self.simulation_mode = config.simulation_mode
         self.kp_high = config.kp_high
         self.kd_high = config.kd_high
@@ -115,6 +120,7 @@ class UnitreeG1(Robot):
         self.arm_velocity_limit = config.arm_velocity_limit
         self.control_dt = config.control_dt
 
+        self._speed_gradual_max = config.speed_gradual_max
         self._gradual_start_time = config.gradual_start_time
         self._gradual_time = config.gradual_time
 
@@ -126,6 +132,7 @@ class UnitreeG1(Robot):
         self.freeze_body = config.freeze_body
         self.gravity_compensation = config.gravity_compensation
 
+
         self.calibrated = False
 
         self.calibrate()
@@ -155,15 +162,16 @@ class UnitreeG1(Robot):
         # initialize lowcmd nd lowstate subscriber
         if self.simulation_mode:
             ChannelFactoryInitialize(0, "lo")
-
             logger.info("Launching MuJoCo simulation environment...")
             self.mujoco_env = make_env("lerobot/unitree-g1-mujoco", trust_remote_code=True)
             logger.info("MuJoCo environment launched successfully!")
         else:
             ChannelFactoryInitialize(0)
 
-        # Always use debug mode (direct motor control)
-        self.lowcmd_publisher = ChannelPublisher(kTopicLowCommand_Debug, hg_LowCmd)
+        if self.motion_mode:
+            self.lowcmd_publisher = ChannelPublisher(kTopicLowCommand_Motion, hg_LowCmd)
+        else:
+            self.lowcmd_publisher = ChannelPublisher(kTopicLowCommand_Debug, hg_LowCmd)
         self.lowcmd_publisher.Init()
         self.lowstate_subscriber = ChannelSubscriber(kTopicLowState, hg_LowState)
         self.lowstate_subscriber.Init()
@@ -209,7 +217,13 @@ class UnitreeG1(Robot):
                     self.msg.motor_cmd[id].kp = self.kp_high
                     self.msg.motor_cmd[id].kd = self.kd_high
             self.msg.motor_cmd[id].q = self.all_motor_q[id]
-        #print current motor q, kp, kd
+
+        if config.audio_client:
+            pass
+            # self.audio_client = AudioClient()
+            # self.audio_client.SetTimeout(10.0)
+            # self.audio_client.Init()
+            # logger.info("[UnitreeG1] Audio client initialized!")
 
         logger.info("Lock OK!\n") #motors are not locked x
         # for i in range(10000):
@@ -221,24 +235,62 @@ class UnitreeG1(Robot):
         self.keyboard_running = False
         self.locomotion_thread = None
         self.locomotion_running = False
+        self.motion_imitation_thread = None
+        self.motion_imitation_running = False
         
         # Initialize publish thread for arm control
-        # Note: This thread runs alongside locomotion thread
+        # Note: This thread runs alongside locomotion/motion_imitation threads
         # - Arm thread: controls arms (indices 15-28)
         # - Locomotion thread: controls legs (0-11), waist (12-14)
         # Both update different parts of self.msg, both call Write()
         self.publish_thread = None
         self.ctrl_lock = threading.Lock()
-        self.publish_thread = threading.Thread(target=self._ctrl_motor_state)
-        self.publish_thread.daemon = True
-        self.publish_thread.start()
-        logger.info("Arm control publish thread started")
+        if not config.motion_imitation_control:  # Allow with locomotion, disable only for motion imitation
+            self.publish_thread = threading.Thread(target=self._ctrl_motor_state)
+            self.publish_thread.daemon = True
+            self.publish_thread.start()
+            logger.info("Arm control publish thread started")
 
         # Load locomotion policy if enabled
         self.policy = None
-        self.policy_type = None  # 'torchscript' or 'onnx'
+        self.policy_type = None  # 'torchscript', 'onnx', or 'motion_imitation'
+        self.motion_loader = None
         
-        if config.locomotion_control:
+        if config.motion_imitation_control:
+            # Motion imitation mode (dance, etc.)
+            if config.motion_file_path is None:
+                raise ValueError("motion_imitation_control is True but motion_file_path is not set")
+            
+            logger.info(f"Loading motion reference from {config.motion_file_path}")
+            
+            # Load motion file
+            self.motion_loader = self.MotionLoader(config.motion_file_path, config.motion_fps)
+            
+            # Load ONNX policy (optional for now - can run in direct playback mode)
+            if config.motion_policy_path and Path(config.motion_policy_path).exists():
+                logger.info(f"Loading motion imitation policy from {config.motion_policy_path}")
+                self.policy = ort.InferenceSession(config.motion_policy_path)
+                self.policy_type = 'motion_imitation'
+                logger.info("Motion imitation ONNX policy loaded successfully")
+                logger.info(f"ONNX input: {self.policy.get_inputs()[0].name}, shape: {self.policy.get_inputs()[0].shape}")
+                logger.info(f"ONNX output: {self.policy.get_outputs()[0].name}, shape: {self.policy.get_outputs()[0].shape}")
+            else:
+                logger.info("Running in DIRECT PLAYBACK mode (no policy - just reference motion)")
+                self.policy = None
+                self.policy_type = 'motion_playback'
+            
+            # Initialize motion imitation variables
+            self.motion_counter = 0
+            self.motion_qj_all = np.zeros(29, dtype=np.float32)  # All 29 joints from robot
+            self.motion_dqj_all = np.zeros(29, dtype=np.float32)
+            self.motion_action = np.zeros(29, dtype=np.float32)  # 29D action output
+            self.motion_obs = np.zeros(154, dtype=np.float32)  # 154D observation
+            self.motion_elapsed_time = 0.0
+            
+            # Initialize motion and start
+            self.init_motion_imitation()
+            
+        elif config.locomotion_control:
             if config.policy_path is None:
                 raise ValueError("locomotion_control is True but policy_path is not set")
             
@@ -363,7 +415,12 @@ class UnitreeG1(Robot):
         return cliped_arm_q_target
 
     def _ctrl_motor_state(self):
-        """Arm control thread - publishes commands for arms only."""
+        """Arm control thread - publishes commands for arms only.
+        NOTE: This thread is NOT started when motion_imitation_control or locomotion_control is True.
+        Those modes handle their own publishing."""
+        if self.motion_mode:
+            self.msg.motor_cmd[G1_29_JointIndex.kNotUsedJoint0].q = 1.0
+
         while True:
             start_time = time.time()
             
@@ -395,6 +452,10 @@ class UnitreeG1(Robot):
             self.msg.crc = self.crc.Crc(self.msg)
             self.lowcmd_publisher.Write(self.msg)
 
+            if self._speed_gradual_max is True:
+                t_elapsed = start_time - self._gradual_start_time
+                self.arm_velocity_limit = 20.0 + (10.0 * min(1.0, t_elapsed / 5.0))
+
             current_time = time.time()
             all_t_elapsed = current_time - start_time
             sleep_time = max(0, (self.control_dt - all_t_elapsed))
@@ -424,6 +485,37 @@ class UnitreeG1(Robot):
         """Return current state dq of the left and right arm motors."""
         return np.array([self.lowstate_buffer.GetData().motor_state[id].dq for id in G1_29_JointArmIndex])
 
+    def ctrl_dual_arm_go_home(self):
+        """Move both the left and right arms of the robot to their home position by setting the target joint angles (q) and torques (tau) to zero."""
+        logger.info("[G1_29_ArmController] ctrl_dual_arm_go_home start...")
+        max_attempts = 100
+        current_attempts = 0
+        with self.ctrl_lock:
+            self.q_target = np.zeros(14)
+            #self.q_target[G1_29_JointIndex.kLeftElbow] = 0.5
+            # self.tauff_target = np.zeros(14)
+        tolerance = 0.05  # Tolerance threshold for joint angles to determine "close to zero", can be adjusted based on your motor's precision requirements
+        while current_attempts < max_attempts:
+            current_q = self.get_current_dual_arm_q()
+            if np.all(np.abs(current_q) < tolerance):
+                if self.motion_mode:
+                    for weight in np.linspace(1, 0, num=101):
+                        self.msg.motor_cmd[G1_29_JointIndex.kNotUsedJoint0].q = weight
+                        time.sleep(0.02)
+                logger.info("[G1_29_ArmController] both arms have reached the home position.")
+                break
+            current_attempts += 1
+            time.sleep(0.05)
+
+    def speed_gradual_max(self, t=5.0):
+        """Parameter t is the total time required for arms velocity to gradually increase to its maximum value, in seconds. The default is 5.0."""
+        self._gradual_start_time = time.time()
+        self._gradual_time = t
+        self._speed_gradual_max = True
+
+    def speed_instant_max(self):
+        """set arms velocity to the maximum value immediately, instead of gradually increasing."""
+        self.arm_velocity_limit = 30.0
 
     def _Is_weak_motor(self, motor_index):
         weak_motors = [
@@ -522,6 +614,159 @@ class UnitreeG1(Robot):
             'motors': motors_data,
         }
 
+    def audio_control(self, command, volume: int = 80):
+        """
+        Unified audio/LED control function for the G1 robot.
+        
+        Args:
+            command: Can be one of:
+                - str: Text to speak via TTS
+                - tuple[int, int, int]: RGB values (0-255) for LED control
+                - str (path): Path to WAV file to play
+            volume: Volume level 0-100 (default: 80)
+        
+        Examples:
+            robot.audio_control("Hello world")  # TTS
+            robot.audio_control((255, 0, 0))     # Red LED
+            robot.audio_control("audio.wav")     # Play WAV file
+        """
+        # Set volume
+        self.audio_client.SetVolume(volume)
+        
+        # Detect command type and execute
+        if isinstance(command, tuple) and len(command) == 3:
+            # LED control - RGB tuple
+            r, g, b = command
+            logger.info(f"Setting LED to RGB({r}, {g}, {b})")
+            self.audio_client.LedControl(r, g, b)
+            
+        elif isinstance(command, str):
+            # Check if it's a file path
+            if Path(command).exists():
+                # Play WAV file
+                logger.info(f"Playing audio file: {command}")
+                self._play_wav_file(command)
+            else:
+                # Text-to-speech
+                logger.info(f"Speaking: {command}")
+                self.audio_client.TtsMaker(command, 0)  # 0 for English
+        else:
+            raise ValueError(
+                f"Invalid command type: {type(command)}. "
+                "Expected str (text/path) or tuple[int, int, int] (RGB)"
+            )
+
+    def _read_wav_file(self, filename: str):
+        """Read WAV file and return PCM data as bytes."""
+        with open(filename, 'rb') as f:
+            def read(fmt):
+                return struct.unpack(fmt, f.read(struct.calcsize(fmt)))
+
+            # Read RIFF header
+            chunk_id, = read('<I')
+            if chunk_id != 0x46464952:  # "RIFF"
+                raise ValueError("Not a valid WAV file (invalid RIFF header)")
+
+            _chunk_size, = read('<I')
+            format_tag, = read('<I')
+            if format_tag != 0x45564157:  # "WAVE"
+                raise ValueError("Not a valid WAV file (invalid WAVE format)")
+
+            # Read fmt chunk
+            subchunk1_id, = read('<I')
+            subchunk1_size, = read('<I')
+
+            # Skip JUNK chunk if present
+            if subchunk1_id == 0x4B4E554A:  # "JUNK"
+                f.seek(subchunk1_size, 1)
+                subchunk1_id, = read('<I')
+                subchunk1_size, = read('<I')
+
+            if subchunk1_id != 0x20746D66:  # "fmt "
+                raise ValueError("Invalid fmt chunk")
+
+            if subchunk1_size not in [16, 18]:
+                raise ValueError(f"Unsupported fmt chunk size: {subchunk1_size}")
+
+            audio_format, = read('<H')
+            if audio_format != 1:
+                raise ValueError(f"Only PCM format supported, got format {audio_format}")
+
+            num_channels, = read('<H')
+            sample_rate, = read('<I')
+            _byte_rate, = read('<I')
+            _block_align, = read('<H')
+            bits_per_sample, = read('<H')
+
+            if bits_per_sample != 16:
+                raise ValueError(f"Only 16-bit samples supported, got {bits_per_sample}-bit")
+
+            if sample_rate != 16000:
+                raise ValueError(f"Sample rate must be 16000 Hz, got {sample_rate} Hz")
+
+            if num_channels != 1:
+                raise ValueError(f"Must be mono (1 channel), got {num_channels} channels")
+
+            if subchunk1_size == 18:
+                extra_size, = read('<H')
+                if extra_size != 0:
+                    f.seek(extra_size, 1)
+
+            # Find data chunk
+            while True:
+                subchunk2_id, subchunk2_size = read('<II')
+                if subchunk2_id == 0x61746164:  # "data"
+                    break
+                f.seek(subchunk2_size, 1)
+
+            # Read PCM data
+            raw_pcm = f.read(subchunk2_size)
+            if len(raw_pcm) != subchunk2_size:
+                raise ValueError("Failed to read full PCM data")
+
+            return raw_pcm
+
+    def _play_wav_file(self, filename: str, chunk_size: int = 96000):
+        """
+        Play a WAV file through the robot's speaker.
+        
+        Args:
+            filename: Path to WAV file (must be 16kHz, mono, 16-bit PCM)
+            chunk_size: Bytes per chunk (default: 96000 = ~3 seconds at 16kHz)
+        """
+        # Read WAV file
+        pcm_data = self._read_wav_file(filename)
+        
+        stream_id = str(int(time.time() * 1000))
+        app_name = "lerobot"
+        offset = 0
+        chunk_index = 0
+        total_size = len(pcm_data)
+
+        logger.info(f"Playing audio: {total_size} bytes in {(total_size // chunk_size) + 1} chunks")
+
+        # Send audio in chunks
+        while offset < total_size:
+            remaining = total_size - offset
+            current_chunk_size = min(chunk_size, remaining)
+            chunk = pcm_data[offset:offset + current_chunk_size]
+
+            # Send chunk
+            ret_code, _ = self.audio_client.PlayStream(app_name, stream_id, list(chunk))
+            if ret_code != 0:
+                logger.error(f"Failed to send chunk {chunk_index}, return code: {ret_code}")
+                break
+            else:
+                logger.debug(f"Sent chunk {chunk_index}/{(total_size // chunk_size)}")
+
+            offset += current_chunk_size
+            chunk_index += 1
+            time.sleep(1.0)  # Wait between chunks
+
+        # Calculate playback duration
+        duration_seconds = len(pcm_data) / (16000 * 2)  # 16kHz, 16-bit (2 bytes)
+        logger.info(f"Audio playback will take ~{duration_seconds:.1f} seconds")
+
     def get_observation(self) -> dict[str, Any]:
         obs_array = self.get_current_dual_arm_q()
         obs_dict = {f"{G1_29_JointArmIndex(motor).name}.pos": val for motor, val in zip(G1_29_JointArmIndex, obs_array, strict=True)}
@@ -746,6 +991,78 @@ class UnitreeG1(Robot):
             self.ry = struct.unpack("f", data[12:16])[0]
             self.ly = struct.unpack("f", data[20:24])[0]
     
+    class MotionLoader:
+        """Load and interpolate motion from CSV file for motion imitation."""
+        def __init__(self, motion_file: str, fps: float = 60.0):
+            """Load motion from CSV file.
+            
+            CSV format: [root_pos(3), root_quat_xyzw(4), joint_dof(29)] per row
+            """
+            self.dt = 1.0 / fps
+            
+            # Load CSV
+            data = np.loadtxt(motion_file, delimiter=',')
+            self.num_frames = data.shape[0]
+            self.duration = self.num_frames * self.dt
+            
+            # Split data
+            self.root_positions = data[:, 0:3]  # (N, 3)
+            self.root_quaternions_xyzw = data[:, 3:7]  # (N, 4) [x, y, z, w]
+            self.dof_positions = data[:, 7:]  # (N, 29)
+            
+            # Compute velocities (finite differences)
+            self.dof_velocities = np.diff(self.dof_positions, axis=0, prepend=self.dof_positions[0:1]) / self.dt
+            
+            # Current playback state
+            self.current_time = 0.0
+            self.index_0 = 0
+            self.index_1 = 0
+            self.blend = 0.0
+            
+            logger.info(f"MotionLoader: Loaded {self.num_frames} frames, duration={self.duration:.2f}s")
+            
+        def update(self, time: float):
+            """Update motion to specific time (loops at duration)."""
+            self.current_time = time % self.duration  # Loop
+            phase = self.current_time / self.duration
+            
+            self.index_0 = int(phase * (self.num_frames - 1))
+            self.index_1 = min(self.index_0 + 1, self.num_frames - 1)
+            self.blend = (self.current_time - self.index_0 * self.dt) / self.dt
+            
+        def get_joint_pos(self) -> np.ndarray:
+            """Get interpolated joint positions (29D)."""
+            return self.dof_positions[self.index_0] * (1 - self.blend) + \
+                   self.dof_positions[self.index_1] * self.blend
+        
+        def get_joint_vel(self) -> np.ndarray:
+            """Get interpolated joint velocities (29D)."""
+            return self.dof_velocities[self.index_0] * (1 - self.blend) + \
+                   self.dof_velocities[self.index_1] * self.blend
+        
+        def get_root_quat_wxyz(self) -> np.ndarray:
+            """Get interpolated root quaternion [w, x, y, z]."""
+            # Spherical linear interpolation (SLERP)
+            q0 = self.root_quaternions_xyzw[self.index_0]  # [x, y, z, w]
+            q1 = self.root_quaternions_xyzw[self.index_1]
+            
+            # Convert to scipy format [x, y, z, w]
+            r0 = R.from_quat(q0)
+            r1 = R.from_quat(q1)
+            
+            # SLERP
+            key_times = [0, 1]
+            key_rots = R.from_quat([q0, q1])
+            slerp = R.from_quat(key_rots.as_quat())  # Simplified - just use linear for now
+            
+            # Linear interpolation for simplicity
+            quat_xyzw = q0 * (1 - self.blend) + q1 * self.blend
+            # Normalize
+            quat_xyzw = quat_xyzw / np.linalg.norm(quat_xyzw)
+            
+            # Convert to [w, x, y, z]
+            return np.array([quat_xyzw[3], quat_xyzw[0], quat_xyzw[1], quat_xyzw[2]], dtype=np.float32)
+    
     def locomotion_get_gravity_orientation(self, quaternion):
         """Get gravity orientation from quaternion."""
         qw = quaternion[0]
@@ -1185,7 +1502,10 @@ class UnitreeG1(Robot):
             return
         
         logger.info("Starting locomotion test sequence...")
-
+        
+        # 1. Home the arms first
+        logger.info("Homing arms to zero position...")
+        #self.ctrl_dual_arm_go_home()
 
         # 2. Move legs to default position
         self.locomotion_move_to_default_pos()
@@ -1227,6 +1547,354 @@ class UnitreeG1(Robot):
         logger.info("GR00T locomotion initialization complete! Policy is now running.")
         logger.info("516D observations (86D × 6 frames), 15D actions (legs + waist)")
 
+    def motion_imitation_run(self):
+        """Motion imitation policy loop - tracks reference motion (dance_102, etc)."""
+        self.motion_counter += 1
+        self.motion_elapsed_time = self.motion_counter * self.config.motion_control_dt
+        
+        # Update motion loader to current time
+        self.motion_loader.update(self.motion_elapsed_time)
+        
+        # Get current lowstate
+        lowstate = self.lowstate_buffer.GetData()
+        if lowstate is None:
+            return
+        
+        # Get ALL 29 joint positions and velocities from robot
+        # IMPORTANT: Convert from motor order to BFS order to match reference motion
+        # The C++ code does: robot_bfs[i] = motor[joint_ids_map[i]]
+        for i in range(29):
+            motor_idx = self.config.motion_joint_ids_map[i]
+            self.motion_qj_all[i] = lowstate.motor_state[motor_idx].q
+            self.motion_dqj_all[i] = lowstate.motor_state[motor_idx].dq
+        
+        # ======== 23 DOF MODE CONFIGURATION ========
+        # For real robot - zeros out joints not present in 23 DOF hardware
+        # Waist: yaw(12), pitch(14) | Wrist: L_pitch/yaw(20,21), R_pitch/yaw(27,28)
+        USE_23DOF = True  # Set to True for real robot without these joints
+        JOINTS_TO_ZERO_23DOF = []#12,14,20, 21, 27, 28]#12, 14, 20, 21, 27, 28]#
+        
+        # Apply 23 DOF zeroing to robot observations if enabled
+        if USE_23DOF:
+            for joint_idx in JOINTS_TO_ZERO_23DOF:
+                self.motion_qj_all[joint_idx] = 0.0
+                self.motion_dqj_all[joint_idx] = 0.0
+            if self.motion_counter == 1:
+                logger.info("="*60)
+                logger.info("🤖 23 DOF MODE ENABLED")
+                logger.info(f"   Zeroing joints: {JOINTS_TO_ZERO_23DOF}")
+                logger.info("   Waist: yaw(12), pitch(14)")
+                logger.info("   Wrist L: pitch(20), yaw(21) | Wrist R: pitch(27), yaw(28)")
+                logger.info("   Applied to: robot obs, reference motion, policy actions")
+                logger.info("="*60)
+        
+        # Get IMU data
+        robot_quat = lowstate.imu_state.quaternion  # [w, x, y, z]
+        ang_vel = np.array(lowstate.imu_state.gyroscope, dtype=np.float32)  # 3D
+        
+        if self.policy is None:
+            # DIRECT PLAYBACK MODE (no policy)
+            motion_joint_pos_dfs = self.motion_loader.get_joint_pos()
+            
+            # Zero out missing joints for 23 DOF mode
+            if USE_23DOF:
+                # Convert to BFS to zero out, then convert back
+                motion_joint_pos_bfs_temp = np.zeros(29, dtype=np.float32)
+                for i in range(29):
+                    motion_joint_pos_bfs_temp[i] = motion_joint_pos_dfs[self.config.motion_joint_ids_map[i]]
+                for joint_idx in JOINTS_TO_ZERO_23DOF:
+                    motion_joint_pos_bfs_temp[joint_idx] = 0.0
+                # Convert back to DFS for sending
+                for i in range(29):
+                    motion_joint_pos_dfs[self.config.motion_joint_ids_map[i]] = motion_joint_pos_bfs_temp[i]
+            
+            for i in range(29):
+                motor_idx = self.config.motion_joint_ids_map[i]
+                csv_idx = self.config.motion_joint_ids_map[i]
+                self.msg.motor_cmd[motor_idx].q = motion_joint_pos_dfs[csv_idx]
+                self.msg.motor_cmd[motor_idx].qd = 0
+                self.msg.motor_cmd[motor_idx].kp = self.config.motion_stiffness[motor_idx]
+                self.msg.motor_cmd[motor_idx].kd = self.config.motion_damping[motor_idx]
+                self.msg.motor_cmd[motor_idx].tau = 0
+        else:
+            # POLICY MODE - Full observation construction and inference
+            
+            # ======== DEBUG TEST MODES ========
+            # Mode 1: Direct playback (no policy) - set motion_policy_path = None in config instead
+            # Mode 2: Send default pos (stand still) - TEST_SEND_DEFAULT_POS = True
+            # Mode 3: Policy with zero reference - TEST_WITH_ZEROS = True, TEST_SEND_DEFAULT_POS = False
+            # Mode 4: Policy with real reference - TEST_WITH_ZEROS = False, TEST_SEND_DEFAULT_POS = False
+            TEST_WITH_ZEROS = False  # True = use zero reference motion in observation
+            TEST_SEND_DEFAULT_POS = False  # True = bypass policy and send default pos (stand still)
+            TEST_DIRECT_PLAYBACK = False  # True = bypass policy and send reference motion directly
+            
+            if TEST_DIRECT_PLAYBACK:
+                # DEBUG: Play back reference motion without policy
+                motion_joint_pos_dfs = self.motion_loader.get_joint_pos()  # 29D in DFS order
+                
+                # Zero out missing joints for 23 DOF mode
+                if USE_23DOF:
+                    # Convert to BFS to zero out, then convert back
+                    motion_joint_pos_bfs_temp = np.zeros(29, dtype=np.float32)
+                    for i in range(29):
+                        motion_joint_pos_bfs_temp[i] = motion_joint_pos_dfs[self.config.motion_joint_ids_map[i]]
+                    for joint_idx in JOINTS_TO_ZERO_23DOF:
+                        motion_joint_pos_bfs_temp[joint_idx] = 0.0
+                    # Convert back to DFS for sending
+                    for i in range(29):
+                        motion_joint_pos_dfs[self.config.motion_joint_ids_map[i]] = motion_joint_pos_bfs_temp[i]
+                
+                # Send directly to motors using joint_ids_map (same as direct playback mode)
+                for i in range(29):
+                    motor_idx = self.config.motion_joint_ids_map[i]
+                    csv_idx = self.config.motion_joint_ids_map[i]
+                    self.msg.motor_cmd[motor_idx].q = motion_joint_pos_dfs[csv_idx]
+                    self.msg.motor_cmd[motor_idx].qd = 0
+                    self.msg.motor_cmd[motor_idx].kp = self.config.motion_stiffness[motor_idx]
+                    self.msg.motor_cmd[motor_idx].kd = self.config.motion_damping[motor_idx]
+                    self.msg.motor_cmd[motor_idx].tau = 0
+                
+                if self.motion_counter == 1:
+                    logger.info("="*60)
+                    logger.info("⚠️  DEBUG MODE: DIRECT PLAYBACK (reference motion, no policy)")
+                    logger.info("="*60)
+                
+                target_joint_pos_bfs = None  # Not used in this mode
+                
+            else:
+                # Run observation construction and policy
+                if TEST_WITH_ZEROS:
+                    # Send zeros for reference motion
+                    motion_joint_pos_bfs = np.zeros(29, dtype=np.float32)
+                    motion_joint_vel_bfs = np.zeros(29, dtype=np.float32)
+                    if self.motion_counter == 1:
+                        logger.info("="*60)
+                        logger.info("⚠️  DEBUG MODE: Using ZERO reference motion + RUNNING POLICY")
+                        logger.info("="*60)
+                else:
+                    # Get reference motion (DFS order from CSV)
+                    motion_joint_pos_dfs = self.motion_loader.get_joint_pos()  # 29D
+                    motion_joint_vel_dfs = self.motion_loader.get_joint_vel()  # 29D
+                    
+                    # Convert from DFS to BFS order: bfs[i] = dfs[joint_ids_map[i]]
+                    motion_joint_pos_bfs = np.zeros(29, dtype=np.float32)
+                    motion_joint_vel_bfs = np.zeros(29, dtype=np.float32)
+                    for i in range(29):
+                        motion_joint_pos_bfs[i] = motion_joint_pos_dfs[self.config.motion_joint_ids_map[i]]
+                        motion_joint_vel_bfs[i] = motion_joint_vel_dfs[self.config.motion_joint_ids_map[i]]
+                    
+                    # Zero out missing joints in reference motion for 23 DOF mode
+                    if USE_23DOF:
+                        for joint_idx in JOINTS_TO_ZERO_23DOF:
+                            motion_joint_pos_bfs[joint_idx] = 0.0
+                            motion_joint_vel_bfs[joint_idx] = 0.0
+                
+                # Compute motion_anchor_ori_b (6D rotation matrix representation)
+                motion_quat_wxyz = self.motion_loader.get_root_quat_wxyz()
+                robot_rot = R.from_quat([robot_quat[1], robot_quat[2], robot_quat[3], robot_quat[0]]).as_matrix()
+                motion_rot = R.from_quat([motion_quat_wxyz[1], motion_quat_wxyz[2], motion_quat_wxyz[3], motion_quat_wxyz[0]]).as_matrix()
+                relative_rot = robot_rot.T @ motion_rot
+                motion_anchor_ori_b = np.array([relative_rot[0, 0], relative_rot[0, 1], 
+                                                relative_rot[1, 0], relative_rot[1, 1],
+                                                relative_rot[2, 0], relative_rot[2, 1]], dtype=np.float32)
+                
+                # Compute joint positions and velocities relative to default
+                default_joint_pos = np.array(self.config.motion_default_joint_pos, dtype=np.float32)
+                joint_pos_rel = self.motion_qj_all - default_joint_pos
+                joint_vel_rel = self.motion_dqj_all.copy()
+                
+                # Build 154D observation:
+                # motion_command (58D) = joint_pos (29D) + joint_vel (29D) from reference
+                # motion_anchor_ori_b (6D)
+                # base_ang_vel (3D)
+                # joint_pos_rel (29D)
+                # joint_vel_rel (29D)
+                # last_action (29D)
+                self.motion_obs[0:29] = motion_joint_pos_bfs
+                self.motion_obs[29:58] = motion_joint_vel_bfs
+                self.motion_obs[58:64] = motion_anchor_ori_b
+                self.motion_obs[64:67] = ang_vel
+                self.motion_obs[67:96] = joint_pos_rel
+                self.motion_obs[96:125] = joint_vel_rel
+                self.motion_obs[125:154] = self.motion_action
+                
+                if TEST_SEND_DEFAULT_POS:
+                    # DEBUG: Just send default positions (should make robot stand still)
+                    target_joint_pos_bfs = default_joint_pos.copy()
+                    if self.motion_counter == 1:
+                        logger.info("="*60)
+                        logger.info("⚠️  DEBUG MODE: Sending DEFAULT positions (NO POLICY)")
+                        logger.info("="*60)
+                        logger.info(f"   Default pos BFS[0:5]: {target_joint_pos_bfs[0:5]}")
+                    if self.motion_counter % 50 == 0:
+                        logger.info(f"   [DEFAULT MODE] Sending: [{target_joint_pos_bfs[0]:.4f}, {target_joint_pos_bfs[6]:.4f}, {target_joint_pos_bfs[12]:.4f}]")
+                        logger.info(f"   [DEFAULT MODE] Robot at: [{self.motion_qj_all[0]:.4f}, {self.motion_qj_all[6]:.4f}, {self.motion_qj_all[12]:.4f}]")
+                else:
+                    # Run ONNX policy inference
+                    obs_tensor = torch.from_numpy(self.motion_obs).unsqueeze(0)
+                    ort_inputs = {self.policy.get_inputs()[0].name: obs_tensor.cpu().numpy()}
+                    ort_outs = self.policy.run(None, ort_inputs)
+                    self.motion_action = ort_outs[0].squeeze()  # 29D action in BFS order
+                    
+                    # Zero out missing joints in policy actions for 23 DOF mode
+                    if USE_23DOF:
+                        for joint_idx in JOINTS_TO_ZERO_23DOF:
+                            self.motion_action[joint_idx] = 0.0
+                    
+                    # Process actions: scale and add offset
+                    action_scale = np.array(self.config.motion_action_scale, dtype=np.float32)
+                    target_joint_pos_bfs = default_joint_pos + self.motion_action * action_scale
+                
+                # Send commands to motors: motor[joint_ids_map[i]] = action[i]
+                for i in range(29):
+                    motor_idx = self.config.motion_joint_ids_map[i]
+                    self.msg.motor_cmd[motor_idx].q = target_joint_pos_bfs[i]
+                    self.msg.motor_cmd[motor_idx].qd = 0
+                    self.msg.motor_cmd[motor_idx].kp = self.config.motion_stiffness[motor_idx]
+                    self.msg.motor_cmd[motor_idx].kd = self.config.motion_damping[motor_idx]
+                    self.msg.motor_cmd[motor_idx].tau = 0
+        
+        # Debug print (only when running policy, not in TEST_SEND_DEFAULT_POS or TEST_DIRECT_PLAYBACK mode)
+        if self.motion_counter == 1 and self.policy and not TEST_SEND_DEFAULT_POS and not TEST_DIRECT_PLAYBACK:
+            logger.info("="*60)
+            logger.info("POLICY MODE OBSERVATION CHECK (First iteration)")
+            logger.info("="*60)
+            logger.info(f"Reference motion (BFS) samples: [{motion_joint_pos_bfs[0]:.3f}, {motion_joint_pos_bfs[6]:.3f}, {motion_joint_pos_bfs[12]:.3f}]")
+            logger.info(f"Robot joints (BFS) samples:     [{self.motion_qj_all[0]:.3f}, {self.motion_qj_all[6]:.3f}, {self.motion_qj_all[12]:.3f}]")
+            logger.info(f"Default positions samples:      [{default_joint_pos[0]:.3f}, {default_joint_pos[6]:.3f}, {default_joint_pos[12]:.3f}]")
+            logger.info(f"Joint pos rel samples:          [{joint_pos_rel[0]:.3f}, {joint_pos_rel[6]:.3f}, {joint_pos_rel[12]:.3f}]")
+            logger.info(f"Joint vel rel samples:          [{joint_vel_rel[0]:.3f}, {joint_vel_rel[6]:.3f}, {joint_vel_rel[12]:.3f}]")
+            logger.info(f"Angular velocity:               [{ang_vel[0]:.3f}, {ang_vel[1]:.3f}, {ang_vel[2]:.3f}]")
+            logger.info(f"Motion anchor ori:              [{motion_anchor_ori_b[0]:.3f}, ..., {motion_anchor_ori_b[5]:.3f}]")
+            logger.info(f"Observation breakdown:")
+            logger.info(f"  [0:29]   motion_cmd_pos: range [{self.motion_obs[0:29].min():.3f}, {self.motion_obs[0:29].max():.3f}]")
+            logger.info(f"  [29:58]  motion_cmd_vel: range [{self.motion_obs[29:58].min():.3f}, {self.motion_obs[29:58].max():.3f}]")
+            logger.info(f"  [58:64]  anchor_ori:     range [{self.motion_obs[58:64].min():.3f}, {self.motion_obs[58:64].max():.3f}]")
+            logger.info(f"  [64:67]  ang_vel:        range [{self.motion_obs[64:67].min():.3f}, {self.motion_obs[64:67].max():.3f}]")
+            logger.info(f"  [67:96]  joint_pos_rel:  range [{self.motion_obs[67:96].min():.3f}, {self.motion_obs[67:96].max():.3f}]")
+            logger.info(f"  [96:125] joint_vel_rel:  range [{self.motion_obs[96:125].min():.3f}, {self.motion_obs[96:125].max():.3f}]")
+            logger.info(f"  [125:154] last_action:   range [{self.motion_obs[125:154].min():.3f}, {self.motion_obs[125:154].max():.3f}]")
+            logger.info(f"Full obs range: [{self.motion_obs.min():.3f}, {self.motion_obs.max():.3f}]")
+            logger.info(f"Action output (first): [{self.motion_action.min():.3f}, {self.motion_action.max():.3f}]")
+            logger.info(f"Action scale samples: [{action_scale[0]:.3f}, {action_scale[6]:.3f}, {action_scale[12]:.3f}]")
+            logger.info(f"Target positions samples: [{target_joint_pos_bfs[0]:.3f}, {target_joint_pos_bfs[6]:.3f}, {target_joint_pos_bfs[12]:.3f}]")
+            logger.info("="*60)
+        
+        if self.motion_counter % 50 == 0:
+            if self.policy is None:
+                mode = "DIRECT"
+            elif TEST_DIRECT_PLAYBACK:
+                mode = "DIRECT_DEBUG"
+            elif TEST_SEND_DEFAULT_POS:
+                mode = "DEFAULT_POS"
+            elif TEST_WITH_ZEROS:
+                mode = "POLICY_ZEROS"
+            else:
+                mode = "POLICY"
+            logger.info(f"Motion {mode}: t={self.motion_elapsed_time:.2f}s, frame={self.motion_loader.index_0}/{self.motion_loader.num_frames}")
+            if self.policy and not TEST_SEND_DEFAULT_POS and not TEST_DIRECT_PLAYBACK:
+                logger.info(f"  Policy action range: [{self.motion_action.min():.3f}, {self.motion_action.max():.3f}]")
+                logger.info(f"  Sample actions[0,6,12]: [{self.motion_action[0]:.3f}, {self.motion_action[6]:.3f}, {self.motion_action[12]:.3f}]")
+                logger.info(f"  Target pos (after scale)[0,6,12]: [{target_joint_pos_bfs[0]:.3f}, {target_joint_pos_bfs[6]:.3f}, {target_joint_pos_bfs[12]:.3f}]")
+                logger.info(f"  Robot pos (BFS)[0,6,12]: [{self.motion_qj_all[0]:.3f}, {self.motion_qj_all[6]:.3f}, {self.motion_qj_all[12]:.3f}]")
+        
+        # Send command
+        self.msg.crc = self.crc.Crc(self.msg)
+        self.lowcmd_publisher.Write(self.msg)
+    
+    def _motion_imitation_thread_loop(self):
+        """Background thread that runs the motion imitation policy at specified rate."""
+        logger.info("Motion imitation thread started")
+        while self.motion_imitation_running:
+            start_time = time.time()
+            try:
+                self.motion_imitation_run()
+            except Exception as e:
+                logger.error(f"Error in motion imitation loop: {e}")
+                import traceback
+                traceback.print_exc()
+            
+            # Sleep to maintain control rate
+            elapsed = time.time() - start_time
+            sleep_time = max(0, self.config.motion_control_dt - elapsed)
+            time.sleep(sleep_time)
+        logger.info("Motion imitation thread stopped")
+    
+    def start_motion_imitation_thread(self):
+        """Start the background motion imitation control thread."""
+        if not self.config.motion_imitation_control:
+            logger.warning("motion_imitation_control is False, cannot start thread")
+            return
+        
+        if self.motion_imitation_running:
+            logger.warning("Motion imitation thread already running")
+            return
+        
+        logger.info("Starting motion imitation control thread...")
+        self.motion_imitation_running = True
+        self.motion_imitation_thread = threading.Thread(target=self._motion_imitation_thread_loop, daemon=True)
+        self.motion_imitation_thread.start()
+        logger.info("Motion imitation control thread started!")
+    
+    def stop_motion_imitation_thread(self):
+        """Stop the background motion imitation control thread."""
+        if not self.motion_imitation_running:
+            return
+        
+        logger.info("Stopping motion imitation control thread...")
+        self.motion_imitation_running = False
+        if self.motion_imitation_thread:
+            self.motion_imitation_thread.join(timeout=2.0)
+        logger.info("Motion imitation control thread stopped")
+    
+    def init_motion_imitation(self):
+        """Initialize motion imitation - move to default standing pose and start policy."""
+        if not self.config.motion_imitation_control:
+            logger.warning("motion_imitation_control is False, cannot run initialization")
+            return
+        
+        logger.info("Starting motion imitation initialization...")
+        
+        # Move to default standing position
+        logger.info("Moving to default standing position...")
+        total_time = 3.0
+        num_steps = int(total_time / self.config.motion_control_dt)
+        
+        # Get current positions (in motor order)
+        current_q_motor = self.get_current_motor_q()
+        
+        # target_q is in BFS order from config, need to convert to motor order
+        target_q_bfs = np.array(self.config.motion_default_joint_pos, dtype=np.float32)
+        target_q_motor = np.zeros(29, dtype=np.float32)
+        for i in range(29):
+            motor_idx = self.config.motion_joint_ids_map[i]
+            target_q_motor[motor_idx] = target_q_bfs[i]
+        
+        # Interpolate to target (both in motor order now)
+        for i in range(num_steps):
+            alpha = i / num_steps
+            for motor_idx in range(29):
+                self.msg.motor_cmd[motor_idx].q = current_q_motor[motor_idx] * (1 - alpha) + target_q_motor[motor_idx] * alpha
+                self.msg.motor_cmd[motor_idx].qd = 0
+                self.msg.motor_cmd[motor_idx].kp = self.config.motion_stiffness[motor_idx]
+                self.msg.motor_cmd[motor_idx].kd = self.config.motion_damping[motor_idx]
+                self.msg.motor_cmd[motor_idx].tau = 0
+            self.msg.crc = self.crc.Crc(self.msg)
+            self.lowcmd_publisher.Write(self.msg)
+            time.sleep(self.config.motion_control_dt)
+        
+        logger.info("Reached default position")
+        
+        # Wait 2 seconds
+        time.sleep(2.0)
+        
+        # Start motion imitation policy thread
+        logger.info("Starting motion imitation policy control...")
+        self.start_motion_imitation_thread()
+        
+        logger.info("Motion imitation initialization complete! Policy is now running.")
+        logger.info(f"154D observations, 29D actions. Motion duration: {self.motion_loader.duration:.2f}s")
+
 
 class G1_29_JointArmIndex(IntEnum):
     # Left arm