|
| 1 | +""" |
| 2 | +Minimal example script for converting a dataset to LeRobot format. |
| 3 | +
|
Originally written for the Libero dataset (stored in RLDS); this copy has been
adapted to convert a custom UR3 dataset stored as per-episode directories of
PNG images and .npy joint states. It can be modified for any other custom format.
| 6 | +
|
| 7 | +Usage: |
| 8 | +uv run examples/libero/convert_libero_data_to_lerobot.py --data_dir /path/to/your/data |
| 9 | +
|
| 10 | +If you want to push your dataset to the Hugging Face Hub, you can use the following command: |
| 11 | +uv run examples/libero/convert_libero_data_to_lerobot.py --data_dir /path/to/your/data --push_to_hub |
| 12 | +
|
Note: the original RLDS conversion path (now commented out in main) requires tensorflow_datasets:
`uv pip install tensorflow tensorflow_datasets`
| 15 | +
|
| 16 | +You can download the raw Libero datasets from https://huggingface.co/datasets/openvla/modified_libero_rlds |
| 17 | +The resulting dataset will get saved to the $HF_LEROBOT_HOME directory. |
| 18 | +Running this conversion script will take approximately 30 minutes. |
| 19 | +""" |
| 20 | +import os |
| 21 | +import shutil |
| 22 | +from pathlib import Path |
| 23 | +from PIL import Image |
| 24 | +import numpy as np |
| 25 | + |
| 26 | +from lerobot.common.datasets.lerobot_dataset import HF_LEROBOT_HOME |
| 27 | +from lerobot.common.datasets.lerobot_dataset import LeRobotDataset |
| 28 | +import tensorflow_datasets as tfds |
| 29 | +import tyro |
| 30 | + |
| 31 | +REPO_NAME = "ur3" # Name of the output dataset, also used for the Hugging Face Hub |
| 32 | +# RAW_DATASET_NAMES = [ |
| 33 | +# "libero_10_no_noops", |
| 34 | +# "libero_goal_no_noops", |
| 35 | +# "libero_object_no_noops", |
| 36 | +# "libero_spatial_no_noops", |
| 37 | +# ] # For simplicity we will combine multiple Libero datasets into one training dataset |
| 38 | + |
| 39 | +RAW_DATASET_NAMES = [ |
| 40 | + "libero_goal_no_noops", |
| 41 | +] |
| 42 | + |
def main(data_dir: str, *, push_to_hub: bool = False, output_dir: "str | None" = None):
    """Convert a custom per-episode UR3 dataset into LeRobot format.

    Expected layout under ``data_dir``: one purely numeric subdirectory per
    episode (``"0"``, ``"1"``, ...), each containing ``joint_states/<j>.npy``
    plus matching ``images/front_images/<j>.png`` and
    ``images/ee_images/<j>.png`` frames.

    Args:
        data_dir: Root directory holding the numeric episode subdirectories.
        push_to_hub: If True, push the finished dataset to the Hugging Face Hub.
        output_dir: Directory wiped before conversion. Defaults to the original
            hard-coded path for backward compatibility.
    """
    # Clean up any existing dataset in the output directory.
    # NOTE(review): LeRobotDataset.create() below is not given a `root`, so it
    # presumably writes under HF_LEROBOT_HOME / REPO_NAME rather than this
    # path — confirm HF_LEROBOT_HOME points here, or pass `root=output_path`.
    output_path = Path(output_dir) if output_dir is not None else Path("/map-vepfs/haoxiao/yijingkun/ur3")
    if output_path.exists():
        shutil.rmtree(output_path)

    # Create LeRobot dataset, define features to store.
    # OpenPi assumes that proprio is stored in `state` and actions in `action`;
    # LeRobot assumes that dtype of image data is `image`.
    dataset = LeRobotDataset.create(
        repo_id=REPO_NAME,
        robot_type="panda",  # NOTE(review): data appears to be UR3 — confirm robot_type
        fps=10,
        features={
            "image": {
                "dtype": "image",
                "shape": (224, 224, 3),
                "names": ["height", "width", "channel"],
            },
            "wrist_image": {
                "dtype": "image",
                "shape": (224, 224, 3),
                "names": ["height", "width", "channel"],
            },
            "state": {
                "dtype": "float32",
                "shape": (8,),
                "names": ["state"],
            },
            "actions": {
                "dtype": "float32",
                "shape": (8,),
                "names": ["actions"],
            },
        },
        image_writer_threads=10,
        image_writer_processes=5,
    )

    # Episode directories are purely numeric; sort numerically, not lexically.
    episode_dirs = [d for d in os.listdir(data_dir) if d.isdigit() and os.path.isdir(os.path.join(data_dir, d))]
    episode_dirs.sort(key=int)

    for episode_dir in episode_dirs:
        i = int(episode_dir)
        episode_path = os.path.join(data_dir, episode_dir)
        joint_states_path = os.path.join(episode_path, 'joint_states')

        # Skip episodes missing their joint_states directory entirely.
        if not os.path.exists(joint_states_path):
            print(f"Skipping episode {i} - joint_states directory not found")
            continue

        # Frame indices are assumed contiguous 0..len_frame-1; individual
        # missing files are still skipped per-frame below.
        len_frame = len(os.listdir(joint_states_path))
        episode_frame_count = 0

        for j in range(len_frame):
            try:
                front_img_path = f'{episode_path}/images/front_images/{j}.png'
                ee_img_path = f'{episode_path}/images/ee_images/{j}.png'
                joint_state_path = f'{episode_path}/joint_states/{j}.npy'

                # Check that all three files for this frame exist.
                if not all(os.path.exists(path) for path in (front_img_path, ee_img_path, joint_state_path)):
                    print(f"Skipping episode {i}, frame {j} - missing files")
                    continue

                # Use context managers so image file handles are closed
                # promptly instead of leaking until GC.
                with Image.open(front_img_path) as img:
                    front_image = np.array(img)
                with Image.open(ee_img_path) as img:
                    ee_image = np.array(img)

                # Load the joint vector once (the original loaded the same file
                # twice) and insert a 0.0 placeholder at index 6 to produce the
                # 8-dim state/actions declared above.
                # NOTE(review): assumes the .npy holds a 7-element vector — confirm.
                joint = np.insert(np.load(joint_state_path).astype(np.float32), 6, 0.0)
                state = joint
                actions = joint.copy()  # distinct array, matching the original's two loads

                dataset.add_frame(
                    {
                        "image": front_image,
                        "wrist_image": ee_image,
                        "state": state,
                        "actions": actions,
                        "task": "pick up the red cube and place on the top of blue cube",
                    }
                )
                episode_frame_count += 1
            except (OSError, IOError) as e:
                print(f"Skipping corrupted image at episode {i}, frame {j}: {e}")
                continue

        # Only save the episode if at least one valid frame was added.
        if episode_frame_count > 0:
            dataset.save_episode()
            print(f"Saved episode {i} with {episode_frame_count} frames")
        else:
            print(f"Skipping episode {i} - no valid frames")

    # Optionally push to the Hugging Face Hub.
    if push_to_hub:
        dataset.push_to_hub(
            tags=["libero", "panda", "rlds"],
            private=False,
            push_videos=True,
            license="apache-2.0",
        )
| 168 | + |
| 169 | + |
| 170 | +if __name__ == "__main__": |
| 171 | + tyro.cli(main) |
0 commit comments