|
74 | 74 | </tr> |
75 | 75 | </table> |
76 | 76 |
|
| 77 | + <table width="880" border="0" align="center" cellspacing="0" cellpadding="0"> |
| 78 | + <tr style="background-color: var(--highlight-color)"> |
| 79 | + <td style="width:35%; vertical-align:middle; padding-right: 20px;"> |
| 80 | + <div class="image-container"> |
| 81 | + <img src='publications/2025_PLD.gif' width="90%"> |
| 82 | + </div> |
| 83 | + </td> |
| 84 | + <td style="width:65%; vertical-align:middle"> |
| 85 | + <papertitle>Self-Improving Vision-Language-Action Models with Data Generation via Residual RL</papertitle> |
| 86 | + <br> |
| 87 | + Wenli Xiao<sup>*</sup>, Haotian Lin<sup>*</sup>, Andy Peng, Haoru Xue, Tairan He, Yuqi Xie, Fengyuan Hu, Jimmy Wu, Zhengyi Luo, Linxi "Jim" Fan, Guanya Shi, Yuke Zhu |
| 88 | + <br> |
| 89 | + <a href="https://arxiv.org/abs/2511.00091" target="_blank"><i class="far fa-file"></i> paper</a>   |
| 90 | + <a href="https://www.wenlixiao.com/self-improve-VLA-PLD" target="_blank"><i class="fas fa-globe"></i> website</a> |
| 91 | + <p style="margin-top: 5px"><i class="fas fa-comment-dots"></i> TL;DR: Probe, Learn, Distill (PLD): On-policy probing from a base VLA model + off-policy residual RL + distillation for VLA post-training. |
| 92 | + </td> |
| 93 | + </tr> |
| 94 | + </table> |
| 95 | + |
| 96 | + <br> |
| 97 | + |
| 98 | + <table width="880" border="0" align="center" cellspacing="0" cellpadding="0"> |
| 99 | + <tr> |
| 100 | + <td style="width:35%; vertical-align:middle; padding-right: 20px;"> |
| 101 | + <div class="image-container"> |
| 102 | + <img src='publications/2025_TWIST2.gif' width="90%"> |
| 103 | + </div> |
| 104 | + </td> |
| 105 | + <td style="width:65%; vertical-align:middle"> |
| 106 | + <papertitle>TWIST2: Scalable, Portable, and Holistic Humanoid Data Collection System</papertitle> |
| 107 | + <br> |
| 108 | + Yanjie Ze, Siheng Zhao, Weizhuo Wang, Angjoo Kanazawa<sup>†</sup>, Rocky Duan<sup>†</sup>, Pieter Abbeel<sup>†</sup>, Guanya Shi<sup>†</sup>, Jiajun Wu<sup>†</sup>, C. Karen Liu<sup>†</sup> |
| 109 | + <br> |
| 110 | + <a href="https://arxiv.org/abs/2511.02832" target="_blank"><i class="far fa-file"></i> paper</a>   |
| 111 | + <a href="https://yanjieze.com/TWIST2/" target="_blank"><i class="fas fa-globe"></i> website</a>   |
| 112 | + <a href="https://github.com/amazon-far/TWIST2" target="_blank"><i class="fas fa-code"></i> code</a> |
| 113 | + <p style="margin-top: 5px"><i class="fas fa-comment-dots"></i> TL;DR: TWIST2 is a portable whole-body humanoid teleoperation system that enables scalable data collection. |
| 114 | + </td> |
| 115 | + </tr> |
| 116 | + </table> |
| 117 | + |
| 118 | + <br> |
| 119 | + |
| 120 | + <table width="880" border="0" align="center" cellspacing="0" cellpadding="0"> |
| 121 | + <tr> |
| 122 | + <td style="width:35%; vertical-align:middle; padding-right: 20px;"> |
| 123 | + <div class="image-container"> |
| 124 | + <img src='publications/2025_ResMimic.gif' width="90%"> |
| 125 | + </div> |
| 126 | + </td> |
| 127 | + <td style="width:65%; vertical-align:middle"> |
| 128 | + <papertitle>ResMimic: From General Motion Tracking to Humanoid Whole-body Loco-Manipulation via Residual Learning</papertitle> |
| 129 | + <br> |
| 130 | + Siheng Zhao, Yanjie Ze, Yue Wang, C. Karen Liu<sup>†</sup>, Pieter Abbeel<sup>†</sup>, Guanya Shi<sup>†</sup>, Rocky Duan<sup>†</sup> |
| 131 | + <br> |
| 132 | + <a href="https://www.arxiv.org/abs/2510.05070" target="_blank"><i class="far fa-file"></i> paper</a>   |
| 133 | + <a href="https://resmimic.github.io/" target="_blank"><i class="fas fa-globe"></i> website</a> |
| 134 | + <p style="margin-top: 5px"><i class="fas fa-comment-dots"></i> TL;DR: A two-stage humanoid skill learning framework that learns a residual policy on top of a pre-trained general motion tracking policy. |
| 135 | + </td> |
| 136 | + </tr> |
| 137 | + </table> |
| 138 | + |
| 139 | + <br> |
| 140 | + |
77 | 141 | <table width="880" border="0" align="center" cellspacing="0" cellpadding="0"> |
78 | 142 | <tr style="background-color: var(--highlight-color)"> |
79 | 143 | <td style="width:35%; vertical-align:middle; padding-right: 20px;"> |
|
0 commit comments