Skip to content

Commit b2bd6b0

Browse files
committed
Added CDE
1 parent 489ce01 commit b2bd6b0

File tree

4 files changed

+26
-1
lines changed

4 files changed

+26
-1
lines changed

_bibliography/papers.bib

Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,22 @@ @string{iros
6 6
@string{ral = {IEEE Robotics and Automation Letters}}
7 7
@string{tro = {IEEE Transactions on Robotics}}
8 8
@string{ijrr = {The International Journal of Robotics Research}}
9+
@misc{mao2025cde,
10+
title = {CDE: Concept-Driven Exploration for Reinforcement Learning},
11+
author = {Le Mao and Andrew H. Liu and Renos Zabounidis and Zachary Kingston and Joseph Campbell},
12+
abstract = {Intelligent exploration remains a critical challenge in reinforcement learning (RL), especially in visual control tasks. Unlike low-dimensional state-based RL, visual RL must extract task-relevant structure from raw pixels, making exploration inefficient. We propose Concept-Driven Exploration (CDE), which leverages a pre-trained vision-language model (VLM) to generate object-centric visual concepts from textual task descriptions as weak, potentially noisy supervisory signals. Rather than directly conditioning on these noisy signals, CDE trains a policy to reconstruct the concepts via an auxiliary objective, using reconstruction accuracy as an intrinsic reward to guide exploration toward task-relevant objects. Because the policy internalizes these concepts, VLM queries are only needed during training, reducing dependence on external models during deployment. Across five challenging simulated visual manipulation tasks, CDE achieves efficient, targeted exploration and remains robust to noisy VLM predictions. Finally, we demonstrate real-world transfer by deploying CDE on a Franka Research 3 arm, attaining an 80\% success rate in a real-world manipulation task.},
13+
eprint = {2510.08851},
14+
archivePrefix = {arXiv},
15+
primaryClass = {cs.RO},
16+
year = 2025,
17+
pdf = {https://arxiv.org/abs/2510.08851},
18+
projects = {implicit},
19+
note = {Under Review},
20+
abbr = {ARXIV},
21+
website = {https://sites.google.com/view/concept-learn/home},
22+
code = {https://github.com/LeMaoLeMao/Concept-Learning},
23+
preview = {cde.png}
24+
}
9 25
@misc{chen2025spasm,
10 26
title = {Differentiable Particle Optimization for Fast Sequential Manipulation},
11 27
author = {Lucas Chen and Shrutheesh R. Iyer and Zachary Kingston},

_data/coauthors.yml

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -61,6 +61,15 @@
61 61
member: true
62 62
url: shrutheesh
63 63

64+
"liu":
65+
- firstname: ["Andrew H."]
66+
member: true
67+
url: andy
68+
69+
"campbell":
70+
- firstname: ["Joseph"]
71+
url: https://joe-campbell.github.io/website/
72+
64 73
"likhachev":
65 74
- firstname: ["Maxim"]
66 75
url: https://www.cs.cmu.edu/~maxim/

_members/andy.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
1 1
---
2 2
layout: member
3 3
title: Andy Liu
4-
first_name: Andy
4+
first_name: Andrew H.
5 5
last_name: Liu
6 6
pronouns: he/him
7 7
github: "andyhl-96"
1.97 MB
Loading

0 commit comments

Comments
 (0)