Skip to content

Commit bd27cb0

Browse files
committed
feat: use external channel creation and remove duplicate env creation
Signed-off-by: Hao Lin <linhaomails@gmail.com>
1 parent ff5b348 commit bd27cb0

File tree

60 files changed

+369
-923
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

60 files changed

+369
-923
lines changed

.github/CODEOWNERS

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -11,7 +11,7 @@
1111

1212
/rlinf/data @guozhen1997 @Lin-xs @andylin-hao
1313

14-
/rlinf/envs @guozhen1997 @XuS1994
14+
/rlinf/envs @guozhen1997 @andylin-hao @Lin-xs
1515

1616
/rlinf/hybrid_engines/fsdp @guozhen1997
1717
/rlinf/hybrid_engines/megatron @guozhen1997
@@ -26,11 +26,11 @@
2626

2727
/rlinf/utils @guozhen1997 @Lin-xs @andylin-hao
2828

29-
/rlinf/workers/actor/fsdp_actor_worker.py @guozhen1997
29+
/rlinf/workers/actor/fsdp_actor_worker.py @guozhen1997 @andylin-hao @Lin-xs
3030
/rlinf/workers/actor/megatron_actor_worker.py @guozhen1997 @andylin-hao
31-
/rlinf/workers/env @guozhen1997 @XuS1994
31+
/rlinf/workers/env @guozhen1997 @andylin-hao @Lin-xs
3232
/rlinf/workers/inference @andylin-hao
33-
/rlinf/workers/rollout/hf @guozhen1997
33+
/rlinf/workers/rollout/hf @guozhen1997 @Lin-xs @andylin-hao
3434
/rlinf/workers/rollout/sglang @Lin-xs @andylin-hao
3535
/rlinf/workers/rollout/vllm @Lin-xs @andylin-hao
3636
/rlinf/workers/rollout/utils.py @Lin-xs @andylin-hao

.github/workflows/ci-tests.yml

Lines changed: 0 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -2,11 +2,7 @@ name: CI Test
22

33
on:
44
push:
5-
branches:
6-
- "release/v[0-9].[0-9]"
7-
- main
85
pull_request:
9-
branches: [main]
106
types: [synchronize, labeled]
117
workflow_dispatch:
128

examples/embodiment/config/behavior_eval.yaml

Lines changed: 0 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -80,31 +80,18 @@ algorithm:
8080

8181
env:
8282
group_name: "EnvGroup"
83-
channel:
84-
name: "env_buffer_list"
85-
queue_name: "obs_buffer"
86-
queue_size: 0
8783
enable_offload: False
8884
num_envs_per_gpu: 2
8985

9086
rollout:
9187
group_name: "RolloutGroup"
92-
channel:
93-
name: ${env.channel.name}
94-
queue_name: "action_buffer"
95-
queue_size: 0
96-
mode: "colocate"
9788
backend: "huggingface"
9889
model_dir: "/path/to/model/RLinf-OpenVLAOFT-Behavior/"
9990
enable_offload: True
10091
pipeline_stage_num: 1
10192

10293
actor:
10394
group_name: "ActorGroup"
104-
channel:
105-
name: ${env.channel.name}
106-
queue_name: "replay_buffer"
107-
queue_size: 0
10895
training_backend: "fsdp"
10996
checkpoint_load_path: "/path/to/model/RLinf-OpenVLAOFT-Behavior/"
11097
checkpoint_save_path: "../results"

examples/embodiment/config/behavior_ppo_openvlaoft.yaml

Lines changed: 0 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -82,20 +82,11 @@ algorithm:
8282

8383
env:
8484
group_name: "EnvGroup"
85-
channel:
86-
name: "env_buffer_list"
87-
queue_name: "obs_buffer"
88-
queue_size: 0
8985
enable_offload: False
9086
num_envs_per_gpu: 2
9187

9288
rollout:
9389
group_name: "RolloutGroup"
94-
channel:
95-
name: ${env.channel.name}
96-
queue_name: "action_buffer"
97-
queue_size: 0
98-
mode: "colocate"
9990
backend: "huggingface"
10091
model_dir: "/path/to/model/RLinf-OpenVLAOFT-Behavior/"
10192
precision: ${actor.model.precision}
@@ -104,10 +95,6 @@ rollout:
10495

10596
actor:
10697
group_name: "ActorGroup"
107-
channel:
108-
name: ${env.channel.name}
109-
queue_name: "replay_buffer"
110-
queue_size: 0
11198
training_backend: "fsdp"
11299
checkpoint_load_path: "/path/to/model/RLinf-OpenVLAOFT-Behavior/"
113100
checkpoint_save_path: "../results"

examples/embodiment/config/libero_10_grpo_openpi.yaml

Lines changed: 0 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -86,19 +86,10 @@ algorithm:
8686

8787
env:
8888
group_name: "EnvGroup"
89-
channel:
90-
name: "env_buffer_list"
91-
queue_name: "obs_buffer"
92-
queue_size: 0
9389
enable_offload: False
9490

9591
rollout:
9692
group_name: "RolloutGroup"
97-
channel:
98-
name: ${env.channel.name}
99-
queue_name: "action_buffer"
100-
queue_size: 0
101-
mode: "colocate"
10293
generation_backend: "huggingface"
10394
model_dir: "/path/to/model/openpi"
10495
precision: ${actor.model.precision}
@@ -109,10 +100,6 @@ rollout:
109100

110101
actor:
111102
group_name: "ActorGroup"
112-
channel:
113-
name: ${env.channel.name}
114-
queue_name: "replay_buffer"
115-
queue_size: 0
116103
training_backend: "fsdp"
117104
checkpoint_load_path: "/path/to/model/openpi"
118105
checkpoint_save_path: "../results"

examples/embodiment/config/libero_10_grpo_openpi_pi05.yaml

Lines changed: 0 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -85,19 +85,10 @@ algorithm:
8585

8686
env:
8787
group_name: "EnvGroup"
88-
channel:
89-
name: "env_buffer_list"
90-
queue_name: "obs_buffer"
91-
queue_size: 0
9288
enable_offload: False
9389

9490
rollout:
9591
group_name: "RolloutGroup"
96-
channel:
97-
name: ${env.channel.name}
98-
queue_name: "action_buffer"
99-
queue_size: 0
100-
mode: "colocate"
10192
generation_backend: "huggingface"
10293
model_dir: "/path/to/model/openpi"
10394
precision: ${actor.model.precision}
@@ -108,10 +99,6 @@ rollout:
10899

109100
actor:
110101
group_name: "ActorGroup"
111-
channel:
112-
name: ${env.channel.name}
113-
queue_name: "replay_buffer"
114-
queue_size: 0
115102
training_backend: "fsdp"
116103
checkpoint_load_path: "/path/to/model/openpi"
117104
checkpoint_save_path: "../results"

examples/embodiment/config/libero_10_grpo_openvlaoft.yaml

Lines changed: 0 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -86,19 +86,10 @@ algorithm:
8686

8787
env:
8888
group_name: "EnvGroup"
89-
channel:
90-
name: "env_buffer_list"
91-
queue_name: "obs_buffer"
92-
queue_size: 0
9389
enable_offload: False
9490

9591
rollout:
9692
group_name: "RolloutGroup"
97-
channel:
98-
name: ${env.channel.name}
99-
queue_name: "action_buffer"
100-
queue_size: 0
101-
mode: "colocate"
10293
generation_backend: "huggingface"
10394
model_dir: "/path/to/model/Openvla-oft-SFT-libero10-traj1/"
10495
precision: ${actor.model.precision}
@@ -107,10 +98,6 @@ rollout:
10798

10899
actor:
109100
group_name: "ActorGroup"
110-
channel:
111-
name: ${env.channel.name}
112-
queue_name: "replay_buffer"
113-
queue_size: 0
114101
training_backend: "fsdp"
115102
checkpoint_load_path: "/path/to/model/Openvla-oft-SFT-libero10-traj1/"
116103
checkpoint_save_path: "../results"

examples/embodiment/config/libero_10_grpo_openvlaoft_eval.yaml

Lines changed: 0 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -86,19 +86,10 @@ algorithm:
8686

8787
env:
8888
group_name: "EnvGroup"
89-
channel:
90-
name: "env_buffer_list"
91-
queue_name: "obs_buffer"
92-
queue_size: 0
9389
enable_offload: False
9490

9591
rollout:
9692
group_name: "RolloutGroup"
97-
channel:
98-
name: ${env.channel.name}
99-
queue_name: "action_buffer"
100-
queue_size: 0
101-
mode: "colocate"
10293
generation_backend: "huggingface"
10394
model_dir: "/path/to/model/Openvla-oft-SFT-libero10-traj1/"
10495
precision: ${actor.model.precision}
@@ -107,10 +98,6 @@ rollout:
10798

10899
actor:
109100
group_name: "ActorGroup"
110-
channel:
111-
name: ${env.channel.name}
112-
queue_name: "replay_buffer"
113-
queue_size: 0
114101
training_backend: "fsdp"
115102
checkpoint_load_path: "/path/to/model/Openvla-oft-SFT-libero10-traj1/"
116103
checkpoint_save_path: "../results"

examples/embodiment/config/libero_10_ppo_openpi.yaml

Lines changed: 0 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -86,19 +86,10 @@ algorithm:
8686

8787
env:
8888
group_name: "EnvGroup"
89-
channel:
90-
name: "env_buffer_list"
91-
queue_name: "obs_buffer"
92-
queue_size: 0
9389
enable_offload: False
9490

9591
rollout:
9692
group_name: "RolloutGroup"
97-
channel:
98-
name: ${env.channel.name}
99-
queue_name: "action_buffer"
100-
queue_size: 0
101-
mode: "colocate"
10293
generation_backend: "huggingface"
10394
model_dir: "/path/to/model/openpi"
10495
precision: ${actor.model.precision}
@@ -109,10 +100,6 @@ rollout:
109100

110101
actor:
111102
group_name: "ActorGroup"
112-
channel:
113-
name: ${env.channel.name}
114-
queue_name: "replay_buffer"
115-
queue_size: 0
116103
training_backend: "fsdp"
117104
checkpoint_load_path: "/path/to/model/openpi"
118105
checkpoint_save_path: "../results"

examples/embodiment/config/libero_10_ppo_openpi_pi05.yaml

Lines changed: 0 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -85,19 +85,10 @@ algorithm:
8585

8686
env:
8787
group_name: "EnvGroup"
88-
channel:
89-
name: "env_buffer_list"
90-
queue_name: "obs_buffer"
91-
queue_size: 0
9288
enable_offload: False
9389

9490
rollout:
9591
group_name: "RolloutGroup"
96-
channel:
97-
name: ${env.channel.name}
98-
queue_name: "action_buffer"
99-
queue_size: 0
100-
mode: "colocate"
10192
generation_backend: "huggingface"
10293
model_dir: "/path/to/model/openpi"
10394
precision: ${actor.model.precision}
@@ -108,10 +99,6 @@ rollout:
10899

109100
actor:
110101
group_name: "ActorGroup"
111-
channel:
112-
name: ${env.channel.name}
113-
queue_name: "replay_buffer"
114-
queue_size: 0
115102
training_backend: "fsdp"
116103
checkpoint_load_path: "/path/to/model/openpi"
117104
checkpoint_save_path: "../results"

0 commit comments

Comments
 (0)