Skip to content

Commit aa070e3

Browse files
committed
[minor]: rm sa config for future release
1 parent f19ddd3 commit aa070e3

2 files changed

Lines changed: 105 additions & 106 deletions

File tree

README.md

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -75,7 +75,7 @@ This repository is built on top of [openpi](https://github.com/Physical-Intellig
7575

7676
For Model Arithmetic (mixing checkpoints), GPU memory requirements depend on the model size and number of checkpoints being mixed. A single A100 (80GB) is sufficient for most use cases.
7777

78-
The repo has been tested with Ubuntu 22.04.
78+
Non-edge components (e.g., Policy Training, Model Arithmetic) have been tested on Ubuntu 22.04.
7979

8080
### Hardware
8181

@@ -112,7 +112,6 @@ uv pip install safetensors
112112
Download the Kai0 dataset so it is available under `./data` for training and evaluation. From the repository root, run:
113113

114114
```bash
115-
pip install huggingface_hub # if not already installed
116115
python scripts/download_dataset.py
117116
```
118117

src/openpi/training/config.py

Lines changed: 104 additions & 104 deletions
Original file line numberDiff line numberDiff line change
@@ -1224,110 +1224,110 @@ def __post_init__(self) -> None:
12241224

12251225

12261226
#************************Advantage Estimator***************************
1227-
TrainConfig(
1228-
name="ADVANTAGE_TORCH_KAI0_FLATTEN_FOLD",
1229-
advantage_estimator=True,
1230-
model=pi0_config.AdvantageEstimatorConfig(
1231-
pi05=True,
1232-
loss_value_weight=1.,
1233-
loss_action_weight=0.,
1234-
discrete_state_input=False,
1235-
),
1236-
data=LerobotAgilexDataConfig(
1237-
repo_id = "Path/to/your/advantage/dataset",
1238-
assets=AssetsConfig(
1239-
assets_dir="Path/to/your/advantage/dataset/assets",
1240-
asset_id="Your_advantage_dataset_name",
1241-
),
1242-
default_prompt="Flatten and fold the cloth.",
1243-
# * why removing "prompt" here will lead to an error in transforms.py
1244-
repack_transforms=_transforms.Group(
1245-
inputs=[
1246-
_transforms.RepackTransform(
1247-
{
1248-
"images": {
1249-
"top_head": "observation.images.top_head",
1250-
"hand_left": "observation.images.hand_left",
1251-
"hand_right": "observation.images.hand_right",
1252-
"his_-100_top_head": "his_-100_observation.images.top_head",
1253-
"his_-100_hand_left": "his_-100_observation.images.hand_left",
1254-
"his_-100_hand_right": "his_-100_observation.images.hand_right",
1255-
},
1256-
"state": "observation.state",
1257-
"actions": "action",
1258-
# "prompt": "prompt", # ! Not adding this for default prompt.
1259-
"episode_length": "episode_length",
1260-
"frame_index": "frame_index",
1261-
"episode_index": "episode_index",
1262-
"progress_gt": "progress_gt",
1263-
"stage_progress_gt": "stage_progress_gt",
1264-
"progress": "progress",
1265-
# "is_suboptimal": "is_suboptimal",
1266-
}
1267-
)
1268-
]
1269-
)
1270-
),
1271-
pytorch_weight_path="Path/to/your/pi05_base/checkpoint",
1272-
num_train_steps=100_000,
1273-
keep_period=10000,
1274-
save_interval=10000,
1275-
num_workers=8,
1276-
batch_size=16, # * 1 gpus
1277-
# batch_size=128, # * 8 gpus
1278-
skip_norm_stats=True, # * No norm stats used.
1279-
),
1280-
TrainConfig(
1281-
name="ADVANTAGE_TORCH_PI06_FLATTEN_FOLD",
1282-
advantage_estimator=True,
1283-
model=pi0_config.AdvantageEstimatorConfig(
1284-
pi05=True,
1285-
loss_value_weight=1.,
1286-
loss_action_weight=0., # No action loss in advantage estimator training
1287-
discrete_state_input=False, # Not using states into prompt like pi05
1288-
),
1289-
data=LerobotAgilexDataConfig(
1290-
# repo_id = "/cpfs01/shared/filtered_cut_data/short_sleeve/flatten_fold/v9-3/1022_20_590_v9-3_2000_lerobot",
1291-
repo_id = "Path/to/your/advantage/dataset",
1292-
assets=AssetsConfig(
1293-
assets_dir="Path/to/your/advantage/dataset/assets",
1294-
asset_id="Your_advantage_dataset_name",
1295-
),
1296-
default_prompt="Flatten and fold the cloth.",
1297-
# * why removing "prompt" here will lead to an error in transforms.py
1298-
repack_transforms=_transforms.Group(
1299-
inputs=[
1300-
_transforms.RepackTransform(
1301-
{
1302-
"images": {
1303-
"top_head": "observation.images.top_head",
1304-
"hand_left": "observation.images.hand_left",
1305-
"hand_right": "observation.images.hand_right",
1306-
},
1307-
"state": "observation.state",
1308-
"actions": "action",
1309-
# "prompt": "prompt", # No need if default prompt is used.
1310-
"episode_length": "episode_length",
1311-
"frame_index": "frame_index",
1312-
"episode_index": "episode_index",
1313-
"progress_gt": "progress_gt",
1314-
"stage_progress_gt": "stage_progress_gt",
1315-
"progress": "progress",
1316-
# "is_suboptimal": "is_suboptimal",
1317-
}
1318-
)
1319-
]
1320-
)
1321-
),
1322-
pytorch_weight_path="Path/to/your/pi06_base/checkpoint",
1323-
num_train_steps=100_000,
1324-
keep_period=10000,
1325-
save_interval=10000,
1326-
num_workers=55,
1327-
# batch_size=16, # * 1 gpus
1328-
batch_size=18*8, # * 8 gpus
1329-
skip_norm_stats=True, # * No norm stats used.
1330-
),
1227+
# TrainConfig(
1228+
# name="ADVANTAGE_TORCH_KAI0_FLATTEN_FOLD",
1229+
# advantage_estimator=True,
1230+
# model=pi0_config.AdvantageEstimatorConfig(
1231+
# pi05=True,
1232+
# loss_value_weight=1.,
1233+
# loss_action_weight=0.,
1234+
# discrete_state_input=False,
1235+
# ),
1236+
# data=LerobotAgilexDataConfig(
1237+
# repo_id = "Path/to/your/advantage/dataset",
1238+
# assets=AssetsConfig(
1239+
# assets_dir="Path/to/your/advantage/dataset/assets",
1240+
# asset_id="Your_advantage_dataset_name",
1241+
# ),
1242+
# default_prompt="Flatten and fold the cloth.",
1243+
# # * why removing "prompt" here will lead to an error in transforms.py
1244+
# repack_transforms=_transforms.Group(
1245+
# inputs=[
1246+
# _transforms.RepackTransform(
1247+
# {
1248+
# "images": {
1249+
# "top_head": "observation.images.top_head",
1250+
# "hand_left": "observation.images.hand_left",
1251+
# "hand_right": "observation.images.hand_right",
1252+
# "his_-100_top_head": "his_-100_observation.images.top_head",
1253+
# "his_-100_hand_left": "his_-100_observation.images.hand_left",
1254+
# "his_-100_hand_right": "his_-100_observation.images.hand_right",
1255+
# },
1256+
# "state": "observation.state",
1257+
# "actions": "action",
1258+
# # "prompt": "prompt", # ! Not adding this for default prompt.
1259+
# "episode_length": "episode_length",
1260+
# "frame_index": "frame_index",
1261+
# "episode_index": "episode_index",
1262+
# "progress_gt": "progress_gt",
1263+
# "stage_progress_gt": "stage_progress_gt",
1264+
# "progress": "progress",
1265+
# # "is_suboptimal": "is_suboptimal",
1266+
# }
1267+
# )
1268+
# ]
1269+
# )
1270+
# ),
1271+
# pytorch_weight_path="Path/to/your/pi05_base/checkpoint",
1272+
# num_train_steps=100_000,
1273+
# keep_period=10000,
1274+
# save_interval=10000,
1275+
# num_workers=8,
1276+
# batch_size=16, # * 1 gpus
1277+
# # batch_size=128, # * 8 gpus
1278+
# skip_norm_stats=True, # * No norm stats used.
1279+
# ),
1280+
# TrainConfig(
1281+
# name="ADVANTAGE_TORCH_PI06_FLATTEN_FOLD",
1282+
# advantage_estimator=True,
1283+
# model=pi0_config.AdvantageEstimatorConfig(
1284+
# pi05=True,
1285+
# loss_value_weight=1.,
1286+
# loss_action_weight=0., # No action loss in advantage estimator training
1287+
# discrete_state_input=False, # Not using states into prompt like pi05
1288+
# ),
1289+
# data=LerobotAgilexDataConfig(
1290+
# # repo_id = "/cpfs01/shared/filtered_cut_data/short_sleeve/flatten_fold/v9-3/1022_20_590_v9-3_2000_lerobot",
1291+
# repo_id = "Path/to/your/advantage/dataset",
1292+
# assets=AssetsConfig(
1293+
# assets_dir="Path/to/your/advantage/dataset/assets",
1294+
# asset_id="Your_advantage_dataset_name",
1295+
# ),
1296+
# default_prompt="Flatten and fold the cloth.",
1297+
# # * why removing "prompt" here will lead to an error in transforms.py
1298+
# repack_transforms=_transforms.Group(
1299+
# inputs=[
1300+
# _transforms.RepackTransform(
1301+
# {
1302+
# "images": {
1303+
# "top_head": "observation.images.top_head",
1304+
# "hand_left": "observation.images.hand_left",
1305+
# "hand_right": "observation.images.hand_right",
1306+
# },
1307+
# "state": "observation.state",
1308+
# "actions": "action",
1309+
# # "prompt": "prompt", # No need if default prompt is used.
1310+
# "episode_length": "episode_length",
1311+
# "frame_index": "frame_index",
1312+
# "episode_index": "episode_index",
1313+
# "progress_gt": "progress_gt",
1314+
# "stage_progress_gt": "stage_progress_gt",
1315+
# "progress": "progress",
1316+
# # "is_suboptimal": "is_suboptimal",
1317+
# }
1318+
# )
1319+
# ]
1320+
# )
1321+
# ),
1322+
# pytorch_weight_path="Path/to/your/pi06_base/checkpoint",
1323+
# num_train_steps=100_000,
1324+
# keep_period=10000,
1325+
# save_interval=10000,
1326+
# num_workers=55,
1327+
# # batch_size=16, # * 1 gpus
1328+
# batch_size=18*8, # * 8 gpus
1329+
# skip_norm_stats=True, # * No norm stats used.
1330+
# ),
13311331
#************************advantage estimator***************************
13321332
# RoboArena & PolaRiS configs.
13331333
*roboarena_config.get_roboarena_configs(),

0 commit comments

Comments
 (0)