liruiw committed on
Commit
9f47354
1 Parent(s): 3719021

Upload 3 files

Browse files
Files changed (3) hide show
  1. config.yaml +188 -0
  2. model.pth +3 -0
  3. trunk.pth +3 -0
config.yaml ADDED
@@ -0,0 +1,188 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 0
2
+ output_dir: output/05_05_2024_20_21_54_727273
3
+ domains: austin_sailor_dataset_converted_externally_to_rlds, stanford_hydra_dataset_converted_externally_to_rlds,
4
+ austin_buds_dataset_converted_externally_to_rlds, austin_sirius_dataset_converted_externally_to_rlds,
5
+ berkeley_mvp_converted_externally_to_rlds, berkeley_rpt_converted_externally_to_rlds,
6
+ iamlab_cmu_pickup_insert_converted_externally_to_rlds, utaustin_mutex, imperialcollege_sawyer_wrist_cam,
7
+ stanford_mask_vit_converted_externally_to_rlds, language_table, kuka, bc_z, robo_net,
8
+ dlr_sara_pour_converted_externally_to_rlds, stanford_robocook_converted_externally_to_rlds,
9
+ cmu_play_fusion, bridge, furniture_bench_dataset_converted_externally_to_rlds, ucsd_pick_and_place_dataset_converted_externally_to_rlds,
10
+ usc_cloth_sim_converted_externally_to_rlds, stanford_kuka_multimodal_dataset_converted_externally_to_rlds,
11
+ roboturk, kaist_nonprehensile_converted_externally_to_rlds, asu_table_top_converted_externally_to_rlds,
12
+ utokyo_xarm_pick_and_place_converted_externally_to_rlds, berkeley_cable_routing,
13
+ droid, uiuc_d3field, robo_set, qut_dexterous_manpulation, nyu_door_opening_surprising_effectiveness,
14
+ nyu_franka_play_dataset_converted_externally_to_rlds, mimic_play, maniskill_dataset_converted_externally_to_rlds,
15
+ columbia_cairlab_pusht_real, conq_hose_manipulation, dlr_edan_shared_control_converted_externally_to_rlds,
16
+ berkeley_gnm_sac_son, berkeley_autolab_ur5, aloha_mobile, agent_aware_affordances
17
+ log_dir: output/05_05_2024_20_21_54_727273
18
+ debug_distributed: false
19
+ wb_tag: default
20
+ wb_cont_run: 2nxmlp81
21
+ log_interval: 10
22
+ script_name: run_resnet_30dataset_traj100000_embed_256_batch2048_800k_language
23
+ save_wb_checkpoint: true
24
+ slurm_job_id: '27155760'
25
+ effective_total_epochs: 100
26
+ effective_batch_size: 256
27
+ epoch_size: 10
28
+ total_num_traj: 0
29
+ total_num_sample: 0
30
+ rank: 0
31
+ gpu: 0
32
+ task_per_gpu: 1
33
+ world_size: 64
34
+ debug_submitit: false
35
+ ngpus: 8
36
+ nodes: 8
37
+ timeout: 4320
38
+ job_dir: logs/
39
+ partition: learnlab
40
+ use_volta32: true
41
+ comment: ''
42
+ resume: logs/
43
+ dist_url: file:///checkpoint/xinleic/experiments/43124ff352a546a8b51d5fb4234b51d8_init
44
+ dist_on_itp: false
45
+ local_rank: 1
46
+ distributed: true
47
+ dist_backend: nccl
48
+ dset_w_temperature: 2.0
49
+ dataset_shuffle: true
50
+ dataset_groups: ''
51
+ nodelist: learnlab,learnfair,scavenge
52
+ fsdp: false
53
+ count_flops: false
54
+ accumuate_gradient_steps: 1
55
+ trunk_acc_gradient_step: 1
56
+ submitit_autoresume: true
57
+ customized_dataset_mixture_file: ''
58
+ trunk_separate_opt: false
59
+ dataset:
60
+ _target_: hpt_pretrain.dataset.traj_dataset.TrajDataset
61
+ horizon: 5
62
+ val_ratio: 0.1
63
+ pad_after: 0
64
+ precompute_feat: true
65
+ image_encoder: resnet
66
+ episode_cnt: 100000
67
+ step_cnt: 10000000
68
+ data_augmentation: false
69
+ use_disk: true
70
+ pad_before: 0
71
+ data_ratio: 1
72
+ action_horizon: 8
73
+ observation_horizon: 4
74
+ dataset_postfix: _traj100000
75
+ dataset_encoder_postfix: _resnet
76
+ use_multiview: false
77
+ normalize_state: true
78
+ use_heldout_dataset: true
79
+ heldout_dataset: false
80
+ regenerate: false
81
+ continue_generate: false
82
+ network:
83
+ _target_: hpt_pretrain.models.policy.Policy
84
+ embed_dim: 256
85
+ num_blocks: 16
86
+ num_heads: 8
87
+ use_modality_embedding: true
88
+ use_domain_embedding: false
89
+ token_postprocessing: mean
90
+ weight_init_style: pytorch
91
+ drop_path: 0.1
92
+ mae_loss_scale: 0.0
93
+ masked_autoencoding: false
94
+ action_horizon: ${dataset.action_horizon}
95
+ stem:
96
+ modalities:
97
+ - image
98
+ - state
99
+ - language
100
+ modality_embed_dim: 256
101
+ normalize_state: ${dataset.normalize_state}
102
+ state_embedding_dim: 1
103
+ image_encoder: ${dataset.image_encoder}
104
+ crossattn_dim_head: 64
105
+ crossattn_heads: 8
106
+ crossattn_modality_dropout: 0.1
107
+ observation_horizon: ${dataset.observation_horizon}
108
+ random_horizon_masking: true
109
+ add_pos_embedding_to_state: false
110
+ num_blocks: 1
111
+ crossattn_latent:
112
+ image: 16
113
+ state: 16
114
+ language: 8
115
+ image:
116
+ _target_: hpt_pretrain.models.policy_stem.MLP
117
+ input_dim: 512
118
+ output_dim: 256
119
+ widths:
120
+ - 128
121
+ num_of_copy: 1
122
+ state:
123
+ _target_: hpt_pretrain.models.policy_stem.MLP
124
+ input_dim: 8
125
+ output_dim: 256
126
+ widths:
127
+ - 128
128
+ language:
129
+ _target_: hpt_pretrain.models.policy_stem.MLP
130
+ input_dim: 768
131
+ output_dim: ${network.embed_dim}
132
+ widths:
133
+ - 128
134
+ head:
135
+ _target_: hpt_pretrain.models.policy_head.MLP
136
+ input_dim: 256
137
+ tanh_end: true
138
+ output_dim: 48
139
+ dropout: true
140
+ widths:
141
+ - 256
142
+ - 128
143
+ dataloader:
144
+ batch_size: 32
145
+ num_workers: 1
146
+ pin_memory: false
147
+ persistent_workers: false
148
+ drop_last: true
149
+ val_dataloader:
150
+ num_workers: 1
151
+ pin_memory: false
152
+ persistent_workers: false
153
+ ddp_dataloader:
154
+ num_workers: 8
155
+ pin_memory: false
156
+ persistent_workers: false
157
+ drop_last: false
158
+ prefetch_factor: 6
159
+ ddp_val_dataloader:
160
+ num_workers: 8
161
+ pin_memory: false
162
+ persistent_workers: false
163
+ drop_last: false
164
+ prefetch_factor: 2
165
+ optimizer:
166
+ _target_: torch.optim.AdamW
167
+ lr: 0.001
168
+ eps: 1.0e-06
169
+ weight_decay: 0.05
170
+ optimizer_misc:
171
+ nontrunk_lr_scale: 0.5
172
+ warmup_lr:
173
+ lr: 1.0e-10
174
+ step: 1000
175
+ train:
176
+ total_epochs: 30000
177
+ total_iters: 800000
178
+ epoch_iters: 1000
179
+ validation_iters: 100
180
+ use_accumulation: false
181
+ pretrained_dir: '05_05_2024_20_21_54_727273'
182
+ max_validation_size: 10
183
+ load_pretrain_trunk_only: false
184
+ freeze_trunk: false
185
+ lr_scheduler:
186
+ _target_: torch.optim.lr_scheduler.CosineAnnealingLR
187
+ T_max: 800000
188
+ eta_min: 1.0e-06
model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76698f5a63dce67bc7b6cb5622781af0c0e3569eaffe459652c3e177afb4c481
3
+ size 379997162
trunk.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b59bf717a7aac851d5a65fb752f4cc957a170f5bb474fc097197be0d9cfa103
3
+ size 50642858