# Viewer metadata carried over from the page this file was copied from: File size: 1,048 Bytes; 6dfcb0f
# Launch script: runs run_cwm_pretraining.py from the VideoMAE-main tree with
# one fixed set of command-line options. The output directory name labels the
# run as "ablation_3frame_16x16_no_clumping_mr0.95".
#
# Requires: HOME to be set and python3 to be on PATH. Every path below is
# derived from HOME.

# Directory holding both the training entry point and the video file lists.
VIDEOMAE_DIR="${HOME}/BBNet/bbnet/models/VideoMAE-main"

# Passed to the training script as both --log_dir and --output_dir.
OUTPUT_DIR="${HOME}/checkpoints/cwm_cvpr_checkpoints/ablation_3frame_16x16_no_clumping_mr0.95/"
# Passed to the training script as --data_path.
DATA_PATH="${VIDEOMAE_DIR}/video_file_lists/kinetics_400_train_list.txt"

# Path expansions are double-quoted so that a HOME containing whitespace or
# glob characters still reaches python3 as a single argument each.
#
# NOTE(review): "--no_normlize_target" is kept exactly as it was spelled in
# the original invocation; presumably it matches the flag name declared by
# run_cwm_pretraining.py -- confirm against that script before "correcting" it.
#
# The last option deliberately has NO trailing backslash: a dangling line
# continuation would swallow whatever line is later added below this command
# and hand it to python3 as an extra argument.
python3 "${VIDEOMAE_DIR}/run_cwm_pretraining.py" \
  --data_path "${DATA_PATH}" \
  --mask_type rotated_table \
  --mask_ratio 0.95 \
  --mask_kwargs '{"tube_length": 1}' \
  --model vitbase_16x16patch_3frames_1tube \
  --context_frames 2 \
  --target_frames 1 \
  --temporal_units 'ms' \
  --sampling_rate 150 \
  --context_target_gap 150 150 \
  --batch_size 32 \
  --accum_iter 1 \
  --opt adamw \
  --opt_betas 0.9 0.95 \
  --warmup_epochs 40 \
  --save_ckpt_freq 50 \
  --epochs 800 \
  --no_normlize_target \
  --rescale_size 224 \
  --augmentation_type 'multiscale' \
  --augmentation_scales 1.0 0.875 0.75 0.66 \
  --log_dir "${OUTPUT_DIR}" \
  --output_dir "${OUTPUT_DIR}" \
  --print_freq 1 \
  --num_workers 16 \
  --use_xla