myniu committed on
Commit
12f772a
1 Parent(s): b6fb998
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. README.md +40 -0
  2. ckpts/controlnet/config.json +45 -0
  3. ckpts/controlnet/diffusion_pytorch_model.safetensors +3 -0
  4. models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/config.yaml +59 -0
  5. models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/resume.sh +8 -0
  6. models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/resume_slurm.sh +9 -0
  7. models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/train.sh +6 -0
  8. models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/train_slurm.sh +7 -0
  9. models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/validate.sh +6 -0
  10. models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/validate_slurm.sh +8 -0
  11. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/config.yaml +58 -0
  12. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/resume.sh +8 -0
  13. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/resume_slurm.sh +9 -0
  14. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/train.sh +6 -0
  15. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/train_slurm.sh +7 -0
  16. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/validate.sh +6 -0
  17. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/validate_slurm.sh +8 -0
  18. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/config.yaml +58 -0
  19. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/resume.sh +6 -0
  20. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/resume_slurm.sh +9 -0
  21. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/train.sh +4 -0
  22. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/train_slurm.sh +7 -0
  23. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/validate.sh +6 -0
  24. models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/validate_slurm.sh +8 -0
  25. models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/config.yaml +61 -0
  26. models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/resume.sh +8 -0
  27. models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/resume_slurm.sh +9 -0
  28. models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/train.sh +6 -0
  29. models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/train_slurm.sh +7 -0
  30. models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/validate.sh +6 -0
  31. models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/validate_slurm.sh +8 -0
  32. models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/config.yaml +58 -0
  33. models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/resume.sh +8 -0
  34. models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/resume_slurm.sh +9 -0
  35. models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/train.sh +6 -0
  36. models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/train_slurm.sh +7 -0
  37. models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/validate.sh +6 -0
  38. models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/validate_slurm.sh +8 -0
  39. models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/config.yaml +58 -0
  40. models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/resume.sh +8 -0
  41. models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/resume_slurm.sh +9 -0
  42. models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/train.sh +6 -0
  43. models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/train_slurm.sh +7 -0
  44. models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/validate.sh +6 -0
  45. models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/validate_slurm.sh +8 -0
  46. models/cmp/experiments/semiauto_annot/resnet50_vip+mpii_liteflow/checkpoints/ckpt_iter_42000.pth.tar +3 -0
  47. models/cmp/experiments/semiauto_annot/resnet50_vip+mpii_liteflow/config.yaml +59 -0
  48. models/cmp/experiments/semiauto_annot/resnet50_vip+mpii_liteflow/resume.sh +6 -0
  49. models/cmp/experiments/semiauto_annot/resnet50_vip+mpii_liteflow/resume_slurm.sh +9 -0
  50. models/cmp/experiments/semiauto_annot/resnet50_vip+mpii_liteflow/train.sh +4 -0
README.md ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ## Environment Setup
2
+
3
+ `pip install -r requirements.txt`
4
+
5
+ ## Download checkpoints
6
+
7
+ 1. Download the pretrained checkpoints of [SVD_xt](https://huggingface.co/stabilityai/stable-video-diffusion-img2vid-xt-1-1) from huggingface to `./ckpts`.
8
+
9
+ 2. Download the checkpoint of [MOFA-Adapter](https://huggingface.co/MyNiuuu/MOFA-Video-Traj) from Hugging Face to `./ckpts`.
10
+
11
+ The final structure of checkpoints should be:
12
+
13
+
14
+ ```text
15
+ ./ckpts/
16
+ |-- controlnet
17
+ | |-- config.json
18
+ | `-- diffusion_pytorch_model.safetensors
19
+ |-- stable-video-diffusion-img2vid-xt-1-1
20
+ | |-- feature_extractor
21
+ | |-- ...
22
+ | |-- image_encoder
23
+ | |-- ...
24
+ | |-- scheduler
25
+ | |-- ...
26
+ | |-- unet
27
+ | |-- ...
28
+ | |-- unet_ch9
29
+ | |-- ...
30
+ | |-- vae
31
+ | |-- ...
32
+ | |-- svd_xt_1_1.safetensors
33
+ | `-- model_index.json
34
+ ```
35
+
36
+ ## Run Gradio Demo
37
+
38
+ `python run_gradio.py`
39
+
40
+ Please refer to the instructions on the gradio interface during the inference process.
ckpts/controlnet/config.json ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "FlowControlNet",
3
+ "_diffusers_version": "0.25.1",
4
+ "_name_or_path": "/apdcephfs_cq10/share_1290939/myniu/svd_controlnet/svdxt11_featureflow_forward_avg_256256_stride4/unimatch_512384/checkpoint-100000/controlnet",
5
+ "addition_time_embed_dim": 256,
6
+ "block_out_channels": [
7
+ 320,
8
+ 640,
9
+ 1280,
10
+ 1280
11
+ ],
12
+ "conditioning_channels": 3,
13
+ "conditioning_embedding_out_channels": [
14
+ 16,
15
+ 32,
16
+ 96,
17
+ 256
18
+ ],
19
+ "cross_attention_dim": 1024,
20
+ "down_block_types": [
21
+ "CrossAttnDownBlockSpatioTemporal",
22
+ "CrossAttnDownBlockSpatioTemporal",
23
+ "CrossAttnDownBlockSpatioTemporal",
24
+ "DownBlockSpatioTemporal"
25
+ ],
26
+ "in_channels": 8,
27
+ "layers_per_block": 2,
28
+ "num_attention_heads": [
29
+ 5,
30
+ 10,
31
+ 10,
32
+ 20
33
+ ],
34
+ "num_frames": 25,
35
+ "out_channels": 4,
36
+ "projection_class_embeddings_input_dim": 768,
37
+ "sample_size": null,
38
+ "transformer_layers_per_block": 1,
39
+ "up_block_types": [
40
+ "UpBlockSpatioTemporal",
41
+ "CrossAttnUpBlockSpatioTemporal",
42
+ "CrossAttnUpBlockSpatioTemporal",
43
+ "CrossAttnUpBlockSpatioTemporal"
44
+ ]
45
+ }
ckpts/controlnet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1303192a1e72d071e15e7eb37fd1ea15f6424aaf2cd6b6b1e1bb3b1e9e75d37e
3
+ size 2777345452
models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/config.yaml ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ arch: CMP
3
+ total_iter: 140000
4
+ lr_steps: [80000, 120000]
5
+ lr_mults: [0.1, 0.1]
6
+ lr: 0.1
7
+ optim: SGD
8
+ warmup_lr: []
9
+ warmup_steps: []
10
+ module:
11
+ arch: CMP
12
+ image_encoder: alexnet_fcn_32x
13
+ sparse_encoder: shallownet32x
14
+ flow_decoder: MotionDecoderPlain
15
+ skip_layer: False
16
+ img_enc_dim: 256
17
+ sparse_enc_dim: 16
18
+ output_dim: 198
19
+ decoder_combo: [1,2,4]
20
+ pretrained_image_encoder: False
21
+ flow_criterion: "DiscreteLoss"
22
+ nbins: 99
23
+ fmax: 50
24
+ data:
25
+ workers: 2
26
+ batch_size: 12
27
+ batch_size_test: 1
28
+ data_mean: [123.675, 116.28, 103.53] # RGB
29
+ data_div: [58.395, 57.12, 57.375]
30
+ short_size: 416
31
+ crop_size: [384, 384]
32
+ sample_strategy: ['grid', 'watershed']
33
+ sample_bg_ratio: 0.000025
34
+ nms_ks: 81
35
+ max_num_guide: 150
36
+
37
+ flow_file_type: "jpg"
38
+ image_flow_aug:
39
+ flip: False
40
+ flow_aug:
41
+ reverse: False
42
+ scale: False
43
+ rotate: False
44
+ train_source:
45
+ - data/yfcc/lists/train.txt
46
+ - data/youtube9000/lists/train.txt
47
+ val_source:
48
+ - data/yfcc/lists/val.txt
49
+ memcached: False
50
+ trainer:
51
+ initial_val: True
52
+ print_freq: 100
53
+ val_freq: 10000
54
+ save_freq: 10000
55
+ val_iter: -1
56
+ val_disp_start_iter: 0
57
+ val_disp_end_iter: 16
58
+ loss_record: ['loss_flow']
59
+ tensorboard: False
models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/resume.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 \
4
+ --nnodes=2 --node_rank=$1 \
5
+ --master_addr="192.168.1.1" main.py \
6
+ --config $work_path/config.yaml --launcher pytorch \
7
+ --load-iter 10000 \
8
+ --resume
models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/resume_slurm.sh ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n16 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm \
8
+ --load-iter 10000 \
9
+ --resume
models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/train.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 \
4
+ --nnodes=2 --node_rank=$1 \
5
+ --master_addr="192.168.1.1" main.py \
6
+ --config $work_path/config.yaml --launcher pytorch
models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/train_slurm.sh ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n16 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm
models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/validate.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 main.py \
4
+ --config $work_path/config.yaml --launcher pytorch \
5
+ --load-iter 70000 \
6
+ --validate
models/cmp/experiments/rep_learning/alexnet_yfcc+youtube_voc_16gpu_140k/validate_slurm.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n8 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py --config $work_path/config.yaml --launcher slurm \
7
+ --load-iter 70000 \
8
+ --validate
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/config.yaml ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ arch: CMP
3
+ total_iter: 70000
4
+ lr_steps: [40000, 60000]
5
+ lr_mults: [0.1, 0.1]
6
+ lr: 0.1
7
+ optim: SGD
8
+ warmup_lr: []
9
+ warmup_steps: []
10
+ module:
11
+ arch: CMP
12
+ image_encoder: alexnet_fcn_32x
13
+ sparse_encoder: shallownet32x
14
+ flow_decoder: MotionDecoderPlain
15
+ skip_layer: False
16
+ img_enc_dim: 256
17
+ sparse_enc_dim: 16
18
+ output_dim: 198
19
+ decoder_combo: [1,2,4]
20
+ pretrained_image_encoder: False
21
+ flow_criterion: "DiscreteLoss"
22
+ nbins: 99
23
+ fmax: 50
24
+ data:
25
+ workers: 2
26
+ batch_size: 12
27
+ batch_size_test: 1
28
+ data_mean: [123.675, 116.28, 103.53] # RGB
29
+ data_div: [58.395, 57.12, 57.375]
30
+ short_size: 416
31
+ crop_size: [384, 384]
32
+ sample_strategy: ['grid', 'watershed']
33
+ sample_bg_ratio: 0.00015625
34
+ nms_ks: 41
35
+ max_num_guide: 150
36
+
37
+ flow_file_type: "jpg"
38
+ image_flow_aug:
39
+ flip: False
40
+ flow_aug:
41
+ reverse: False
42
+ scale: False
43
+ rotate: False
44
+ train_source:
45
+ - data/yfcc/lists/train.txt
46
+ val_source:
47
+ - data/yfcc/lists/val.txt
48
+ memcached: False
49
+ trainer:
50
+ initial_val: True
51
+ print_freq: 100
52
+ val_freq: 10000
53
+ save_freq: 10000
54
+ val_iter: -1
55
+ val_disp_start_iter: 0
56
+ val_disp_end_iter: 16
57
+ loss_record: ['loss_flow']
58
+ tensorboard: False
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/resume.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 \
4
+ --nnodes=2 --node_rank=$1 \
5
+ --master_addr="192.168.1.1" main.py \
6
+ --config $work_path/config.yaml --launcher pytorch \
7
+ --load-iter 10000 \
8
+ --resume
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/resume_slurm.sh ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n16 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm \
8
+ --load-iter 10000 \
9
+ --resume
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/train.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 \
4
+ --nnodes=2 --node_rank=$1 \
5
+ --master_addr="192.168.1.1" main.py \
6
+ --config $work_path/config.yaml --launcher pytorch
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/train_slurm.sh ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n16 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/validate.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 main.py \
4
+ --config $work_path/config.yaml --launcher pytorch \
5
+ --load-iter 70000 \
6
+ --validate
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_16gpu_70k/validate_slurm.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n8 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py --config $work_path/config.yaml --launcher slurm \
7
+ --load-iter 70000 \
8
+ --validate
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/config.yaml ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ arch: CMP
3
+ total_iter: 140000
4
+ lr_steps: [80000, 120000]
5
+ lr_mults: [0.1, 0.1]
6
+ lr: 0.1
7
+ optim: SGD
8
+ warmup_lr: []
9
+ warmup_steps: []
10
+ module:
11
+ arch: CMP
12
+ image_encoder: alexnet_fcn_32x
13
+ sparse_encoder: shallownet32x
14
+ flow_decoder: MotionDecoderPlain
15
+ skip_layer: False
16
+ img_enc_dim: 256
17
+ sparse_enc_dim: 16
18
+ output_dim: 198
19
+ decoder_combo: [1,2,4]
20
+ pretrained_image_encoder: False
21
+ flow_criterion: "DiscreteLoss"
22
+ nbins: 99
23
+ fmax: 50
24
+ data:
25
+ workers: 2
26
+ batch_size: 12
27
+ batch_size_test: 1
28
+ data_mean: [123.675, 116.28, 103.53] # RGB
29
+ data_div: [58.395, 57.12, 57.375]
30
+ short_size: 416
31
+ crop_size: [384, 384]
32
+ sample_strategy: ['grid', 'watershed']
33
+ sample_bg_ratio: 0.00015625
34
+ nms_ks: 41
35
+ max_num_guide: 150
36
+
37
+ flow_file_type: "jpg"
38
+ image_flow_aug:
39
+ flip: False
40
+ flow_aug:
41
+ reverse: False
42
+ scale: False
43
+ rotate: False
44
+ train_source:
45
+ - data/yfcc/lists/train.txt
46
+ val_source:
47
+ - data/yfcc/lists/val.txt
48
+ memcached: False
49
+ trainer:
50
+ initial_val: True
51
+ print_freq: 100
52
+ val_freq: 10000
53
+ save_freq: 10000
54
+ val_iter: -1
55
+ val_disp_start_iter: 0
56
+ val_disp_end_iter: 16
57
+ loss_record: ['loss_flow']
58
+ tensorboard: False
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/resume.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 main.py \
4
+ --config $work_path/config.yaml --launcher pytorch \
5
+ --load-iter 10000 \
6
+ --resume
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/resume_slurm.sh ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n8 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm \
8
+ --load-iter 10000 \
9
+ --resume
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/train.sh ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 main.py \
4
+ --config $work_path/config.yaml --launcher pytorch
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/train_slurm.sh ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n8 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/validate.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 main.py \
4
+ --config $work_path/config.yaml --launcher pytorch \
5
+ --load-iter 70000 \
6
+ --validate
models/cmp/experiments/rep_learning/alexnet_yfcc_voc_8gpu_140k/validate_slurm.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n8 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py --config $work_path/config.yaml --launcher slurm \
7
+ --load-iter 70000 \
8
+ --validate
models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/config.yaml ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ arch: CMP
3
+ total_iter: 70000
4
+ lr_steps: [40000, 60000]
5
+ lr_mults: [0.1, 0.1]
6
+ lr: 0.1
7
+ optim: SGD
8
+ warmup_lr: []
9
+ warmup_steps: []
10
+ module:
11
+ arch: CMP
12
+ image_encoder: resnet50
13
+ sparse_encoder: shallownet8x
14
+ flow_decoder: MotionDecoderPlain
15
+ skip_layer: False
16
+ img_enc_dim: 256
17
+ sparse_enc_dim: 16
18
+ output_dim: 198
19
+ decoder_combo: [1,2,4]
20
+ pretrained_image_encoder: False
21
+ flow_criterion: "DiscreteLoss"
22
+ nbins: 99
23
+ fmax: 50
24
+ data:
25
+ workers: 2
26
+ batch_size: 10
27
+ batch_size_test: 1
28
+ data_mean: [123.675, 116.28, 103.53] # RGB
29
+ data_div: [58.395, 57.12, 57.375]
30
+ short_size: 416
31
+ crop_size: [320, 320]
32
+ sample_strategy: ['grid', 'watershed']
33
+ sample_bg_ratio: 0.00015625
34
+ nms_ks: 15
35
+ max_num_guide: -1
36
+
37
+ flow_file_type: "jpg"
38
+ image_flow_aug:
39
+ flip: False
40
+ flow_aug:
41
+ reverse: False
42
+ scale: False
43
+ rotate: False
44
+ train_source:
45
+ - data/yfcc/lists/train.txt
46
+ - data/youtube9000/lists/train.txt
47
+ - data/VIP/lists/train.txt
48
+ - data/MPII/lists/train.txt
49
+ val_source:
50
+ - data/yfcc/lists/val.txt
51
+ memcached: False
52
+ trainer:
53
+ initial_val: True
54
+ print_freq: 100
55
+ val_freq: 10000
56
+ save_freq: 10000
57
+ val_iter: -1
58
+ val_disp_start_iter: 0
59
+ val_disp_end_iter: 16
60
+ loss_record: ['loss_flow']
61
+ tensorboard: False
models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/resume.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 \
4
+ --nnodes=2 --node_rank=$1 \
5
+ --master_addr="192.168.1.1" main.py \
6
+ --config $work_path/config.yaml --launcher pytorch \
7
+ --load-iter 10000 \
8
+ --resume
models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/resume_slurm.sh ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n16 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm \
8
+ --load-iter 10000 \
9
+ --resume
models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/train.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 \
4
+ --nnodes=2 --node_rank=$1 \
5
+ --master_addr="192.168.1.1" main.py \
6
+ --config $work_path/config.yaml --launcher pytorch
models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/train_slurm.sh ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n16 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm
models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/validate.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 main.py \
4
+ --config $work_path/config.yaml --launcher pytorch \
5
+ --load-iter 70000 \
6
+ --validate
models/cmp/experiments/rep_learning/resnet50_yfcc+youtube+vip+mpii_lip_16gpu_70k/validate_slurm.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n8 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py --config $work_path/config.yaml --launcher slurm \
7
+ --load-iter 70000 \
8
+ --validate
models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/config.yaml ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ arch: CMP
3
+ total_iter: 42000
4
+ lr_steps: [24000, 36000]
5
+ lr_mults: [0.1, 0.1]
6
+ lr: 0.1
7
+ optim: SGD
8
+ warmup_lr: []
9
+ warmup_steps: []
10
+ module:
11
+ arch: CMP
12
+ image_encoder: resnet50
13
+ sparse_encoder: shallownet8x
14
+ flow_decoder: MotionDecoderPlain
15
+ skip_layer: False
16
+ img_enc_dim: 256
17
+ sparse_enc_dim: 16
18
+ output_dim: 198
19
+ decoder_combo: [1,2,4]
20
+ pretrained_image_encoder: False
21
+ flow_criterion: "DiscreteLoss"
22
+ nbins: 99
23
+ fmax: 50
24
+ data:
25
+ workers: 2
26
+ batch_size: 16
27
+ batch_size_test: 1
28
+ data_mean: [123.675, 116.28, 103.53] # RGB
29
+ data_div: [58.395, 57.12, 57.375]
30
+ short_size: 333
31
+ crop_size: [256, 256]
32
+ sample_strategy: ['grid', 'watershed']
33
+ sample_bg_ratio: 0.00005632
34
+ nms_ks: 49
35
+ max_num_guide: -1
36
+
37
+ flow_file_type: "jpg"
38
+ image_flow_aug:
39
+ flip: False
40
+ flow_aug:
41
+ reverse: False
42
+ scale: False
43
+ rotate: False
44
+ train_source:
45
+ - data/yfcc/lists/train.txt
46
+ val_source:
47
+ - data/yfcc/lists/val.txt
48
+ memcached: False
49
+ trainer:
50
+ initial_val: True
51
+ print_freq: 100
52
+ val_freq: 10000
53
+ save_freq: 10000
54
+ val_iter: -1
55
+ val_disp_start_iter: 0
56
+ val_disp_end_iter: 16
57
+ loss_record: ['loss_flow']
58
+ tensorboard: False
models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/resume.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 \
4
+ --nnodes=2 --node_rank=$1 \
5
+ --master_addr="192.168.1.1" main.py \
6
+ --config $work_path/config.yaml --launcher pytorch \
7
+ --load-iter 10000 \
8
+ --resume
models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/resume_slurm.sh ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n16 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm \
8
+ --load-iter 10000 \
9
+ --resume
models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/train.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 \
4
+ --nnodes=2 --node_rank=$1 \
5
+ --master_addr="192.168.1.1" main.py \
6
+ --config $work_path/config.yaml --launcher pytorch
models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/train_slurm.sh ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n16 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm
models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/validate.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 main.py \
4
+ --config $work_path/config.yaml --launcher pytorch \
5
+ --load-iter 70000 \
6
+ --validate
models/cmp/experiments/rep_learning/resnet50_yfcc_coco_16gpu_42k/validate_slurm.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n8 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py --config $work_path/config.yaml --launcher slurm \
7
+ --load-iter 70000 \
8
+ --validate
models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/config.yaml ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ arch: CMP
3
+ total_iter: 42000
4
+ lr_steps: [24000, 36000]
5
+ lr_mults: [0.1, 0.1]
6
+ lr: 0.1
7
+ optim: SGD
8
+ warmup_lr: []
9
+ warmup_steps: []
10
+ module:
11
+ arch: CMP
12
+ image_encoder: resnet50
13
+ sparse_encoder: shallownet8x
14
+ flow_decoder: MotionDecoderPlain
15
+ skip_layer: False
16
+ img_enc_dim: 256
17
+ sparse_enc_dim: 16
18
+ output_dim: 198
19
+ decoder_combo: [1,2,4]
20
+ pretrained_image_encoder: False
21
+ flow_criterion: "DiscreteLoss"
22
+ nbins: 99
23
+ fmax: 50
24
+ data:
25
+ workers: 2
26
+ batch_size: 10
27
+ batch_size_test: 1
28
+ data_mean: [123.675, 116.28, 103.53] # RGB
29
+ data_div: [58.395, 57.12, 57.375]
30
+ short_size: 416
31
+ crop_size: [320, 320]
32
+ sample_strategy: ['grid', 'watershed']
33
+ sample_bg_ratio: 0.00003629
34
+ nms_ks: 67
35
+ max_num_guide: -1
36
+
37
+ flow_file_type: "jpg"
38
+ image_flow_aug:
39
+ flip: False
40
+ flow_aug:
41
+ reverse: False
42
+ scale: False
43
+ rotate: False
44
+ train_source:
45
+ - data/yfcc/lists/train.txt
46
+ val_source:
47
+ - data/yfcc/lists/val.txt
48
+ memcached: False
49
+ trainer:
50
+ initial_val: True
51
+ print_freq: 100
52
+ val_freq: 10000
53
+ save_freq: 10000
54
+ val_iter: -1
55
+ val_disp_start_iter: 0
56
+ val_disp_end_iter: 16
57
+ loss_record: ['loss_flow']
58
+ tensorboard: False
models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/resume.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 \
4
+ --nnodes=2 --node_rank=$1 \
5
+ --master_addr="192.168.1.1" main.py \
6
+ --config $work_path/config.yaml --launcher pytorch \
7
+ --load-iter 10000 \
8
+ --resume
models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/resume_slurm.sh ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n16 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm \
8
+ --load-iter 10000 \
9
+ --resume
models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/train.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 \
4
+ --nnodes=2 --node_rank=$1 \
5
+ --master_addr="192.168.1.1" main.py \
6
+ --config $work_path/config.yaml --launcher pytorch
models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/train_slurm.sh ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n16 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm
models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/validate.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 main.py \
4
+ --config $work_path/config.yaml --launcher pytorch \
5
+ --load-iter 70000 \
6
+ --validate
models/cmp/experiments/rep_learning/resnet50_yfcc_voc_16gpu_42k/validate_slurm.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n8 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py --config $work_path/config.yaml --launcher slurm \
7
+ --load-iter 70000 \
8
+ --validate
models/cmp/experiments/semiauto_annot/resnet50_vip+mpii_liteflow/checkpoints/ckpt_iter_42000.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd3a385e227c29f89b5c7c6f4c89d356f6022fa7fcfc71ab1bd40e9833048dd6
3
+ size 228465722
models/cmp/experiments/semiauto_annot/resnet50_vip+mpii_liteflow/config.yaml ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ arch: CMP
3
+ total_iter: 42000
4
+ lr_steps: [24000, 36000]
5
+ lr_mults: [0.1, 0.1]
6
+ lr: 0.1
7
+ optim: SGD
8
+ warmup_lr: []
9
+ warmup_steps: []
10
+ module:
11
+ arch: CMP
12
+ image_encoder: resnet50
13
+ sparse_encoder: shallownet8x
14
+ flow_decoder: MotionDecoderSkipLayer
15
+ skip_layer: True
16
+ img_enc_dim: 256
17
+ sparse_enc_dim: 16
18
+ output_dim: 198
19
+ decoder_combo: [1,2,4]
20
+ pretrained_image_encoder: False
21
+ flow_criterion: "DiscreteLoss"
22
+ nbins: 99
23
+ fmax: 50
24
+ data:
25
+ workers: 2
26
+ batch_size: 8
27
+ batch_size_test: 1
28
+ data_mean: [123.675, 116.28, 103.53] # RGB
29
+ data_div: [58.395, 57.12, 57.375]
30
+ short_size: 416
31
+ crop_size: [384, 384]
32
+ sample_strategy: ['grid', 'watershed']
33
+ sample_bg_ratio: 5.74e-5
34
+ nms_ks: 41
35
+ max_num_guide: -1
36
+
37
+ flow_file_type: "jpg"
38
+ image_flow_aug:
39
+ flip: False
40
+ flow_aug:
41
+ reverse: False
42
+ scale: False
43
+ rotate: False
44
+ train_source:
45
+ - data/VIP/lists/train.txt
46
+ - data/MPII/lists/train.txt
47
+ val_source:
48
+ - data/VIP/lists/randval.txt
49
+ memcached: False
50
+ trainer:
51
+ initial_val: True
52
+ print_freq: 100
53
+ val_freq: 5000
54
+ save_freq: 5000
55
+ val_iter: -1
56
+ val_disp_start_iter: 0
57
+ val_disp_end_iter: 16
58
+ loss_record: ['loss_flow']
59
+ tensorboard: True
models/cmp/experiments/semiauto_annot/resnet50_vip+mpii_liteflow/resume.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 main.py \
4
+ --config $work_path/config.yaml --launcher pytorch \
5
+ --load-iter 10000 \
6
+ --resume
models/cmp/experiments/semiauto_annot/resnet50_vip+mpii_liteflow/resume_slurm.sh ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ partition=$1
4
+ GLOG_vmodule=MemcachedClient=-1 srun --mpi=pmi2 -p $partition -n8 \
5
+ --gres=gpu:8 --ntasks-per-node=8 \
6
+ python -u main.py \
7
+ --config $work_path/config.yaml --launcher slurm \
8
+ --load-iter 10000 \
9
+ --resume
models/cmp/experiments/semiauto_annot/resnet50_vip+mpii_liteflow/train.sh ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ #!/bin/bash
2
+ work_path=$(dirname $0)
3
+ python -m torch.distributed.launch --nproc_per_node=8 main.py \
4
+ --config $work_path/config.yaml --launcher pytorch