# Source path: ControlNet-v1-1-Annotators-cpu/annotator/oneformer/configs/coco/Base-COCO-UnifiedSegmentation.yaml
# Base configuration for unified (panoptic / instance / semantic) segmentation
# on COCO with a ResNet-50 backbone.
#
# NOTE(review): this file was recovered from a flattened copy in which every
# line sat at column 0 and carried a trailing " | |" artifact. The nesting
# below was rebuilt from the section headers and the usual detectron2 config
# layout -- verify against the upstream file before relying on it.
#
# Parenthesised values such as ("name",) and (a, b) are plain YAML strings;
# presumably the config loader evaluates them as Python tuples -- confirm.
MODEL:
  BACKBONE:
    FREEZE_AT: 0
    NAME: "build_resnet_backbone"
  WEIGHTS: "detectron2://ImageNetPretrained/torchvision/R-50.pkl"
  PIXEL_MEAN: [123.675, 116.280, 103.530]
  PIXEL_STD: [58.395, 57.120, 57.375]
  RESNETS:
    DEPTH: 50
    STEM_TYPE: "basic"  # not used
    STEM_OUT_CHANNELS: 64
    STRIDE_IN_1X1: False
    OUT_FEATURES: ["res2", "res3", "res4", "res5"]
    # NORM: "SyncBN"
    RES5_MULTI_GRID: [1, 1, 1]  # not used

DATASETS:
  TRAIN: ("coco_2017_train_panoptic_with_sem_seg",)
  # to evaluate instance and semantic performance as well
  TEST_PANOPTIC: ("coco_2017_val_panoptic_with_sem_seg",)
  TEST_INSTANCE: ("coco_2017_val",)
  TEST_SEMANTIC: ("coco_2017_val_panoptic_with_sem_seg",)

SOLVER:
  IMS_PER_BATCH: 16
  BASE_LR: 0.0001
  STEPS: (327778, 355092)
  MAX_ITER: 368750
  WARMUP_FACTOR: 1.0
  WARMUP_ITERS: 10
  WEIGHT_DECAY: 0.05
  OPTIMIZER: "ADAMW"
  BACKBONE_MULTIPLIER: 0.1
  CLIP_GRADIENTS:
    ENABLED: True
    CLIP_TYPE: "full_model"
    CLIP_VALUE: 0.01
    NORM_TYPE: 2.0
  AMP:
    ENABLED: True

INPUT:
  IMAGE_SIZE: 1024
  MIN_SCALE: 0.1
  MAX_SCALE: 2.0
  FORMAT: "RGB"
  DATASET_MAPPER_NAME: "coco_unified_lsj"
  MAX_SEQ_LEN: 77
  TASK_SEQ_LEN: 77
  # NOTE(review): the two values sum to 0.99, not 1.0; they may be cumulative
  # thresholds rather than independent probabilities -- confirm in the
  # dataset mapper that reads them.
  TASK_PROB:
    SEMANTIC: 0.33
    INSTANCE: 0.66

TEST:
  EVAL_PERIOD: 5000

DATALOADER:
  FILTER_EMPTY_ANNOTATIONS: True
  NUM_WORKERS: 4

VERSION: 2