Spaces:
Runtime error
Runtime error
| MODEL: | |
| META_ARCHITECTURE: "CATSeg" | |
| BACKBONE: | |
| FREEZE_AT: 0 | |
| NAME: "D2SwinTransformer" | |
| SWIN: | |
| EMBED_DIM: 192 | |
| DEPTHS: [2, 2, 18, 2] | |
| NUM_HEADS: [4, 8, 16, 32] | |
| WINDOW_SIZE: 12 | |
| APE: False | |
| DROP_PATH_RATE: 0.3 | |
| PATCH_NORM: True | |
| PRETRAIN_IMG_SIZE: 384 | |
| OUT_FEATURES: ["res2", "res3", "res4"] | |
| WEIGHTS: "swin_large_patch4_window12_384_22k.pkl" | |
| PIXEL_MEAN: [123.675, 116.280, 103.530] | |
| PIXEL_STD: [58.395, 57.120, 57.375] | |
| SEM_SEG_HEAD: | |
| NAME: "OpenVocabHead" | |
| IN_FEATURES: ["res2", "res3", "res4"] | |
| IGNORE_VALUE: 255 | |
| NUM_CLASSES: 171 | |
| TRAIN_CLASS_JSON: "datasets/coco.json" | |
| TEST_CLASS_JSON: "datasets/coco.json" | |
| CLIP_PRETRAINED: "ViT-L/14@336px" | |
| PROMPT_DEPTH: 0 | |
| PROMPT_LENGTH: 0 | |
| TEXT_AFFINITY_DIM: 768 | |
| TEXT_AFFINITY_PROJ_DIM: 128 | |
| APPEARANCE_AFFINITY_DIM: 768 | |
| APPEARANCE_AFFINITY_PROJ_DIM: 128 | |
| DECODER_DIMS: [64, 32] | |
| DECODER_AFFINITY_DIMS: [256, 128] | |
| DECODER_AFFINITY_PROJ_DIMS: [32, 16] | |
| NUM_LAYERS: 4 | |
| NUM_HEADS: 4 | |
| HIDDEN_DIMS: 128 | |
| POOLING_SIZES: [6, 6] | |
| FEATURE_RESOLUTION: [24, 24] | |
| WINDOW_SIZES: 12 | |
| ATTENTION_TYPE: "linear" | |
| CLIP_FINETUNE: "attention" | |
| PROMPT_ENSEMBLE_TYPE: "imagenet" | |
| DATASETS: | |
| TRAIN: ("coco_2017_train_stuff_all_sem_seg",) | |
| TEST: ("coco_2017_test_stuff_all_sem_seg",) | |
| SOLVER: | |
| IMS_PER_BATCH: 4 | |
| BASE_LR: 0.0002 | |
| MAX_ITER: 80000 | |
| WARMUP_FACTOR: 1.0 | |
| WARMUP_ITERS: 0 | |
| WEIGHT_DECAY: 0.0001 | |
| OPTIMIZER: "ADAMW" | |
| LR_SCHEDULER_NAME: "WarmupCosineLR" | |
| BACKBONE_MULTIPLIER: 0.01 | |
| CLIP_MULTIPLIER: 0.01 | |
| CLIP_GRADIENTS: | |
| ENABLED: True | |
| CLIP_TYPE: "full_model" | |
| CLIP_VALUE: 0.01 | |
| NORM_TYPE: 2.0 | |
| INPUT: | |
| MIN_SIZE_TRAIN: (384, ) | |
| MIN_SIZE_TRAIN_SAMPLING: "choice" | |
| MIN_SIZE_TEST: 640 | |
| MAX_SIZE_TEST: 2560 | |
| CROP: | |
| ENABLED: True | |
| TYPE: "absolute" | |
| SIZE: (384, 384) | |
| SINGLE_CATEGORY_MAX_AREA: 1.0 | |
| COLOR_AUG_SSD: True | |
| SIZE_DIVISIBILITY: 384 | |
| FORMAT: "RGB" | |
| DATASET_MAPPER_NAME: "mask_former_semantic" | |
| TEST: | |
| EVAL_PERIOD: 5000 | |
| SLIDING_WINDOW: False | |
| DATALOADER: | |
| FILTER_EMPTY_ANNOTATIONS: True | |
| NUM_WORKERS: 8 | |
| VERSION: 2 | |
| CUDNN_BENCHMARK: True |