Release of PromptSRC with pretrained models.
This commit is contained in:
2
configs/datasets/caltech101.yaml
Normal file
2
configs/datasets/caltech101.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "Caltech101"
|
||||
2
configs/datasets/dtd.yaml
Normal file
2
configs/datasets/dtd.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "DescribableTextures"
|
||||
2
configs/datasets/eurosat.yaml
Normal file
2
configs/datasets/eurosat.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "EuroSAT"
|
||||
2
configs/datasets/fgvc_aircraft.yaml
Normal file
2
configs/datasets/fgvc_aircraft.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "FGVCAircraft"
|
||||
2
configs/datasets/food101.yaml
Normal file
2
configs/datasets/food101.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "Food101"
|
||||
2
configs/datasets/imagenet.yaml
Normal file
2
configs/datasets/imagenet.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "ImageNet"
|
||||
2
configs/datasets/imagenet_a.yaml
Normal file
2
configs/datasets/imagenet_a.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "ImageNetA"
|
||||
2
configs/datasets/imagenet_r.yaml
Normal file
2
configs/datasets/imagenet_r.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "ImageNetR"
|
||||
2
configs/datasets/imagenet_sketch.yaml
Normal file
2
configs/datasets/imagenet_sketch.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "ImageNetSketch"
|
||||
2
configs/datasets/imagenetv2.yaml
Normal file
2
configs/datasets/imagenetv2.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "ImageNetV2"
|
||||
2
configs/datasets/oxford_flowers.yaml
Normal file
2
configs/datasets/oxford_flowers.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "OxfordFlowers"
|
||||
2
configs/datasets/oxford_pets.yaml
Normal file
2
configs/datasets/oxford_pets.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "OxfordPets"
|
||||
2
configs/datasets/stanford_cars.yaml
Normal file
2
configs/datasets/stanford_cars.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "StanfordCars"
|
||||
2
configs/datasets/sun397.yaml
Normal file
2
configs/datasets/sun397.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "SUN397"
|
||||
2
configs/datasets/ucf101.yaml
Normal file
2
configs/datasets/ucf101.yaml
Normal file
@@ -0,0 +1,2 @@
|
||||
DATASET:
|
||||
NAME: "UCF101"
|
||||
35
configs/trainers/CoCoOp/vit_b16_c16_ep10_batch1.yaml
Normal file
35
configs/trainers/CoCoOp/vit_b16_c16_ep10_batch1.yaml
Normal file
@@ -0,0 +1,35 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 1
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 10
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 20
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
|
||||
TRAINER:
|
||||
COCOOP:
|
||||
N_CTX: 16
|
||||
CTX_INIT: ""
|
||||
PREC: "fp16"
|
||||
35
configs/trainers/CoCoOp/vit_b16_c4_ep10_batch1.yaml
Normal file
35
configs/trainers/CoCoOp/vit_b16_c4_ep10_batch1.yaml
Normal file
@@ -0,0 +1,35 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 1
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 10
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 20
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
|
||||
TRAINER:
|
||||
COCOOP:
|
||||
N_CTX: 4
|
||||
CTX_INIT: ""
|
||||
PREC: "fp16"
|
||||
35
configs/trainers/CoCoOp/vit_b16_c4_ep10_batch1_ctxv1.yaml
Normal file
35
configs/trainers/CoCoOp/vit_b16_c4_ep10_batch1_ctxv1.yaml
Normal file
@@ -0,0 +1,35 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 1
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 10
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 20
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
|
||||
TRAINER:
|
||||
COCOOP:
|
||||
N_CTX: 4
|
||||
CTX_INIT: "a photo of a"
|
||||
PREC: "fp16"
|
||||
35
configs/trainers/CoCoOp/vit_b16_c8_ep10_batch1.yaml
Normal file
35
configs/trainers/CoCoOp/vit_b16_c8_ep10_batch1.yaml
Normal file
@@ -0,0 +1,35 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 1
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 10
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 20
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
|
||||
TRAINER:
|
||||
COCOOP:
|
||||
N_CTX: 8
|
||||
CTX_INIT: ""
|
||||
PREC: "fp16"
|
||||
29
configs/trainers/CoOp/rn101.yaml
Normal file
29
configs/trainers/CoOp/rn101.yaml
Normal file
@@ -0,0 +1,29 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 200
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "RN101"
|
||||
29
configs/trainers/CoOp/rn101_ep50.yaml
Normal file
29
configs/trainers/CoOp/rn101_ep50.yaml
Normal file
@@ -0,0 +1,29 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 50
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "RN101"
|
||||
29
configs/trainers/CoOp/rn50.yaml
Normal file
29
configs/trainers/CoOp/rn50.yaml
Normal file
@@ -0,0 +1,29 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 200
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "RN50"
|
||||
33
configs/trainers/CoOp/rn50_ctxv1.yaml
Normal file
33
configs/trainers/CoOp/rn50_ctxv1.yaml
Normal file
@@ -0,0 +1,33 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 200
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "RN50"
|
||||
|
||||
TRAINER:
|
||||
COOP:
|
||||
CTX_INIT: "a photo of a"
|
||||
29
configs/trainers/CoOp/rn50_ep100.yaml
Normal file
29
configs/trainers/CoOp/rn50_ep100.yaml
Normal file
@@ -0,0 +1,29 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 100
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "RN50"
|
||||
29
configs/trainers/CoOp/rn50_ep50.yaml
Normal file
29
configs/trainers/CoOp/rn50_ep50.yaml
Normal file
@@ -0,0 +1,29 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 50
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "RN50"
|
||||
33
configs/trainers/CoOp/rn50_ep50_ctxv1.yaml
Normal file
33
configs/trainers/CoOp/rn50_ep50_ctxv1.yaml
Normal file
@@ -0,0 +1,33 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 50
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "RN50"
|
||||
|
||||
TRAINER:
|
||||
COOP:
|
||||
CTX_INIT: "a photo of a"
|
||||
17
configs/trainers/CoOp/rn50_val.yaml
Normal file
17
configs/trainers/CoOp/rn50_val.yaml
Normal file
@@ -0,0 +1,17 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 200
|
||||
TEST:
|
||||
BATCH_SIZE: 200
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "RN50"
|
||||
29
configs/trainers/CoOp/vit_b16.yaml
Normal file
29
configs/trainers/CoOp/vit_b16.yaml
Normal file
@@ -0,0 +1,29 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 200
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
29
configs/trainers/CoOp/vit_b16_ep100.yaml
Normal file
29
configs/trainers/CoOp/vit_b16_ep100.yaml
Normal file
@@ -0,0 +1,29 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 100
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
29
configs/trainers/CoOp/vit_b16_ep50.yaml
Normal file
29
configs/trainers/CoOp/vit_b16_ep50.yaml
Normal file
@@ -0,0 +1,29 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 50
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
29
configs/trainers/CoOp/vit_b32.yaml
Normal file
29
configs/trainers/CoOp/vit_b32.yaml
Normal file
@@ -0,0 +1,29 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 200
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/32"
|
||||
29
configs/trainers/CoOp/vit_b32_ep50.yaml
Normal file
29
configs/trainers/CoOp/vit_b32_ep50.yaml
Normal file
@@ -0,0 +1,29 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 32
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.002
|
||||
MAX_EPOCH: 50
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 5
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/32"
|
||||
39
configs/trainers/IVLP/vit_b16_c2_ep20_batch4_4+4ctx.yaml
Normal file
39
configs/trainers/IVLP/vit_b16_c2_ep20_batch4_4+4ctx.yaml
Normal file
@@ -0,0 +1,39 @@
|
||||
# Independent Vision Language Prompting
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 4
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.0025
|
||||
MAX_EPOCH: 20
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 20
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
|
||||
TRAINER:
|
||||
IVLP:
|
||||
N_CTX_VISION: 4
|
||||
N_CTX_TEXT: 4
|
||||
CTX_INIT: "a photo of a"
|
||||
PREC: "fp16"
|
||||
PROMPT_DEPTH_VISION: 9
|
||||
PROMPT_DEPTH_TEXT: 9
|
||||
36
configs/trainers/MaPLe/vit_b16_c2_ep5_batch4_2ctx.yaml
Normal file
36
configs/trainers/MaPLe/vit_b16_c2_ep5_batch4_2ctx.yaml
Normal file
@@ -0,0 +1,36 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 4
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.0035
|
||||
MAX_EPOCH: 5
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 20
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
|
||||
TRAINER:
|
||||
MAPLE:
|
||||
N_CTX: 2
|
||||
CTX_INIT: "a photo of a"
|
||||
PREC: "fp16"
|
||||
PROMPT_DEPTH: 9
|
||||
@@ -0,0 +1,36 @@
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 4
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.0026
|
||||
MAX_EPOCH: 2
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 20
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
|
||||
TRAINER:
|
||||
MAPLE:
|
||||
N_CTX: 2
|
||||
CTX_INIT: "a photo of a"
|
||||
PREC: "fp16"
|
||||
PROMPT_DEPTH: 3
|
||||
@@ -0,0 +1,43 @@
|
||||
# PromptSRC: Prompting with Self-regularizing constraints
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 4
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.0025
|
||||
MAX_EPOCH: 20
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 20
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
|
||||
TRAINER:
|
||||
PROMPTSRC:
|
||||
N_CTX_VISION: 4
|
||||
N_CTX_TEXT: 4
|
||||
CTX_INIT: "a photo of a"
|
||||
PREC: "fp16"
|
||||
PROMPT_DEPTH_VISION: 9
|
||||
PROMPT_DEPTH_TEXT: 9
|
||||
TEXT_LOSS_WEIGHT: 25
|
||||
IMAGE_LOSS_WEIGHT: 10
|
||||
GPA_MEAN: 15
|
||||
GPA_STD: 1
|
||||
@@ -0,0 +1,43 @@
|
||||
# PromptSRC: Prompting with Self-regularizing constraints
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 4
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.0025
|
||||
MAX_EPOCH: 20
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 20
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
|
||||
TRAINER:
|
||||
PROMPTSRC:
|
||||
N_CTX_VISION: 4
|
||||
N_CTX_TEXT: 4
|
||||
CTX_INIT: "a photo of a"
|
||||
PREC: "fp16"
|
||||
PROMPT_DEPTH_VISION: 3
|
||||
PROMPT_DEPTH_TEXT: 3
|
||||
TEXT_LOSS_WEIGHT: 25
|
||||
IMAGE_LOSS_WEIGHT: 10
|
||||
GPA_MEAN: 6
|
||||
GPA_STD: 10
|
||||
@@ -0,0 +1,47 @@
|
||||
# PromptSRC: Prompting with Self-regularizing constraints
|
||||
DATALOADER:
|
||||
TRAIN_X:
|
||||
BATCH_SIZE: 4
|
||||
TEST:
|
||||
BATCH_SIZE: 100
|
||||
NUM_WORKERS: 8
|
||||
|
||||
INPUT:
|
||||
SIZE: (224, 224)
|
||||
INTERPOLATION: "bicubic"
|
||||
PIXEL_MEAN: [0.48145466, 0.4578275, 0.40821073]
|
||||
PIXEL_STD: [0.26862954, 0.26130258, 0.27577711]
|
||||
TRANSFORMS: ["random_resized_crop", "random_flip", "normalize"]
|
||||
|
||||
OPTIM:
|
||||
NAME: "sgd"
|
||||
LR: 0.0025
|
||||
MAX_EPOCH: 50
|
||||
LR_SCHEDULER: "cosine"
|
||||
WARMUP_EPOCH: 1
|
||||
WARMUP_TYPE: "constant"
|
||||
WARMUP_CONS_LR: 1e-5
|
||||
|
||||
TRAIN:
|
||||
PRINT_FREQ: 20
|
||||
|
||||
MODEL:
|
||||
BACKBONE:
|
||||
NAME: "ViT-B/16"
|
||||
|
||||
TRAINER:
|
||||
PROMPTSRC:
|
||||
N_CTX_VISION: 4
|
||||
N_CTX_TEXT: 4
|
||||
CTX_INIT: "a photo of a"
|
||||
PREC: "fp16"
|
||||
PROMPT_DEPTH_VISION: 9
|
||||
PROMPT_DEPTH_TEXT: 9
|
||||
TEXT_LOSS_WEIGHT: 25
|
||||
IMAGE_LOSS_WEIGHT: 10
|
||||
# Use the below configuration for: ImageNet, Caltech101, OxfordPets, Food101, UCF101 and SUN397
|
||||
GPA_MEAN: 30
|
||||
GPA_STD: 30
|
||||
# Use the below configuration for: StanfordCars, OxfordFlowers (Flowers102), FGVCAircraft, DescribableTextures (DTD) and EuroSAT
|
||||
# GPA_MEAN: 45
|
||||
# GPA_STD: 5
|
||||
Reference in New Issue
Block a user