# VDT.yml
# Model definition: meta-architecture, input normalization constants,
# backbone, embedding head and loss settings.
# NOTE(review): this section had lost all leading indentation, which turned
# every nested key into a top-level sibling (MODEL, BACKBONE, HEADS, LOSSES,
# CE and TRI parsed as null; NAME and SCALE were duplicated at one level).
# The nesting below is reconstructed from the section headers; confirm it
# against the consumer's config schema.
MODEL:
  META_ARCHITECTURE: Baseline_multiview
  # Identical mean and std for all three channels.
  PIXEL_MEAN: [127.5, 127.5, 127.5]
  PIXEL_STD: [127.5, 127.5, 127.5]

  BACKBONE:
    NAME: build_multiview_vit_backbone_onebranch
    DEPTH: base
    FEAT_DIM: 768
    PRETRAIN: True
    # Placeholder value; presumably has to be replaced with a real
    # checkpoint path while PRETRAIN is True (TODO confirm).
    PRETRAIN_PATH: XXX
    # Python-style tuple literal; YAML itself reads it as a plain string,
    # any conversion to a tuple is up to the consumer.
    STRIDE_SIZE: (16, 16)
    DROP_PATH_RATIO: 0.1
    DROP_RATIO: 0.0
    ATT_DROP_RATE: 0.0
    INNER_SUB: True

  HEADS:
    NAME: EmbeddingHead
    NORM: BN
    WITH_BNNECK: True
    POOL_LAYER: Identity
    NECK_FEAT: before
    CLS_LAYER: Linear

  LOSSES:
    # Tuple literal naming the two loss terms configured below (CE, TRI).
    NAME: ("CrossEntropyLoss", "TripletLoss",)

    CE:
      EPSILON: 0.
      SCALE: 1.

    # view-related learning
    # NOTE(review): placing the VIEW_* keys directly under LOSSES (rather
    # than under CE) is an assumption; verify against the config schema.
    VIEW_ID: True
    VIEW_OREG: True
    VIEW_LAMBDA: 0.001

    TRI:
      MARGIN: 0.0
      HARD_MINING: True
      NORM_FEAT: False
      SCALE: 1.
# Input settings: train/test image sizes plus three augmentation toggles.
# NOTE(review): indentation was lost here, leaving REA, FLIP and PADDING as
# null and ENABLED repeated three times at one level (last value wins in most
# parsers). Each ENABLED is re-attached to the header it followed.
INPUT:
  # Same two-element size for training and testing.
  # presumably [height, width]; confirm against the consumer.
  SIZE_TRAIN: [256, 128]
  SIZE_TEST: [256, 128]

  REA:
    ENABLED: True
    PROB: 0.5

  FLIP:
    ENABLED: True

  PADDING:
    ENABLED: True
# Data loading settings: training sampler, instances value and worker count.
# NOTE(review): indentation was lost here, so DATALOADER parsed as null and
# its three settings became top-level keys; they are nested again below.
DATALOADER:
  SAMPLER_TRAIN: NaiveIdentitySampler
  # presumably the number of images drawn per identity; confirm.
  NUM_INSTANCE: 4
  NUM_WORKERS: 8
# Optimization settings: mixed precision, optimizer, learning-rate schedule,
# warmup, gradient clipping and checkpoint cadence.
# NOTE(review): indentation was lost here, leaving AMP and CLIP_GRADIENTS as
# null and their ENABLED flags duplicated at one level. Nesting is
# reconstructed from the section headers; confirm that CHECKPOINT_PERIOD
# belongs to SOLVER in the consumer's schema.
SOLVER:
  AMP:
    ENABLED: True

  OPT: SGD
  MAX_EPOCH: 120
  BASE_LR: 0.008
  WEIGHT_DECAY: 0.0001
  IMS_PER_BATCH: 128

  SCHED: CosineAnnealingLR
  ETA_MIN_LR: 0.0000016

  WARMUP_FACTOR: 0.01
  WARMUP_ITERS: 2000

  CLIP_GRADIENTS:
    ENABLED: True

  CHECKPOINT_PERIOD: 5
# Evaluation settings: evaluation period and evaluation batch size.
# NOTE(review): indentation was lost here, so TEST parsed as null and
# IMS_PER_BATCH sat at the top level, where it can collide with any other
# top-level IMS_PER_BATCH key. Both settings are nested under TEST again.
TEST:
  EVAL_PERIOD: 5
  IMS_PER_BATCH: 1024
# Top-level boolean flag, enabled in this config.
# presumably switches on cuDNN benchmark mode in the consumer; confirm.
CUDNN_BENCHMARK: True
# Dataset selection: one training set name and four evaluation set names.
# NOTE(review): indentation was lost here, so DATASETS parsed as null and
# NAMES / TESTS became top-level keys; they are nested again below.
DATASETS:
  # Python-style tuple literals; YAML itself reads them as plain strings.
  NAMES: ("CARGO",)
  TESTS: ("CARGO", "CARGO_GG", "CARGO_AA", "CARGO_AG",)
# Relative path for this experiment.
# presumably where logs and checkpoints are written; confirm with the consumer.
OUTPUT_DIR: logs/CARGO/VDT_base