# Base configs this file builds on, given as relative paths: the Segmenter
# ViT-B/16 mask model definition, the ADE20K dataset settings, the default
# runtime settings and the 160k schedule. The assignments further down
# override selected fields of these bases.
_base_ = [
    '../_base_/models/segmenter_vit-b16_mask.py',
    '../_base_/datasets/ade20k.py', '../_base_/default_runtime.py',
    '../_base_/schedules/schedule_160k.py'
]

# Model overrides: the backbone and the decode head are both set to
# 1024-dim embeddings with 16 attention heads, and the backbone uses
# 24 layers on 640x640 inputs.
model = dict(
    # Relative checkpoint path -- presumably the file has to be placed
    # there before training starts (TODO confirm how it is obtained).
    pretrained='pretrain/vit_large_p16_384.pth',
    backbone=dict(
        type='VisionTransformer',
        img_size=(640, 640),
        embed_dims=1024,
        num_layers=24,
        num_heads=16),
    decode_head=dict(
        type='SegmenterMaskTransformerHead',
        # Same width as the backbone's embed_dims above.
        in_channels=1024,
        channels=1024,
        num_heads=16,
        embed_dims=1024),
    # Slide-mode testing on 640x640 crops; the stride is 32 px smaller
    # than the crop, so neighbouring crops presumably overlap slightly.
    test_cfg=dict(mode='slide', crop_size=(640, 640), stride=(608, 608)))

# Optimizer overrides: only the learning rate and weight decay are set
# here; any other optimizer field is presumably inherited from the base
# schedule config (verify against the merged config).
optimizer = dict(lr=0.001, weight_decay=0.0)

# Normalisation settings shared by the train and test pipelines: a mean
# and std of 127.5 on every channel, with to_rgb enabled.
img_norm_cfg = dict(
    mean=[127.5, 127.5, 127.5], std=[127.5, 127.5, 127.5], to_rgb=True)
# Crop/pad size used by the training pipeline below.
crop_size = (640, 640)
# Training pipeline: load image and annotations, random-ratio resize,
# random crop, random flip, photometric distortion, normalise, pad to
# crop_size, then bundle and collect the image and its segmentation map.
train_pipeline = [
    dict(type='LoadImageFromFile'),
    dict(type='LoadAnnotations', reduce_zero_label=True),
    dict(type='Resize', img_scale=(2048, 640), ratio_range=(0.5, 2.0)),
    dict(type='RandomCrop', crop_size=crop_size, cat_max_ratio=0.75),
    dict(type='RandomFlip', prob=0.5),
    dict(type='PhotoMetricDistortion'),
    dict(type='Normalize', **img_norm_cfg),
    dict(type='Pad', size=crop_size, pad_val=0, seg_pad_val=255),
    dict(type='DefaultFormatBundle'),
    dict(type='Collect', keys=['img', 'gt_semantic_seg'])
]
# Test pipeline: a single scale with flipping turned off. It is reused
# for both the validation and the test split in `data` below.
test_pipeline = [
    dict(type='LoadImageFromFile'),
    dict(
        type='MultiScaleFlipAug',
        img_scale=(2048, 640),
        # Intentionally disabled; presumably enables multi-scale testing
        # when uncommented (TODO confirm):
        # img_ratios=[0.5, 0.75, 1.0, 1.25, 1.5, 1.75],
        flip=False,
        transforms=[
            dict(type='Resize', keep_ratio=True),
            dict(type='RandomFlip'),
            dict(type='Normalize', **img_norm_cfg),
            dict(type='ImageToTensor', keys=['img']),
            dict(type='Collect', keys=['img'])
        ])
]
# Dataset overrides: attach the pipelines defined above to each split.
data = dict(
    # num_gpus: 8 -> batch_size: 8
    samples_per_gpu=1,
    train=dict(pipeline=train_pipeline),
    val=dict(pipeline=test_pipeline),
    test=dict(pipeline=test_pipeline))
# 0 commit comments