-
Notifications
You must be signed in to change notification settings - Fork 597
/
stark_st2_r50_50e_lasot.py
93 lines (90 loc) · 3.06 KB
/
stark_st2_r50_50e_lasot.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
_base_ = ['./stark_st2_r50_50e_got10k.py']
# model setting
model = dict(test_cfg=dict(update_intervals=[300]))
data_root = 'data/'
train_pipeline = [
dict(
type='TridentSampling',
num_search_frames=1,
num_template_frames=2,
max_frame_range=[200],
cls_pos_prob=0.5,
train_cls_head=True),
dict(type='LoadMultiImagesFromFile', to_float32=True),
dict(type='SeqLoadAnnotations', with_bbox=True, with_label=True),
dict(type='SeqGrayAug', prob=0.05),
dict(
type='SeqRandomFlip',
share_params=True,
flip_ratio=0.5,
direction='horizontal'),
dict(
type='SeqBboxJitter',
center_jitter_factor=[0, 0, 4.5],
scale_jitter_factor=[0, 0, 0.5],
crop_size_factor=[2, 2, 5]),
dict(
type='SeqCropLikeStark',
crop_size_factor=[2, 2, 5],
output_size=[128, 128, 320]),
dict(type='SeqBrightnessAug', jitter_range=0.2),
dict(
type='SeqRandomFlip',
share_params=False,
flip_ratio=0.5,
direction='horizontal'),
dict(
type='SeqNormalize',
mean=[123.675, 116.28, 103.53],
std=[58.395, 57.12, 57.375],
to_rgb=True),
dict(type='CheckPadMaskValidity', stride=16),
dict(
type='VideoCollect',
keys=['img', 'gt_bboxes', 'gt_labels', 'padding_mask'],
meta_keys=('valid')),
dict(type='ConcatSameTypeFrames', num_key_frames=2),
dict(type='SeqDefaultFormatBundle', ref_prefix='search')
]
# dataset settings
data = dict(
train=dict(
type='RandomSampleConcatDataset',
dataset_sampling_weights=[1, 1, 1, 1],
dataset_cfgs=[
dict(
type='GOT10kDataset',
ann_file=data_root +
'got10k/annotations/got10k_train_infos.txt',
img_prefix=data_root + 'got10k',
pipeline=train_pipeline,
split='train',
test_mode=False),
dict(
type='LaSOTDataset',
ann_file=data_root + 'lasot/annotations/lasot_train_infos.txt',
img_prefix=data_root + 'lasot/LaSOTBenchmark',
pipeline=train_pipeline,
split='train',
test_mode=False),
dict(
type='TrackingNetDataset',
ann_file=data_root +
'trackingnet/annotations/trackingnet_train_infos.txt',
img_prefix=data_root + 'trackingnet',
pipeline=train_pipeline,
split='train',
test_mode=False),
dict(
type='SOTCocoDataset',
ann_file=data_root +
'coco/annotations/instances_train2017.json',
img_prefix=data_root + 'coco/train2017',
pipeline=train_pipeline,
split='train',
test_mode=False)
]),
test=dict(
type='LaSOTDataset',
ann_file=data_root + 'lasot/annotations/lasot_test_infos.txt',
img_prefix=data_root + 'lasot/LaSOTBenchmark'))