# AVA22_ViT-B.yaml
# Distributed-launch settings, grouped under DDP_CONFIG.
# NOTE(review): the keys below are assumed to be children of this mapping
# (grouping inferred from key names); confirm against the loader's schema.
DDP_CONFIG:
  WORLD_SIZE: 1
  WORLD_RANK: 0
  GPU_WORLD_SIZE: 8
  GPU_WORLD_RANK: 0
  # '{}' is a placeholder; presumably the launcher substitutes a host
  # address before use — verify against the code that reads these keys.
  DIST_URL: 'tcp://{}:11588'
  WORLD_URLS: ["{}"]
  AUTO_RANK_MATCH: True
  DIST_BACKEND: 'nccl'
  GPU: 0
  DISTRIBUTED: True
# Experiment settings, grouped under CONFIG.
# NOTE(review): section membership below is inferred from key names and
# order. TEMP_LEN occurs twice, so the two occurrences must live in different
# mappings (here DATA and MODEL) to avoid a duplicate key. Confirm the layout
# against the loader's schema.
CONFIG:
  EVAL_ONLY: True
  TWO_STREAM: False
  USE_LFB: False
  USE_LOCATION: False

  VAL:
    BATCH_SIZE: 1
    FREQ: 2

  DATA:
    DATASET_NAME: 'ava'
    # '../' paths are relative; presumably resolved against the process
    # working directory — verify.
    LABEL_PATH: '../assets/ava_action_list_v2.1_for_activitynet_2018.pbtxt'
    # '{}' is a placeholder, presumably filled in by the loader — verify
    # what value is substituted.
    ANNO_PATH: '../assets/ava_{}_v22_updated.json'
    # Site-specific placeholder path; point it at the local frames directory.
    DATA_PATH: '/path/to/dataset/AVA/frames/{}/'
    NUM_CLASSES: 80
    MULTIGRID: False
    IMG_SIZE: 256
    IMG_RESHAPE_SIZE: 288
    TEMP_LEN: 16
    FRAME_RATE: 4

  MODEL:
    SINGLE_FRAME: True
    BACKBONE_NAME: ViT
    TUNE_POINT: 0  # [0, 11] (presumably the allowed range — TODO confirm)
    GENERATE_LFB: False
    NAME: 'ava_vit-b'
    ENC_LAYERS: 6
    DEC_LAYERS: 6
    D_MODEL: 256
    NHEAD: 8
    DIM_FEEDFORWARD: 2048
    QUERY_NUM: 15
    NORMALIZE_BEFORE: False
    DROPOUT: 0.1
    DS_RATE: 8
    # NOTE(review): same values as DATA.TEMP_LEN / DATA.FRAME_RATE above;
    # presumably the two pairs must be kept in sync — confirm.
    TEMP_LEN: 16
    SAMPLE_RATE: 4
    PRETRAINED: True
    PRETRAIN_BACKBONE_DIR: "../pretrained_models/backbone/ViT-B_K400_16x4.pth"
    # NOTE(review): the file name mentions 'csn50' although BACKBONE_NAME is
    # ViT — confirm this is the intended checkpoint. Placeholder path.
    PRETRAIN_TRANSFORMER_DIR: "/path/to/ava22_csn50_transformer.pth"
    PRETRAINED_PATH: ""
    POSITION_EMBEDDING: "sine"
    NUM_FEATURE_LEVELS: 4
    NUM_ENC_N_POINTS: 8
    BBOX_EMBED_DIFF_EACH_LAYER: False
    LABEL_SMOOTHING_ALPHA: 0.1

  MATCHER:
    COST_CLASS: 12
    COST_BBOX: 5
    COST_GIOU: 2
    BNY_LOSS: True
    BEFORE: False

  LOSS_COFS:
    MASK_COF: 1
    DICE_COF: 10
    BBOX_COF: 5
    GIOU_COF: 2
    PERSON_COF: 1
    EOS_COF: 0.1
    WEIGHT: 10
    CLIPS_MAX_NORM: 0.1

  LOG:
    # Site-specific placeholder paths; EVAL_DIR repeats the BASE_PATH prefix,
    # so update both together.
    BASE_PATH: '/path/to/save/AVA'
    LOG_DIR: 'tb_log'
    SAVE_DIR: 'checkpoints'
    EVAL_DIR: '/path/to/save/AVA/eval'
    # '{}' placeholders are presumably filled in by the loader — verify.
    RES_DIR: CM_ViT-B_{}-{}/res
    EXP_NAME: CM_ViT-B_{}-{}
    DISPLAY_FREQ: 1000