# UCF_ViT-B.yaml
# Experiment configuration: ViT backbone, 'ucf' dataset, evaluation-only run.
#
# NOTE(review): the nesting below is reconstructed from the header keys that
# carried no value of their own (DDP_CONFIG, CONFIG, VAL, DATA, MODEL,
# MATCHER, LOSS_COFS, LOG). Without it, TEMP_LEN is a duplicate key in a
# single flat mapping. Confirm the grouping against the code that loads
# this file.

DDP_CONFIG:
  WORLD_SIZE: 1
  WORLD_RANK: 0
  GPU_WORLD_SIZE: 8
  GPU_WORLD_RANK: 0
  # The '{}' placeholders are presumably filled in at launch - TODO confirm.
  DIST_URL: 'tcp://{}:11591'
  WORLD_URLS: ["{}"]
  AUTO_RANK_MATCH: True
  DIST_BACKEND: 'nccl'
  GPU: 0
  DISTRIBUTED: True

CONFIG:
  EVAL_ONLY: True
  TWO_STREAM: False
  USE_LFB: False
  USE_LOCATION: False

  VAL:
    BATCH_SIZE: 1
    FREQ: 2

  DATA:
    DATASET_NAME: 'ucf'
    # Placeholder paths; point these at the local dataset copy.
    ANNO_PATH: '/path/to/dataset/UCF101_v2/UCF101v2-GT.pkl'
    DATA_PATH: '/path/to/dataset/UCF101_v2/rgb-images'
    NUM_CLASSES: 24
    MULTIGRID: False
    IMG_SIZE: 224
    IMG_RESHAPE_SIZE: 256
    # Also set under MODEL; both are 32 in this file.
    TEMP_LEN: 32
    FRAME_RATE: 1

  MODEL:
    SINGLE_FRAME: False
    BACKBONE_NAME: ViT
    TUNE_POINT: 0  # [0, 11] (range noted in the original file)
    TEMPORAL_DS_STRATEGY: decode
    LAST_STRIDE: False
    GENERATE_LFB: False
    NAME: 'ucf_vit-b'
    ENC_LAYERS: 3
    DEC_LAYERS: 3
    D_MODEL: 256
    NHEAD: 8
    DIM_FEEDFORWARD: 2048
    QUERY_NUM: 15
    NORMALIZE_BEFORE: False
    DROPOUT: 0.1
    DS_RATE: 8
    # Also set under DATA; both are 32 in this file.
    TEMP_LEN: 32
    SAMPLE_RATE: 1
    PRETRAINED: True
    # Relative path; presumably resolved against the working directory -
    # TODO confirm.
    PRETRAIN_BACKBONE_DIR: "../pretrained_models/backbone/ViT-B_K400_16x4.pth"
    POSITION_EMBEDDING: "sine"
    NUM_FEATURE_LEVELS: 4
    NUM_ENC_N_POINTS: 8
    BBOX_EMBED_DIFF_EACH_LAYER: False
    LABEL_SMOOTHING_ALPHA: 0.0

  MATCHER:
    COST_CLASS: 4
    COST_BBOX: 5
    COST_GIOU: 2
    BNY_LOSS: True
    BEFORE: False

  LOSS_COFS:
    MASK_COF: 1
    DICE_COF: 4
    BBOX_COF: 5
    GIOU_COF: 2
    PERSON_COF: 3
    EOS_COF: 0.5
    WEIGHT: 10
    CLIPS_MAX_NORM: 0.1

  LOG:
    # NOTE(review): BASE_PATH and EVAL_DIR mention JHMDB although
    # DATA.DATASET_NAME is 'ucf' - confirm these placeholders are intended.
    BASE_PATH: '/path/to/save/JHMDB'
    LOG_DIR: 'tb_log'
    SAVE_DIR: 'checkpoints'
    EVAL_DIR: '/path/to/save/JHMDB/eval'
    # The '{}' placeholders are presumably formatted by the consumer -
    # TODO confirm.
    RES_DIR: 'CM_ViT-B_{}-{}/res'
    EXP_NAME: 'CM_ViT-B_{}-{}'
    DISPLAY_FREQ: 1000