-
Notifications
You must be signed in to change notification settings - Fork 3
/
phoenix-2014t_s2g.yaml
88 lines (87 loc) · 2.42 KB
/
phoenix-2014t_s2g.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
task: S2G
device: cuda
do_translation: False
do_recognition: True
data:
train_label_path: data/Phoenix-2014T/Phoenix-2014T.train
dev_label_path: data/Phoenix-2014T/Phoenix-2014T.dev
test_label_path: data/Phoenix-2014T/Phoenix-2014T.test
max_length: 300
dataset_name: Phoenix-2014T
input_streams: keypoint
level: word #word or char
txt_lowercase: true
max_sent_length: 400
gloss:
gloss2id_file: data/Phoenix-2014T/gloss2ids.pkl
testing:
recognition:
beam_size: 5
translation: {}
training:
wandb: disabled # online or disabled
model_dir: outputs/Phoenix-2014T_SLR
validation:
recognition:
beam_size: 1
translation: {}
optimization:
optimizer: Adam
learning_rate:
default: 1.0e-3
weight_decay: 0.001
betas:
- 0.9
- 0.998
scheduler: cosineannealing
t_max: 100
model:
RecognitionNetwork:
input_type: keypoint
DSTA-Net:
net: [[64, 64, 16, 7, 2], [64, 64, 16, 3, 1],
[64, 128, 32, 3, 1], [128, 128, 32, 3, 1],
[128, 256, 64, 3, 2], [256, 256, 64, 3, 1],
[256, 256, 64, 3, 1], [256, 256, 64, 3, 1],]
body: [0,1,3,5,7,9,91,92,93,94,95,96,97,98,99,100,101,102,103,104,105,106,107,108,109,110,111,2,4,6,8,10,112,113,
114,115,116,117,118,119,120,121,122,123,124,125,126,127,128,129,130,131,132,23,26,29,33,36,39,41,43,46,48,
53,56,59,62,65,68,71,72,73,74,75,76,77,79,80,81]
left: [0,1,3,5,7,9,91,92,93,94,95,96,97,98,99,100,101,102,103,104,105,106,107,108,109,110,111]
right: [0,2,4,6,8,10,112,113,114,115,116,117,118,119,120,121,122,123,124,125,126,127,128,129,130,131,132]
face: [23,26,29,33,36,39,41,43,46,48,53,56,59,62,65,68,71,72,73,74,75,76,77,79,80,81]
mouth: [71,72,73,74,75,76,77,79,80,81]
GlossTokenizer:
gloss2id_file: data/Phoenix-2014T/gloss2ids.pkl
body_visual_head:
input_size: 256
hidden_size: 512
ff_size: 2048
pe: True
ff_kernelsize:
- 3
- 3
fuse_visual_head:
input_size: 1024
hidden_size: 512
ff_size: 2048
pe: True
ff_kernelsize:
- 3
- 3
left_visual_head:
input_size: 512
hidden_size: 512
ff_size: 2048
pe: True
ff_kernelsize:
- 3
- 3
right_visual_head:
input_size: 512
hidden_size: 512
ff_size: 2048
pe: True
ff_kernelsize:
- 3
- 3
cross_distillation: True