-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsvtr_large_train_stn.yml
158 lines (156 loc) · 2.77 KB
/
svtr_large_train_stn.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
# Run-wide settings: device, schedule, logging, checkpoint/output paths and
# the character-set options used for label processing.
Global:
  use_gpu: true
  epoch_num: 500
  log_smooth_window: 20
  print_batch_step: 10
  save_model_dir: ./svtr_large_stn
  save_epoch_step: 400
  # evaluation is run every 5000 iterations after the 0th iteration
  eval_batch_step: [0, 5000]
  cal_metric_during_train: true
  # The three keys below are intentionally unset (explicit null).
  pretrained_model: null
  checkpoints: null
  save_inference_dir: null
  use_visualdl: false
  infer_img: data/DDT_crop/test/
  # settings for data / label processing
  character_dict_path: ./ppocr/utils/EN_symbol_dict.txt
  max_text_length: 25
  infer_mode: false
  use_space_char: false
  save_res_path: ./svtr_large_stn.csv
# Optimizer hyper-parameters plus the nested learning-rate schedule.
Optimizer:
  name: AdamW
  beta1: 0.9
  beta2: 0.99
  epsilon: 8.0e-8
  weight_decay: 0.05
  # One space-separated string (two names), not a YAML list.
  no_weight_decay_name: 'norm pos_embed'
  one_dim_param_no_weight_decay: true
  lr:
    name: Cosine
    learning_rate: 0.0005
    warmup_epoch: 10
# Model definition: Backbone -> Neck -> Head for a recognition model.
# NOTE(review): the file name and save_model_dir mention "stn", but no
# Transform key is present in this section - confirm that is intended.
Architecture:
  model_type: rec
  algorithm: SVTR
  Backbone:
    name: SVTRNet
    # Same height/width as the last two entries of image_shape used by
    # RecResizeImg in the Train and Eval sections.
    img_size: [32, 200]
    out_char_num: 40
    out_channels: 384
    patch_merging: Conv
    # embed_dim, depth, num_heads and local_mixer each have three entries;
    # presumably one per backbone stage - TODO confirm.
    embed_dim: [192, 256, 512]
    depth: [3, 9, 9]
    num_heads: [6, 8, 16]
    # 21 entries in total (10 Local, then 11 Global), which equals
    # sum(depth) = 3 + 9 + 9.
    mixer:
      # 10 x Local
      - Local
      - Local
      - Local
      - Local
      - Local
      - Local
      - Local
      - Local
      - Local
      - Local
      # 11 x Global
      - Global
      - Global
      - Global
      - Global
      - Global
      - Global
      - Global
      - Global
      - Global
      - Global
      - Global
    local_mixer: [[7, 11], [7, 11], [7, 11]]
    prenorm: false
  Neck:
    name: SequenceEncoder
    encoder_type: reshape
  Head:
    name: CTCHead
# Training loss, selected by name.
Loss:
  name: CTCLoss
# Post-processing step applied to model output, selected by name.
PostProcess:
  name: CTCLabelDecode
# Evaluation metric; main_indicator names the headline value to track.
Metric:
  name: RecMetric
  main_indicator: acc
# Training data: label file(s), image root, per-sample transform pipeline
# and data-loader settings.
Train:
  dataset:
    name: SimpleDataSet
    label_file_list:
      - ./data/train.txt
    data_dir: ./data/DDT_crop/train
    # Transforms are listed in order; a null value means the step takes no
    # arguments in this config.
    transforms:
      - DecodeImage:
          img_mode: BGR
          channel_first: false
      - RecAug: null
      - CTCLabelEncode: null
      - RecResizeImg:
          character_dict_path: null
          # Last two entries equal Architecture.Backbone.img_size.
          image_shape: [3, 32, 200]
          padding: false
      - KeepKeys:
          keep_keys: [image, label, length]
  loader:
    shuffle: true
    batch_size_per_card: 128
    drop_last: true
    num_workers: 20
# Evaluation data: same transform pipeline as Train except that RecAug is
# not applied; the loader does not shuffle or drop the last batch.
Eval:
  dataset:
    name: SimpleDataSet
    label_file_list:
      - ./data/val.txt
    # NOTE(review): this is the same directory as Train.dataset.data_dir.
    # Fine if val.txt lists images stored under it - confirm.
    data_dir: ./data/DDT_crop/train
    transforms:
      - DecodeImage:
          img_mode: BGR
          channel_first: false
      - CTCLabelEncode: null
      - RecResizeImg:
          character_dict_path: null
          # Last two entries equal Architecture.Backbone.img_size.
          image_shape: [3, 32, 200]
          padding: false
      - KeepKeys:
          keep_keys: [image, label, length]
  loader:
    shuffle: false
    drop_last: false
    batch_size_per_card: 64
    num_workers: 4
# Top-level key, explicitly null; presumably leaves profiling disabled -
# confirm against the consuming tool.
profiler_options: null