# rec_resnet_stn_bilstm_att.yml
# Global: top-level settings for the run (device, schedule, logging,
# checkpoint/eval cadence, and input/output paths).
Global:
  use_gpu: True
  epoch_num: 400
  log_smooth_window: 20
  print_batch_step: 10
  save_model_dir: ./output/rec/seed
  save_epoch_step: 3
  # evaluation is run every 2000 iterations, starting from iteration 0
  eval_batch_step: [0, 2000]
  cal_metric_during_train: True
  # The next three keys have no value and therefore load as null.
  pretrained_model:
  checkpoints:
  save_inference_dir:
  use_visualdl: False
  infer_img: doc/imgs_words_en/word_10.png
  # for data or label process
  character_dict_path: ppocr/utils/EN_symbol_dict.txt
  max_text_length: 100
  infer_mode: False
  use_space_char: False
  save_res_path: ./output/rec/predicts_seed.txt


# Optimizer: optimizer selection, learning-rate schedule, and regularizer.
Optimizer:
  name: Adadelta
  # NOTE(review): `weight_deacy` looks like a misspelling of `weight_decay`.
  # Left unchanged because renaming it may alter how the optimizer is built
  # (a `regularizer` section is also set below) -- confirm against the consumer.
  weight_deacy: 0.0
  momentum: 0.9
  lr:
    name: Piecewise
    # NOTE(review): three boundaries and three values are given; confirm the
    # scheduler does not expect one more value than boundaries.
    decay_epochs: [4, 5, 8]
    values: [1.0, 0.1, 0.01]
  regularizer:
    name: 'L2'
    factor: 2.0e-05

# Architecture: model definition, split into Transform, Backbone and Head.
Architecture:
  model_type: rec
  algorithm: SEED
  Transform:
    name: STN_ON
    tps_inputsize: [32, 64]
    tps_outputsize: [32, 100]
    num_control_points: 20
    tps_margins: [0.05, 0.05]
    # Plain scalar `none` loads as the string "none", not as YAML null.
    stn_activation: none
  Backbone:
    name: ResNet_ASTER
  Head:
    name: AsterHead  # AttentionHead
    sDim: 512
    attDim: 512
    # Same value as Global.max_text_length (100).
    max_len_labels: 100

# Loss: selects the loss by name; no further parameters are set here.
Loss:
  name: AsterLoss

# PostProcess: selects the decoder by name; no further parameters are set here.
PostProcess:
  name: SEEDLabelDecode

# Metric: evaluation metric by name, with `acc` as the main indicator.
Metric:
  name: RecMetric
  main_indicator: acc
  is_filter: True

# Train: training dataset, its transform pipeline (applied in list order),
# and data-loader settings.
Train:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/data_lmdb_release/training/
    transforms:
      # NOTE(review): path is relative; presumably a fastText model file that
      # must be present in the working directory -- confirm.
      - Fasttext:
          path: "./cc.en.300.bin"
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: False
      - SEEDLabelEncode:  # Class handling label
      - RecResizeImg:
          # No value given, so this loads as null.
          character_dict_path:
          image_shape: [3, 64, 256]
          padding: False
      - KeepKeys:
          # Training keeps an extra 'fast_label' key compared with Eval.
          keep_keys: ['image', 'label', 'length', 'fast_label']  # dataloader will return list in this order
  loader:
    shuffle: True
    batch_size_per_card: 256
    drop_last: True
    num_workers: 6

# Eval: evaluation dataset, its transform pipeline (applied in list order),
# and data-loader settings.
Eval:
  dataset:
    name: LMDBDataSet
    data_dir: ./train_data/data_lmdb_release/evaluation/
    transforms:
      - DecodeImage:  # load image
          img_mode: BGR
          channel_first: False
      - SEEDLabelEncode:  # Class handling label
      - RecResizeImg:
          # No value given, so this loads as null.
          character_dict_path:
          image_shape: [3, 64, 256]
          padding: False
      - KeepKeys:
          keep_keys: ['image', 'label', 'length']  # dataloader will return list in this order
  loader:
    shuffle: False
    # NOTE(review): with drop_last enabled, a final partial batch (fewer than
    # 256 samples) would presumably be skipped during evaluation -- confirm
    # this is intended before trusting reported metrics.
    drop_last: True
    batch_size_per_card: 256
    num_workers: 4