# resnet45_trans_matrn.yml
  # Run-wide settings: device, schedule length, logging cadence, output
  # locations, and the character/label options.
  Global:
    device: gpu
    epoch_num: 20
    log_smooth_window: 20
    print_batch_step: 10
    output_dir: ./output/rec/u14m_filter/resnet45_trans_matrn/
    # NOTE(review): both values look like [start, interval] pairs; confirm
    # against the trainer that consumes them.
    eval_epoch_step: [0, 1]
    eval_batch_step: [0, 500]
    cal_metric_during_train: true
    pretrained_model: null
    # ./openocr_nolang_abinet_lang.pth
    checkpoints: null
    use_tensorboard: false
    infer_img: null
    # for data or label process
    character_dict_path: ./tools/utils/EN_symbol_dict.txt
    max_text_length: 25
    use_space_char: false
    save_res_path: ./output/rec/u14m_filter/predicts_resnet45_trans_matrn.txt
    grad_clip_val: 20
    use_amp: true
  # Optimizer selection and hyper-parameters.
  Optimizer:
    name: Adam
    lr: 0.000133  # 4 GPUs, batch size 128 per GPU
    weight_decay: 0.0
    filter_bias_and_bn: false
  # Learning-rate schedule.
  LRScheduler:
    name: MultiStepLR
    # NOTE(review): presumably epoch indices at which the lr is scaled by
    # `gamma` (epoch_num is 20 elsewhere in this config); confirm against the
    # scheduler implementation.
    milestones: [12, 18]
    gamma: 0.1
  # Model definition: recognition model using the MATRN algorithm, with a
  # ResNet45 encoder and a MATRNDecoder; no transform stage is configured.
  Architecture:
    model_type: rec
    algorithm: MATRN
    Transform: null
    Encoder:
      name: ResNet45
      in_channels: 3
      strides: [2, 1, 2, 1, 1]
    Decoder:
      name: MATRNDecoder
      iter_size: 3
  # Training loss selection and its weighting parameter.
  Loss:
    name: ABINetLoss
    align_weight: 3.0
  # Post-processing step applied to model output.
  PostProcess:
    name: ABINetLabelDecode
  # Evaluation metric; `acc` is the indicator used as the main score.
  Metric:
    name: RecMetric
    main_indicator: acc
    is_filter: true
  # Training data: LMDB dataset, the ordered transform pipeline applied to
  # each sample, and the data-loader settings.
  Train:
    dataset:
      name: LMDBDataSet
      data_dir: ../Union14M-L-LMDB-Filtered
      transforms:
        - DecodeImagePIL:  # load image
            img_mode: RGB
        - PARSeqAugPIL: null
        - ABINetLabelEncode: null
        - RecTVResize:
            image_shape: [32, 128]
            padding: false
        - KeepKeys:
            # dataloader will return list in this order
            keep_keys: ['image', 'label', 'length']
    loader:
      shuffle: true
      batch_size_per_card: 128
      drop_last: true
      num_workers: 4
  # Evaluation data: LMDB dataset, the ordered transform pipeline (no
  # augmentation step is listed here), and the data-loader settings.
  Eval:
    dataset:
      name: LMDBDataSet
      data_dir: ../evaluation
      transforms:
        - DecodeImagePIL:  # load image
            img_mode: RGB
        - ABINetLabelEncode: null
        - RecTVResize:
            image_shape: [32, 128]
            padding: false
        - KeepKeys:
            # dataloader will return list in this order
            keep_keys: ['image', 'label', 'length']
    loader:
      shuffle: false
      drop_last: false
      batch_size_per_card: 256
      num_workers: 2
  87. num_workers: 2