# resnet31_lstm_seed_tps_on.yml
#
# Text-recognition training/evaluation config: algorithm `aster` with the
# Aster_TPS transform, ResNet_ASTER encoder, ASTERDecoder (seed enabled) and
# SEEDLoss.
#
# NOTE(review): the nesting below was rebuilt from a flattened copy of this
# file (line-number prefixes, no indentation). Confirm it against the schema
# the training code expects before relying on it.
---
# Run-wide settings: device, schedule length, logging, output paths.
Global:
  device: gpu
  epoch_num: 20
  log_smooth_window: 20
  print_batch_step: 10
  output_dir: ./output/rec/u14m_filter/resnet31_lstm_seed_tps_on
  eval_epoch_step: [0, 1]
  eval_batch_step: [0, 500]
  cal_metric_during_train: true
  # Left unset on purpose; written as explicit nulls instead of bare keys.
  pretrained_model: null
  checkpoints: null
  use_tensorboard: false
  infer_img: null
  # for data or label process
  character_dict_path: ./tools/utils/EN_symbol_dict.txt
  max_text_length: 25
  use_space_char: false
  # NOTE(review): file name says "aster" while output_dir/Loss say "seed";
  # confirm this path is intended.
  save_res_path: ./output/rec/predicts_aster_tps.txt
  use_amp: true
  grad_clip_val: 1.0

Optimizer:
  name: Adam
  lr: 0.002  # for 1 GPU, batch size 1024 per GPU
  weight_decay: 0.0
  filter_bias_and_bn: false

LRScheduler:
  name: OneCycleLR
  warmup_epoch: 1.5  # pct_start 0.075 * 20 epochs = 1.5 epochs
  cycle_momentum: false

# Model definition: Transform -> Encoder -> Decoder.
Architecture:
  model_type: rec
  algorithm: aster
  Transform:
    name: Aster_TPS
    tps_inputsize: [32, 64]
    tps_outputsize: [32, 128]
  Encoder:
    name: ResNet_ASTER
  Decoder:
    name: ASTERDecoder
    # presumably a decoder option (only place it fits) -- verify nesting
    seed: true

Loss:
  name: SEEDLoss

Metric:
  name: RecMetric
  main_indicator: acc
  is_filter: true

PostProcess:
  name: ARLabelDecode

Train:
  dataset:
    name: LMDBDataSet
    data_dir: ../Union14M-L-LMDB-Filtered
    transforms:
      # load image
      - DecodeImagePIL:
          img_mode: RGB
      - PARSeqAugPIL: null
      # Model file download:
      #   wget https://dl.fbaipublicfiles.com/fasttext/vectors-crawl/cc.en.300.bin.gz
      #   gzip -dk cc.en.300.bin.gz
      - Fasttext:
          path: './cc.en.300.bin'
      # Class handling label
      - ARLabelEncode: null
      - RecTVResize:
          image_shape: [64, 256]
          padding: false
      # dataloader will return list in this order
      - KeepKeys:
          keep_keys: ['image', 'label', 'length', 'fast_label']
  loader:
    shuffle: true
    batch_size_per_card: 1024
    drop_last: true
    num_workers: 4

Eval:
  dataset:
    name: LMDBDataSet
    data_dir: ../evaluation
    transforms:
      # load image
      - DecodeImagePIL:
          img_mode: RGB
      # Class handling label
      - ARLabelEncode: null
      - RecTVResize:
          image_shape: [64, 256]
          padding: false
      # dataloader will return list in this order
      - KeepKeys:
          keep_keys: ['image', 'label', 'length']
  loader:
    shuffle: false
    drop_last: false
    batch_size_per_card: 256
    num_workers: 2