# ch_PP-OCRv3_rotnet.yml
  # Global: run-wide settings (device, schedule, logging, input/output paths).
  Global:
    debug: false
    use_gpu: true
    epoch_num: 100
    log_smooth_window: 20
    print_batch_step: 10
    save_model_dir: ./output/rec_ppocr_v3_rotnet
    save_epoch_step: 3
    # NOTE(review): presumably [start_step, interval_in_steps]; confirm
    # against the training loop that consumes this value.
    eval_batch_step: [0, 2000]
    cal_metric_during_train: true
    pretrained_model: null
    checkpoints: null
    save_inference_dir: null
    use_visualdl: false
    infer_img: doc/imgs_words/ch/word_1.jpg
    character_dict_path: ppocr/utils/ppocr_keys_v1.txt
    max_text_length: 25
    infer_mode: false
    use_space_char: true
    # NOTE(review): this path is under ./output/rec, not under save_model_dir
    # (./output/rec_ppocr_v3_rotnet); confirm that is intended.
    save_res_path: ./output/rec/predicts_chinese_lite_v2.0.txt
  # Optimizer: Adam with a Cosine learning-rate schedule and L2 regularization.
  Optimizer:
    name: Adam
    beta1: 0.9
    beta2: 0.999
    # Learning-rate schedule settings.
    lr:
      name: Cosine
      learning_rate: 0.001
    # Weight regularization settings.
    regularizer:
      name: L2
      factor: 1.0e-05
  # Architecture: classification model (model_type cls) built from a
  # MobileNetV1Enhance backbone and a ClsHead; no Transform or Neck is set.
  Architecture:
    model_type: cls
    algorithm: CLS
    Transform: null
    Backbone:
      name: MobileNetV1Enhance
      scale: 0.5
      last_conv_stride: [1, 2]
      last_pool_type: avg
    # Explicit null: same parsed value as the bare `Neck:` key, but unambiguous.
    Neck: null
    Head:
      name: ClsHead
      # NOTE(review): presumably one class per rotation produced by
      # SSLRotateResize; confirm against that transform.
      class_dim: 4
  # Loss: classification loss; `acc` is named as the main indicator.
  Loss:
    name: ClsLoss
    main_indicator: acc
  # PostProcess: post-processing step applied to model output, selected by name.
  PostProcess:
    name: ClsPostProcess
  # Metric: evaluation metric; `acc` is named as the main indicator.
  Metric:
    name: ClsMetric
    main_indicator: acc
  # Train: training dataset, its transform pipeline, and the data loader.
  Train:
    dataset:
      name: SimpleDataSet
      data_dir: ./train_data
      label_file_list:
        - ./train_data/train_list.txt
      # Transforms are listed in order; each entry maps an op name to its
      # arguments. Ops without arguments carry an explicit null (same parsed
      # value as a bare `Op:` key).
      transforms:
        - DecodeImage:
            img_mode: BGR
            channel_first: false
        - BaseDataAugmentation: null
        - RandAugment: null
        - SSLRotateResize:
            image_shape: [3, 48, 320]
        - KeepKeys:
            keep_keys: ["image", "label"]
    loader:
      collate_fn: "SSLRotateCollate"
      shuffle: true
      batch_size_per_card: 32
      drop_last: true
      num_workers: 8
  # Eval: evaluation dataset, its transform pipeline, and the data loader.
  # Lists no augmentation ops, does not shuffle, and keeps the last batch.
  Eval:
    dataset:
      name: SimpleDataSet
      data_dir: ./train_data
      label_file_list:
        - ./train_data/val_list.txt
      # Transforms are listed in order; each entry maps an op name to its
      # arguments.
      transforms:
        - DecodeImage:
            img_mode: BGR
            channel_first: false
        - SSLRotateResize:
            image_shape: [3, 48, 320]
        - KeepKeys:
            keep_keys: ["image", "label"]
    loader:
      collate_fn: "SSLRotateCollate"
      shuffle: false
      drop_last: false
      batch_size_per_card: 64
      num_workers: 8
  # profiler_options: no profiler options are set.
  profiler_options: null