# PP-OCRv4_mobile_det.yaml (3.1 KB)

  # Global: run-wide settings -- device selection, epoch count, logging and
  # checkpoint cadence, and model input/output locations.
  Global:
    debug: false
    use_gpu: true
    epoch_num: 100
    log_smooth_window: 20
    print_batch_step: 10
    save_model_dir: output
    save_epoch_step: 1
    # Two-element list; presumably [start_iteration, interval] -- confirm
    # against the training tool's documentation.
    eval_batch_step: [0, 100]
    cal_metric_during_train: false
    # Explicit null (a bare `checkpoints:` also loads as null, but is easy to
    # misread as a forgotten value); matches `save_inference_dir: null` below.
    checkpoints: null
    pretrained_model: https://paddleocr.bj.bcebos.com/pretrained/ch_PP-OCRv4_det_trained.pdparams
    save_inference_dir: null
    use_visualdl: false
    distributed: true
  # Architecture: detection model of type `det` using the DB algorithm,
  # assembled from a Backbone, a Neck and a Head; no Transform stage is set.
  # Booleans are written in canonical lowercase (`true`), consistent with the
  # other sections of this file.
  Architecture:
    model_type: det
    algorithm: DB
    Transform: null
    Backbone:
      name: PPLCNetV3
      scale: 0.75
      det: true
    Neck:
      name: RSEFPN
      out_channels: 96
      shortcut: true
    Head:
      name: DBHead
      k: 50
      fix_nan: true
  # Loss: DBLoss settings -- main loss type, alpha/beta coefficients and the
  # OHEM ratio used when balance_loss is enabled (presumably; confirm against
  # the DBLoss implementation).
  Loss:
    name: DBLoss
    balance_loss: true
    main_loss_type: DiceLoss
    alpha: 5
    beta: 10
    ohem_ratio: 3
  # Optimizer: Adam with a Cosine learning-rate schedule (2 warm-up epochs)
  # and an L2 regularizer.
  Optimizer:
    name: Adam
    beta1: 0.9
    beta2: 0.999
    lr:
      name: Cosine
      learning_rate: 0.001
      warmup_epoch: 2
    regularizer:
      name: L2
      # Written as 1.0e-6 rather than 1e-6: YAML 1.1 loaders (e.g. PyYAML)
      # only recognise exponent-form floats that contain a decimal point and
      # would otherwise load the value as the string "1e-6".
      factor: 1.0e-6
  # PostProcess: DBPostProcess thresholds, candidate cap and unclip ratio
  # applied to the model output.
  PostProcess:
    name: DBPostProcess
    thresh: 0.3
    box_thresh: 0.6
    max_candidates: 1000
    unclip_ratio: 1.5
  # Metric: evaluation uses DetMetric; `hmean` is the main indicator.
  Metric:
    name: DetMetric
    main_indicator: hmean
  # Train: training dataset (ICDAR2015 label file), the ordered transform
  # pipeline applied to each sample, and the data-loader settings.
  Train:
    dataset:
      name: TextDetDataset
      data_dir: datasets/ICDAR2015
      label_file_list:
        - datasets/ICDAR2015/train.txt
      # Transforms are a sequence, so their order here is significant.
      transforms:
        - DecodeImage:
            img_mode: BGR
            channel_first: false
        - DetLabelEncode: null
        - CopyPaste: null
        # Three augmenters configured through IaaAugment: Fliplr, Affine
        # (rotate range) and Resize (size range).
        - IaaAugment:
            augmenter_args:
              - type: Fliplr
                args:
                  p: 0.5
              - type: Affine
                args:
                  rotate: [-10, 10]
              - type: Resize
                args:
                  size: [0.5, 3]
        - EastRandomCropData:
            size: [640, 640]
            max_tries: 50
            keep_ratio: true
        # NOTE(review): total_epoch (500) in the two Make*Map transforms
        # differs from Global.epoch_num (100) -- confirm this is intended.
        - MakeBorderMap:
            shrink_ratio: 0.4
            thresh_min: 0.3
            thresh_max: 0.7
            total_epoch: 500
        - MakeShrinkMap:
            shrink_ratio: 0.4
            min_text_size: 8
            total_epoch: 500
        - NormalizeImage:
            # `1./255.` is not a YAML number, so it loads as a string;
            # presumably evaluated by the consumer -- confirm.
            scale: 1./255.
            mean: [0.485, 0.456, 0.406]
            std: [0.229, 0.224, 0.225]
            order: hwc
        - ToCHWImage: null
        # Fields retained in each sample after the pipeline has run.
        - KeepKeys:
            keep_keys:
              - image
              - threshold_map
              - threshold_mask
              - shrink_map
              - shrink_mask
    loader:
      shuffle: true
      drop_last: false
      batch_size_per_card: 8
      num_workers: 3
  # Eval: validation dataset (ICDAR2015 val label file), its transform
  # pipeline (no augmentation entries; resize by long side instead) and the
  # data-loader settings.
  Eval:
    dataset:
      name: TextDetDataset
      data_dir: datasets/ICDAR2015
      label_file_list:
        - datasets/ICDAR2015/val.txt
      # Transforms are a sequence, so their order here is significant.
      transforms:
        - DecodeImage:
            img_mode: BGR
            channel_first: false
        - DetLabelEncode: null
        - DetResizeForTest:
            resize_long: 960
        - NormalizeImage:
            # `1./255.` is not a YAML number, so it loads as a string;
            # presumably evaluated by the consumer -- confirm.
            scale: 1./255.
            mean: [0.485, 0.456, 0.406]
            std: [0.229, 0.224, 0.225]
            order: hwc
        - ToCHWImage: null
        # Fields retained in each sample after the pipeline has run.
        - KeepKeys:
            keep_keys:
              - image
              - shape
              - polys
              - ignore_tags
    loader:
      shuffle: false
      drop_last: false
      batch_size_per_card: 1
      num_workers: 0
  # No profiler options are set.
  profiler_options: null