# PP-OCRv4_server_det.yaml
#
# Training / evaluation configuration for a text-detection model
# (model_type: det, algorithm: DB).
#
# NOTE(review): this file was recovered from a flattened listing in which
# every line carried a list counter and all indentation had been lost. The
# nesting below was reconstructed from key order and sequence markers;
# confirm it against the consuming tool's schema before relying on it.
---
# Run-wide settings: device, schedule length, logging and checkpoint paths.
Global:
  debug: false
  use_gpu: true
  epoch_num: 100
  log_smooth_window: 20
  print_batch_step: 10
  save_model_dir: output
  save_epoch_step: 1
  eval_batch_step:
    - 0
    - 100
  cal_metric_during_train: false
  # Explicit null instead of a bare empty value (same parsed result).
  checkpoints: null
  pretrained_model: https://paddleocr.bj.bcebos.com/pretrained/ch_PP-OCRv4_det_server_trained.pdparams
  save_inference_dir: null
  use_visualdl: false
  distributed: true

# Network definition: backbone -> neck -> head.
Architecture:
  model_type: det
  algorithm: DB
  Transform: null
  Backbone:
    name: PPHGNet_small
    det: true
  Neck:
    name: LKPAN
    out_channels: 256
    intracl: true
  Head:
    name: PFHeadLocal
    k: 50
    mode: "large"

Loss:
  name: DBLoss
  balance_loss: true
  main_loss_type: DiceLoss
  alpha: 5
  beta: 10
  ohem_ratio: 3

Optimizer:
  name: Adam
  beta1: 0.9
  beta2: 0.999
  lr:
    name: Cosine
    learning_rate: 0.001
    warmup_epoch: 2
  regularizer:
    name: L2
    # Written with a mantissa dot so YAML 1.1 loaders also resolve it as a
    # float (a bare 1e-6 is read as a string by such loaders).
    factor: 1.0e-6

PostProcess:
  name: DBPostProcess
  thresh: 0.3
  box_thresh: 0.6
  max_candidates: 1000
  unclip_ratio: 1.5

Metric:
  name: DetMetric
  main_indicator: hmean

# Training data pipeline and loader.
Train:
  dataset:
    name: TextDetDataset
    data_dir: datasets/ICDAR2015
    label_file_list:
      - datasets/ICDAR2015/train.txt
    transforms:
      - DecodeImage:
          img_mode: BGR
          channel_first: false
      - DetLabelEncode: null
      - CopyPaste: null
      - IaaAugment:
          augmenter_args:
            - type: Fliplr
              args:
                p: 0.5
            - type: Affine
              args:
                rotate:
                  - -10
                  - 10
            - type: Resize
              args:
                size:
                  - 0.5
                  - 3
      - EastRandomCropData:
          size:
            - 640
            - 640
          max_tries: 50
          keep_ratio: true
      # NOTE(review): total_epoch (500) differs from Global.epoch_num (100);
      # confirm this is intentional.
      - MakeBorderMap:
          shrink_ratio: 0.4
          thresh_min: 0.3
          thresh_max: 0.7
          total_epoch: 500
      - MakeShrinkMap:
          shrink_ratio: 0.4
          min_text_size: 8
          total_epoch: 500
      - NormalizeImage:
          # A string expression, not a number; presumably evaluated by the
          # consumer - verify. Quoted to make the string type explicit.
          scale: '1./255.'
          mean:
            - 0.485
            - 0.456
            - 0.406
          std:
            - 0.229
            - 0.224
            - 0.225
          order: hwc
      - ToCHWImage: null
      - KeepKeys:
          keep_keys:
            - image
            - threshold_map
            - threshold_mask
            - shrink_map
            - shrink_mask
  loader:
    shuffle: true
    drop_last: false
    batch_size_per_card: 4
    num_workers: 3

# Evaluation data pipeline and loader.
Eval:
  dataset:
    name: TextDetDataset
    data_dir: datasets/ICDAR2015
    label_file_list:
      - datasets/ICDAR2015/val.txt
    transforms:
      - DecodeImage:
          img_mode: BGR
          channel_first: false
      - DetLabelEncode: null
      - DetResizeForTest:
          resize_long: 960
      - NormalizeImage:
          # A string expression, not a number; presumably evaluated by the
          # consumer - verify. Quoted to make the string type explicit.
          scale: '1./255.'
          mean:
            - 0.485
            - 0.456
            - 0.406
          std:
            - 0.229
            - 0.224
            - 0.225
          order: hwc
      - ToCHWImage: null
      - KeepKeys:
          keep_keys:
            - image
            - shape
            - polys
            - ignore_tags
  loader:
    shuffle: false
    drop_last: false
    batch_size_per_card: 1
    num_workers: 0

# NOTE(review): placed at top level because it follows the Eval loader keys
# and does not look like a loader option; the original nesting was lost -
# confirm.
profiler_options: null