# FasterNet-S.yaml
  # global configs
  Global:
    # Neither a resume checkpoint nor pretrained weights are configured.
    checkpoints: null
    pretrained_model: null
    output_dir: ./output/
    device: gpu
    save_interval: 1
    # Evaluation during training is switched off in this config.
    # NOTE(review): eval_interval presumably only matters when it is on - confirm.
    eval_during_train: False
    eval_interval: 1
    epochs: 300
    print_batch_step: 10
    use_visualdl: False
    # used for static mode and model export
    image_shape: [3, 224, 224]
    save_inference_dir: ./inference
  # mixed precision
  AMP:
    use_amp: True
    use_fp16_test: False
    # Initial loss scale; dynamic loss scaling is enabled below.
    scale_loss: 128.0
    use_dynamic_loss_scaling: True
    use_promote: False
    # O1: mixed fp16, O2: pure fp16
    level: O1
  # model architecture
  Arch:
    name: FasterNet_S
    # Number of output classes; the label paths elsewhere in this file point
    # at ILSVRC2012.
    class_num: 1000
  # loss function config for training/eval process
  Loss:
    # Each entry is a one-key mapping: loss name -> its arguments.
    Train:
      - CELoss:
          weight: 1.0
          # NOTE(review): presumably the label-smoothing factor - confirm.
          epsilon: 0.1
    Eval:
      - CELoss:
          weight: 1.0
  # optimizer and learning-rate schedule
  Optimizer:
    name: AdamW
    beta1: 0.9
    beta2: 0.999
    # Written with an explicit mantissa dot: YAML 1.1 loaders such as PyYAML
    # resolve a bare `1e-8` as the string "1e-8", not as a float.
    epsilon: 1.0e-8
    weight_decay: 0.03
    clip_grad: null
    no_weight_decay_name: null
    one_dim_param_no_weight_decay: True
    lr:
      name: Cosine
      learning_rate: 0.0006
      # Warmup covers the first 20 of the 300 configured epochs.
      warmup_start_lr: 0.000001
      warmup_epoch: 20
      eta_min: 0.00001
  # data loader for train and eval
  # NOTE(review): the nesting below was rebuilt from a flattened copy of this
  # file - confirm against the upstream config before relying on it.
  DataLoader:
    Train:
      dataset:
        name: ImageNetDataset
        image_root: ./dataset/ILSVRC2012/
        cls_label_path: ./dataset/ILSVRC2012/train_list.txt
        # Per-sample ops, listed in the order they appear in the config.
        transform_ops:
          - DecodeImage:
              backend: pil
              channel_first: False
          - RandCropImage:
              size: 224
              interpolation: bicubic
              backend: pil
          - RandFlipImage:
              flip_code: 1
          - TimmAutoAugment:
              config_str: rand-m7-mstd0.5-inc1
          - NormalizeImage:
              # Plain scalar containing '/': YAML loads this as the string
              # "1.0/255.0", not a number.
              # NOTE(review): presumably evaluated by the consumer - confirm.
              scale: 1.0/255.0
              mean: [0.485, 0.456, 0.406]
              std: [0.229, 0.224, 0.225]
              order: ''
        # Per-batch ops: both operators sit under a single OpSampler entry.
        batch_transform_ops:
          - OpSampler:
              MixupOperator:
                alpha: 0.3
                prob: 0.5
              CutmixOperator:
                alpha: 1.0
                prob: 0.5
      sampler:
        name: DistributedBatchSampler
        batch_size: 64
        drop_last: False
        shuffle: True
      loader:
        num_workers: 12
        use_shared_memory: True
    Eval:
      dataset:
        name: ImageNetDataset
        image_root: ./dataset/ILSVRC2012/
        cls_label_path: ./dataset/ILSVRC2012/val_list.txt
        transform_ops:
          - DecodeImage:
              backend: pil
              to_np: False
              channel_first: False
          - ResizeImage:  # RandomResized
              interpolation: bicubic
              backend: pil
              resize_short: 248
          - CropImage:
              size: 224
          - NormalizeImage:
              scale: 1.0/255.0
              mean: [0.485, 0.456, 0.406]
              std: [0.229, 0.224, 0.225]
              # NOTE(review): Train uses order: '' while Eval uses 'hwc' -
              # confirm the difference is intentional.
              order: 'hwc'
      sampler:
        name: DistributedBatchSampler
        # NOTE(review): 4 is far smaller than Train's 64 - confirm intentional.
        batch_size: 4
        drop_last: False
        shuffle: False
      loader:
        num_workers: 6
        use_shared_memory: True
  # single-image inference settings
  Infer:
    infer_imgs: docs/images/inference_deployment/whl_demo.jpg
    batch_size: 10
    # Uses the same resize (248) / crop (224) / normalize values as
    # DataLoader.Eval, followed by ToCHWImage.
    transforms:
      - DecodeImage:
          to_rgb: True
          channel_first: False
      - ResizeImage:
          interpolation: bicubic
          backend: pil
          resize_short: 248
      - CropImage:
          size: 224
      - NormalizeImage:
          # Plain scalar containing '/': loaded as the string "1.0/255.0".
          scale: 1.0/255.0
          mean: [0.485, 0.456, 0.406]
          std: [0.229, 0.224, 0.225]
          order: ''
      # No parameters are configured for this op; null is written explicitly
      # instead of leaving the value bare.
      - ToCHWImage: null
    PostProcess:
      name: Topk
      topk: 5
      class_id_map_file: ppcls/utils/imagenet1k_label_list.txt
  # metrics reported for train and eval: top-1 and top-5 accuracy
  Metric:
    Train:
      - TopkAcc:
          topk: [1, 5]
    Eval:
      - TopkAcc:
          topk: [1, 5]