# FasterNet-T0.yaml
  # global configs
  # Run-wide settings: checkpoint/pretrained-weight sources, output location,
  # device, and the save / eval / logging cadence.
  Global:
    # null here means no checkpoint and no pretrained weights are specified.
    checkpoints: null
    pretrained_model: null
    output_dir: ./output/
    device: gpu
    save_interval: 1
    eval_during_train: False
    eval_interval: 1
    epochs: 300
    print_batch_step: 10
    use_visualdl: False
    # used for static mode and model export
    # NOTE(review): layout looks like [channels, height, width] - confirm.
    image_shape: [3, 224, 224]
    save_inference_dir: ./inference
  # mixed precision
  AMP:
    use_amp: True
    use_fp16_test: False
    # Initial loss-scaling factor; dynamic loss scaling is enabled below.
    scale_loss: 128.0
    use_dynamic_loss_scaling: True
    use_promote: False
    # O1: mixed fp16, O2: pure fp16
    level: O1
  # model architecture
  Arch:
    name: FasterNet_T0
    # NOTE(review): 1000 classes matches the ILSVRC2012 dataset paths used by
    # the data loaders in this config - keep the two in sync.
    class_num: 1000
  # loss function config for training/eval process
  # Each phase holds a list of one-key mappings: loss name -> its settings.
  Loss:
    Train:
      - CELoss:
          weight: 1.0
          # NOTE(review): presumably the label-smoothing factor - confirm
          # against the CELoss implementation. Not set for Eval.
          epsilon: 0.1
    Eval:
      - CELoss:
          weight: 1.0
  # optimizer and learning-rate schedule
  Optimizer:
    name: AdamW
    beta1: 0.9
    beta2: 0.999
    # Written with an explicit decimal point (same value as 1e-8) so that
    # YAML 1.1 loaders also resolve it to a float instead of a string.
    epsilon: 1.0e-8
    weight_decay: 0.005
    clip_grad: null
    no_weight_decay_name: null
    one_dim_param_no_weight_decay: True
    # Settings of the learning-rate schedule, nested under the optimizer.
    lr:
      name: Cosine
      # NOTE(review): the "8gpu" tag suggests this rate was chosen for an
      # 8-GPU run - confirm before training with a different device count.
      learning_rate: 0.0006  # 8gpu
      warmup_start_lr: 0.000001
      warmup_epoch: 20
      eta_min: 0.00001
  # data loader for train and eval
  # Each phase defines three parts: dataset (source files plus transforms),
  # sampler (batching) and loader (worker settings).
  DataLoader:
    Train:
      dataset:
        name: ImageNetDataset
        image_root: ./dataset/ILSVRC2012/
        cls_label_path: ./dataset/ILSVRC2012/train_list.txt
        # Per-image transforms: list of one-key mappings (op name -> settings).
        transform_ops:
          - DecodeImage:
              backend: pil
              channel_first: False
          - RandCropImage:
              size: 224
              interpolation: bicubic
              backend: pil
          - RandFlipImage:
              flip_code: 1
          - NormalizeImage:
              # Plain string, not a number: YAML does not evaluate the division.
              scale: 1.0/255.0
              mean: [0.485, 0.456, 0.406]
              std: [0.229, 0.224, 0.225]
              order: ''
        # Batch-level transforms.
        # NOTE(review): OpSampler presumably picks one of the listed operators
        # per batch according to each `prob` - confirm against the implementation.
        batch_transform_ops:
          - OpSampler:
              MixupOperator:
                alpha: 0.05
                prob: 0.5
              CutmixOperator:
                alpha: 1.0
                prob: 0.5
      sampler:
        name: DistributedBatchSampler
        batch_size: 64
        drop_last: False
        shuffle: True
      loader:
        num_workers: 12
        use_shared_memory: True
    Eval:
      dataset:
        name: ImageNetDataset
        image_root: ./dataset/ILSVRC2012/
        cls_label_path: ./dataset/ILSVRC2012/val_list.txt
        # Eval uses resize + crop in place of the random crop/flip used in Train.
        transform_ops:
          - DecodeImage:
              backend: pil
              to_np: False
              channel_first: False
          - ResizeImage:
              interpolation: bicubic
              backend: pil
              resize_short: 248
          - CropImage:
              size: 224
          - NormalizeImage:
              # Plain string, not a number: YAML does not evaluate the division.
              scale: 1.0/255.0
              mean: [0.485, 0.456, 0.406]
              std: [0.229, 0.224, 0.225]
              order: 'hwc'
      sampler:
        name: DistributedBatchSampler
        batch_size: 4
        drop_last: False
        shuffle: False
      loader:
        num_workers: 6
        use_shared_memory: True
  # single-image inference: input image(s), preprocessing and post-processing
  Infer:
    infer_imgs: docs/images/inference_deployment/whl_demo.jpg
    batch_size: 10
    # Preprocessing ops: list of one-key mappings (op name -> settings).
    transforms:
      - DecodeImage:
          to_rgb: True
          channel_first: False
      - ResizeImage:
          interpolation: bicubic
          backend: pil
          resize_short: 248
      - CropImage:
          size: 224
      - NormalizeImage:
          # Plain string, not a number: YAML does not evaluate the division.
          scale: 1.0/255.0
          mean: [0.485, 0.456, 0.406]
          std: [0.229, 0.224, 0.225]
          order: ''
      # No settings for this op; explicit null is the same value as a bare key.
      - ToCHWImage: null
    PostProcess:
      name: Topk
      topk: 5
      class_id_map_file: ppcls/utils/imagenet1k_label_list.txt
  # metrics reported per phase; both phases use top-k accuracy for k = 1 and 5
  Metric:
    Train:
      - TopkAcc:
          topk: [1, 5]
    Eval:
      - TopkAcc:
          topk: [1, 5]