# StarNet-S4.yaml (3.5 KB in the original listing)

  # global configs
  Global:
    # both left as null: no checkpoint or pretrained weights are set here
    checkpoints: null
    pretrained_model: null
    output_dir: ./output/
    device: gpu
    # NOTE(review): save_interval / eval_interval are presumably counted in
    # epochs — confirm against the trainer
    save_interval: 1
    eval_during_train: True
    eval_interval: 1
    epochs: 300
    print_batch_step: 10
    use_visualdl: False
    # used for static mode and model export
    image_shape: [3, 224, 224]
    save_inference_dir: ./inference
  # mixed precision
  AMP:
    use_amp: True
    use_fp16_test: False
    # initial loss-scaling factor; dynamic scaling is enabled just below
    scale_loss: 128.0
    use_dynamic_loss_scaling: True
    use_promote: False
    # O1: mixed fp16, O2: pure fp16
    level: O1
  # model architecture
  Arch:
    name: StarNet_S4
    drop_rate: 0
    drop_path_rate: 0.02
    # matches the 1000-class ImageNet label list referenced elsewhere in this file
    class_num: 1000
  # loss function config for training/eval process
  Loss:
    Train:
      - CELoss:
          weight: 1.0
          # set for training only; presumably the label-smoothing factor — confirm
          epsilon: 0.1
    Eval:
      - CELoss:
          weight: 1.0
  # optimizer and learning-rate schedule
  Optimizer:
    name: AdamW
    beta1: 0.9
    beta2: 0.999
    # Exponent-form floats in this section carry an explicit decimal point so
    # that YAML 1.1 loaders (e.g. PyYAML) resolve them as floats, not strings.
    epsilon: 1.0e-8
    weight_decay: 0.05
    # explicit YAML null; a bare `None` would be loaded as the string "None"
    clip_grad: null
    no_weight_decay_name: null
    one_dim_param_no_weight_decay: True
    lr:
      name: Cosine
      learning_rate: 3.0e-3
      eta_min: 1.0e-5
      warmup_epoch: 5
      warmup_start_lr: 1.0e-6
  # data loader for train and eval
  # NOTE(review): the nesting below is reconstructed from a flattened listing;
  # batch_transform_ops is placed under dataset beside transform_ops — confirm
  # against the code that consumes this file.
  DataLoader:
    Train:
      dataset:
        name: ImageNetDataset
        image_root: ./dataset/ILSVRC2012/
        cls_label_path: ./dataset/ILSVRC2012/train_list.txt
        # per-sample ops, listed in the order they appear in the config
        transform_ops:
          - DecodeImage:
              to_rgb: True
              channel_first: False
          - RandCropImage:
              size: 224
          - RandFlipImage:
              flip_code: 1
          - TimmAutoAugment:
              config_str: rand-m1-mstd0.5-inc1
              interpolation: random
              img_size: 224
          - NormalizeImage:
              # plain scalar, i.e. a string; presumably evaluated by the
              # consumer — confirm
              scale: 1.0/255.0
              mean: [0.485, 0.456, 0.406]
              std: [0.229, 0.224, 0.225]
              order: ''
          - RandomErasing:
              EPSILON: 0.25
              mode: pixel
        # batch-level ops; OpSampler holds two operators with prob 0.5 each
        batch_transform_ops:
          - OpSampler:
              MixupOperator:
                alpha: 0.8
                prob: 0.5
              CutmixOperator:
                alpha: 0.2
                prob: 0.5
      sampler:
        name: DistributedBatchSampler
        batch_size: 256
        drop_last: False
        shuffle: True
      loader:
        num_workers: 4
        use_shared_memory: False
    Eval:
      dataset:
        name: ImageNetDataset
        image_root: ./dataset/ILSVRC2012/
        cls_label_path: ./dataset/ILSVRC2012/val_list.txt
        transform_ops:
          - DecodeImage:
              backend: pil
              channel_first: False
          - ResizeImage:
              interpolation: bicubic
              backend: pil
              resize_short: 256
          - CropImage:
              size: 224
          - NormalizeImage:
              # plain scalar, i.e. a string; presumably evaluated by the
              # consumer — confirm
              scale: 1.0/255.0
              mean: [0.485, 0.456, 0.406]
              std: [0.229, 0.224, 0.225]
              order: 'hwc'
      sampler:
        name: DistributedBatchSampler
        batch_size: 4
        drop_last: False
        shuffle: False
      loader:
        num_workers: 4
        use_shared_memory: False
  # single-image inference settings
  # NOTE(review): nesting is reconstructed from a flattened listing; PostProcess
  # is placed under Infer — confirm against the code that consumes this file.
  Infer:
    infer_imgs: docs/images/inference_deployment/whl_demo.jpg
    batch_size: 10
    transforms:
      - DecodeImage:
          to_rgb: True
          channel_first: False
      - ResizeImage:
          interpolation: bicubic
          backend: pil
          resize_short: 256
      - CropImage:
          size: 224
      - NormalizeImage:
          # plain scalar, i.e. a string; presumably evaluated by the
          # consumer — confirm
          scale: 1.0/255.0
          mean: [0.485, 0.456, 0.406]
          std: [0.229, 0.224, 0.225]
          order: ''
      # no parameters are given for this op (its value is null)
      - ToCHWImage:
    PostProcess:
      name: Topk
      topk: 5
      class_id_map_file: ppcls/utils/imagenet1k_label_list.txt
  # metrics for train and eval: top-k accuracy with k = 1 and k = 5
  Metric:
    Train:
      - TopkAcc:
          topk: [1, 5]
    Eval:
      - TopkAcc:
          topk: [1, 5]