# train.py (1.9 KB)

  1. import paddlex as pdx
  2. from paddlex import transforms as T
  3. # 定义训练和验证时的transforms
  4. # API说明:https://github.com/PaddlePaddle/PaddleX/blob/release/2.0-rc/paddlex/cv/transforms/operators.py
  5. train_transforms = T.Compose([
  6. T.RandomResizeByShort(
  7. short_sizes=[640, 672, 704, 736, 768, 800],
  8. max_size=1333,
  9. interp='CUBIC'), T.RandomHorizontalFlip(), T.Normalize(
  10. mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
  11. ])
  12. eval_transforms = T.Compose([
  13. T.ResizeByShort(
  14. short_size=800, max_size=1333, interp='CUBIC'), T.Normalize(
  15. mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
  16. ])
  17. # 定义训练和验证所用的数据集
  18. # API说明:https://github.com/PaddlePaddle/PaddleX/blob/develop/dygraph/paddlex/cv/datasets/coco.py#L26
  19. train_dataset = pdx.datasets.CocoDetection(
  20. data_dir='dataset/JPEGImages',
  21. ann_file='dataset/train.json',
  22. transforms=train_transforms,
  23. shuffle=True)
  24. eval_dataset = pdx.datasets.CocoDetection(
  25. data_dir='dataset/JPEGImages',
  26. ann_file='dataset/val.json',
  27. transforms=eval_transforms)
  28. # 初始化模型,并进行训练
  29. # 可使用VisualDL查看训练指标,参考https://github.com/PaddlePaddle/PaddleX/tree/release/2.0-rc/tutorials/train#visualdl可视化训练指标
  30. num_classes = len(train_dataset.labels)
  31. model = pdx.models.MaskRCNN(
  32. num_classes=num_classes, backbone='ResNet50', with_fpn=True)
  33. # API说明:https://github.com/PaddlePaddle/PaddleX/blob/release/2.0-rc/paddlex/cv/models/detector.py#L155
  34. # 各参数介绍与调整说明:https://paddlex.readthedocs.io/zh_CN/develop/appendix/parameters.html
  35. model.train(
  36. num_epochs=12,
  37. train_dataset=train_dataset,
  38. train_batch_size=1,
  39. eval_dataset=eval_dataset,
  40. learning_rate=0.00125,
  41. lr_decay_epochs=[8, 11],
  42. warmup_steps=10,
  43. warmup_start_lr=0.0,
  44. save_dir='output/mask_rcnn_r50_fpn',
  45. use_vdl=True)