split.py 1.8 KB

1234567891011121314151617181920212223242526272829303132333435363738394041
  1. #!/usr/bin/env python
  2. # coding: utf-8
  3. # Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
  4. #
  5. # Licensed under the Apache License, Version 2.0 (the "License");
  6. # you may not use this file except in compliance with the License.
  7. # You may obtain a copy of the License at
  8. #
  9. # http://www.apache.org/licenses/LICENSE-2.0
  10. #
  11. # Unless required by applicable law or agreed to in writing, software
  12. # distributed under the License is distributed on an "AS IS" BASIS,
  13. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14. # See the License for the specific language governing permissions and
  15. # limitations under the License.
  16. from .dataset_split.coco_split import split_coco_dataset
  17. from .dataset_split.voc_split import split_voc_dataset
  18. from .dataset_split.imagenet_split import split_imagenet_dataset
  19. from .dataset_split.seg_split import split_seg_dataset
  20. def dataset_split(dataset_dir, dataset_form, val_value, test_value, save_dir):
  21. print(dataset_dir, dataset_form, val_value, test_value, save_dir)
  22. if dataset_form == "coco":
  23. train_num, val_num, test_num = split_coco_dataset(
  24. dataset_dir, val_value, test_value, save_dir)
  25. elif dataset_form == "voc":
  26. train_num, val_num, test_num = split_voc_dataset(
  27. dataset_dir, val_value, test_value, save_dir)
  28. elif dataset_form == "seg":
  29. train_num, val_num, test_num = split_seg_dataset(
  30. dataset_dir, val_value, test_value, save_dir)
  31. elif dataset_form == "imagenet":
  32. train_num, val_num, test_num = split_imagenet_dataset(
  33. dataset_dir, val_value, test_value, save_dir)
  34. print("Dataset Split Done.")
  35. print("Train samples: {}".format(train_num))
  36. print("Eval samples: {}".format(val_num))
  37. print("Test samples: {}".format(test_num))
  38. print("Split file saved in {}".format(save_dir))