---
# SynthText.yaml: DBNet training configuration using SynthTextDataset.
# NOTE(review): the nesting below was reconstructed from key semantics because
# the indentation had been lost; confirm it against the code that loads it.
name: DBNet
dataset:
  train:
    dataset:
      type: SynthTextDataset  # dataset type
      args:
        data_path: ''  # SynthTextDataset root directory (empty in this file)
        # Data pre-processing pipeline, including augmentation and label
        # generation.
        pre_processes:
          - type: IaaAugment  # apply transforms using imgaug
            args:
              - type: Fliplr
                args:
                  p: 0.5
              - type: Affine
                args:
                  rotate: [-10, 10]
              - type: Resize
                args:
                  size: [0.5, 3]
          - type: EastRandomCropData
            args:
              size: [640, 640]
              max_tries: 50
              keep_ratio: true
          - type: MakeBorderMap
            args:
              shrink_ratio: 0.4
          - type: MakeShrinkMap
            args:
              shrink_ratio: 0.4
              min_text_size: 8
        # Transforms applied to the image.
        transforms:
          - type: ToTensor
            args: {}
          - type: Normalize
            args:
              mean: [0.485, 0.456, 0.406]
              std: [0.229, 0.224, 0.225]
        img_mode: RGB
        # Keys removed from the data dict before the data is returned.
        filter_keys:
          - img_path
          - img_name
          - text_polys
          - texts
          - ignore_tags
          - shape
        # Quoted on purpose: a bare * is an alias sigil and a bare # starts
        # a comment.
        ignore_tags: ['*', '###']
    loader:
      batch_size: 1
      shuffle: true
      num_workers: 0
      collate_fn: ''