default.yaml 8.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129
  1. # Ultralytics YOLO 🚀, AGPL-3.0 license
  2. # Default training settings and hyperparameters for medium-augmentation COCO training
  3. task: detect # (str) YOLO task, i.e. detect, segment, classify, pose
  4. mode: train # (str) YOLO mode, i.e. train, val, predict, export, track, benchmark
  5. # 添加一个参数判断是否在 VINNO AI平台训练 ,暂时只支持 detect 和 segment
  6. is_train_on_platform: True # True # False # (bool) 是否在 VINNO AI平台训练
  7. # Train settings -------------------------------------------------------------------------------------------------------
  8. model: # (str, optional) path to model file, i.e. yolov8n.pt, yolov8n.yaml
  9. data: # (str, optional) path to data file, i.e. coco8.yaml
  10. epochs: 100 # (int) number of epochs to train for
  11. time: # (float, optional) number of hours to train for, overrides epochs if supplied
  12. patience: 100 # (int) epochs to wait for no observable improvement for early stopping of training
  13. batch: 16 # (int) number of images per batch (-1 for AutoBatch)
  14. imgsz: 640 # (int | list) input images size as int for train and val modes, or list[h,w] for predict and export modes
  15. save: True # (bool) save train checkpoints and predict results
  16. save_period: -1 # (int) Save checkpoint every x epochs (disabled if < 1)
  17. cache: False # (bool) True/ram, disk or False. Use cache for data loading
  18. device: # (int | str | list, optional) device to run on, i.e. cuda device=0 or device=0,1,2,3 or device=cpu
  19. workers: 8 # (int) number of worker threads for data loading (per RANK if DDP)
  20. project: # (str, optional) project name
  21. name: # (str, optional) experiment name, results saved to 'project/name' directory
  22. exist_ok: False # (bool) whether to overwrite existing experiment
  23. pretrained: True # (bool | str) whether to use a pretrained model (bool) or a model to load weights from (str)
  24. optimizer: auto # (str) optimizer to use, choices=[SGD, Adam, Adamax, AdamW, NAdam, RAdam, RMSProp, auto]
  25. verbose: True # (bool) whether to print verbose output
  26. seed: 0 # (int) random seed for reproducibility
  27. deterministic: True # (bool) whether to enable deterministic mode
  28. single_cls: False # (bool) train multi-class data as single-class
  29. rect: False # (bool) rectangular training if mode='train' or rectangular validation if mode='val'
  30. cos_lr: False # (bool) use cosine learning rate scheduler
  31. close_mosaic: 10 # (int) disable mosaic augmentation for final epochs (0 to disable)
  32. resume: False # (bool) resume training from last checkpoint
  33. amp: True # (bool) Automatic Mixed Precision (AMP) training, choices=[True, False], True runs AMP check
  34. fraction: 1.0 # (float) dataset fraction to train on (default is 1.0, all images in train set)
  35. profile: False # (bool) profile ONNX and TensorRT speeds during training for loggers
  36. freeze: None # (int | list, optional) freeze first n layers, or freeze list of layer indices during training
  37. multi_scale: False # (bool) Whether to use multiscale during training
  38. # Segmentation
  39. overlap_mask: True # (bool) masks should overlap during training (segment train only)
  40. mask_ratio: 4 # (int) mask downsample ratio (segment train only)
  41. # Classification
  42. dropout: 0.0 # (float) use dropout regularization (classify train only)
  43. # Val/Test settings ----------------------------------------------------------------------------------------------------
  44. val: True # (bool) validate/test during training
  45. split: val # (str) dataset split to use for validation, i.e. 'val', 'test' or 'train'
  46. save_json: False # (bool) save results to JSON file
  47. save_hybrid: False # (bool) save hybrid version of labels (labels + additional predictions)
  48. conf: # (float, optional) object confidence threshold for detection (default 0.25 predict, 0.001 val)
  49. iou: 0.7 # (float) intersection over union (IoU) threshold for NMS
  50. max_det: 300 # (int) maximum number of detections per image
  51. half: False # (bool) use half precision (FP16)
  52. dnn: False # (bool) use OpenCV DNN for ONNX inference
  53. plots: True # (bool) save plots and images during train/val
  54. # Predict settings -----------------------------------------------------------------------------------------------------
  55. source: # (str, optional) source directory for images or videos
  56. vid_stride: 1 # (int) video frame-rate stride
  57. stream_buffer: False # (bool) buffer all streaming frames (True) or return the most recent frame (False)
  58. visualize: False # (bool) visualize model features
  59. augment: False # (bool) apply image augmentation to prediction sources
  60. agnostic_nms: False # (bool) class-agnostic NMS
  61. classes: # (int | list[int], optional) filter results by class, i.e. classes=0, or classes=[0,2,3]
  62. retina_masks: False # (bool) use high-resolution segmentation masks
  63. embed: # (list[int], optional) return feature vectors/embeddings from given layers
  64. # Visualize settings ---------------------------------------------------------------------------------------------------
  65. show: False # (bool) show predicted images and videos if environment allows
  66. save_frames: False # (bool) save predicted individual video frames
  67. save_txt: False # (bool) save results as .txt file
  68. save_conf: False # (bool) save results with confidence scores
  69. save_crop: False # (bool) save cropped images with results
  70. show_labels: True # (bool) show prediction labels, i.e. 'person'
  71. show_conf: True # (bool) show prediction confidence, i.e. '0.99'
  72. show_boxes: True # (bool) show prediction boxes
  73. line_width: # (int, optional) line width of the bounding boxes. Scaled to image size if None.
  74. # Export settings ------------------------------------------------------------------------------------------------------
  75. format: torchscript # (str) format to export to, choices at https://docs.ultralytics.com/modes/export/#export-formats
  76. keras: False # (bool) use Kera=s
  77. optimize: False # (bool) TorchScript: optimize for mobile
  78. int8: False # (bool) CoreML/TF INT8 quantization
  79. dynamic: False # (bool) ONNX/TF/TensorRT: dynamic axes
  80. simplify: False # (bool) ONNX: simplify model using `onnxslim`
  81. opset: # (int, optional) ONNX: opset version
  82. workspace: 4 # (int) TensorRT: workspace size (GB)
  83. nms: False # (bool) CoreML: add NMS
  84. # Hyperparameters ------------------------------------------------------------------------------------------------------
  85. lr0: 0.01 # (float) initial learning rate (i.e. SGD=1E-2, Adam=1E-3)
  86. lrf: 0.01 # (float) final learning rate (lr0 * lrf)
  87. momentum: 0.937 # (float) SGD momentum/Adam beta1
  88. weight_decay: 0.0005 # (float) optimizer weight decay 5e-4
  89. warmup_epochs: 3.0 # (float) warmup epochs (fractions ok)
  90. warmup_momentum: 0.8 # (float) warmup initial momentum
  91. warmup_bias_lr: 0.1 # (float) warmup initial bias lr
  92. box: 7.5 # (float) box loss gain
  93. cls: 0.5 # (float) cls loss gain (scale with pixels)
  94. dfl: 1.5 # (float) dfl loss gain
  95. pose: 12.0 # (float) pose loss gain
  96. kobj: 1.0 # (float) keypoint obj loss gain
  97. label_smoothing: 0.0 # (float) label smoothing (fraction)
  98. nbs: 64 # (int) nominal batch size
  99. hsv_h: 0.015 # (float) image HSV-Hue augmentation (fraction)
  100. hsv_s: 0.7 # (float) image HSV-Saturation augmentation (fraction)
  101. hsv_v: 0.4 # (float) image HSV-Value augmentation (fraction)
  102. degrees: 0.0 # (float) image rotation (+/- deg)
  103. translate: 0.1 # (float) image translation (+/- fraction)
  104. scale: 0.5 # (float) image scale (+/- gain)
  105. shear: 0.0 # (float) image shear (+/- deg)
  106. perspective: 0.0 # (float) image perspective (+/- fraction), range 0-0.001
  107. flipud: 0.0 # (float) image flip up-down (probability)
  108. fliplr: 0.5 # (float) image flip left-right (probability)
  109. bgr: 0.0 # (float) image channel BGR (probability)
  110. mosaic: 1.0 # (float) image mosaic (probability)
  111. mixup: 0.0 # (float) image mixup (probability)
  112. copy_paste: 0.0 # (float) segment copy-paste (probability)
  113. auto_augment: randaugment # (str) auto augmentation policy for classification (randaugment, autoaugment, augmix)
  114. erasing: 0.4 # (float) probability of random erasing during classification training (0-0.9), 0 means no erasing, must be less than 1.0.
  115. crop_fraction: 1.0 # (float) image crop fraction for classification (0.1-1), 1.0 means no crop, must be greater than 0.
  116. # Custom config.yaml ---------------------------------------------------------------------------------------------------
  117. cfg: # (str, optional) for overriding defaults.yaml
  118. # Tracker settings ------------------------------------------------------------------------------------------------------
  119. tracker: botsort.yaml # (str) tracker type, choices=[botsort.yaml, bytetrack.yaml]