YOLOv8-ultralytics-8.2.103部分代码阅读笔记-default.yaml

default.yaml

ultralytics\cfg\default.yaml
python 复制代码
# Ultralytics YOLO 🚀, AGPL-3.0 license
# Default training settings and hyperparameters for medium-augmentation COCO training

task: detect # (str) YOLO task, i.e. detect, segment, classify, pose    (str) YOLO 任务，即 detect , segment , classify , pose 。
mode: train # (str) YOLO mode, i.e. train, val, predict, export, track, benchmark    YOLO 模式，即训练、验证、预测、导出、跟踪、基准。

# Train settings -------------------------------------------------------------------------------------------------------
model: # (str, optional) path to model file, i.e. yolov8n.pt, yolov8n.yaml    （str，可选）模型文件路径，即 yolov8n.pt、yolov8n.yaml。
data: # (str, optional) path to data file, i.e. coco8.yaml    （str，可选）数据文件路径，即 coco8.yaml。
epochs: 100 # (int) number of epochs to train for    （int）训练的 epoch 数。
time: # (float, optional) number of hours to train for, overrides epochs if supplied    （float，可选）训练的小时数，如果提供则覆盖 epoch。
patience: 100 # (int) epochs to wait for no observable improvement for early stopping of training    （int）等待没有明显改进的 epoch，以便提前停止训练。
batch: 16 # (int) number of images per batch (-1 for AutoBatch)    （int）每批图像数（AutoBatch 为 -1）。
imgsz: 640 # (int | list) input images size as int for train and val modes, or list[h,w] for predict and export modes    （int | list）输入图像大小为训练和验证模式的 int，或预测和导出模式的 list[h,w]。
save: True # (bool) save train checkpoints and predict results    （bool）保存训练检查点并预测结果。
save_period: -1 # (int) Save checkpoint every x epochs (disabled if < 1)    （int）每 x 个 epoch 保存检查点（如果 < 则禁用1)。
cache: False # (bool) True/ram, disk or False. Use cache for data loading    (bool) True/ram、磁盘或 False。使用缓存加载数据（布尔值）True/ram、disk或 False。使用缓存加载数据。
device: # (int | str | list, optional) device to run on, i.e. cuda device=0 or device=0,1,2,3 or device=cpu    (int | str | list, 可选) 运行设备，即 cuda device=0 或 device=0,1,2,3 或 device=cpu。
workers: 8 # (int) number of worker threads for data loading (per RANK if DDP)    (int) 数据加载工作线程数（如果是 DDP，则按 RANK 计算）。
project: # (str, optional) project name    (str, 可选) 项目名称。
name: # (str, optional) experiment name, results saved to 'project/name' directory    (str, 可选) 实验名称，结果保存到 'project/name' 目录。
exist_ok: False # (bool) whether to overwrite existing experiment    (bool) 是否覆盖现有实验。
pretrained: True # (bool | str) whether to use a pretrained model (bool) or a model to load weights from (str)    (bool | str) 是否使用预训练模型 (bool) 或从中加载权重的模型 (str)。

optimizer: auto # (str) optimizer to use, choices=[SGD, Adam, Adamax, AdamW, NAdam, RAdam, RMSProp, auto]    (str) 要使用的优化器，choices=[SGD, Adam, Adamax, AdamW, NAdam, RAdam, RMSProp, auto]。
verbose: True # (bool) whether to print verbose output    (bool) 是否打印详细输出。
seed: 0 # (int) random seed for reproducibility    (int) 随机种子，用于可重复性。
deterministic: True # (bool) whether to enable deterministic mode    (bool) 是否启用确定性模式。
single_cls: False # (bool) train multi-class data as single-class    (bool) 将多类数据训练为单类。
rect: False # (bool) rectangular training if mode='train' or rectangular validation if mode='val'    (bool) 如果 mode='train'，则进行矩形训练，如果 mode='val'，则进行矩形验证。
cos_lr: False # (bool) use cosine learning rate scheduler    (bool) 使用余弦学习率调度程序。
close_mosaic: 10 # (int) disable mosaic augmentation for final epochs (0 to disable)    (int) 禁用最终时期的马赛克增强（0 表示禁用）。
resume: False # (bool) resume training from last checkpoint    (bool) 从上一个检查点恢复训练。
amp: True # (bool) Automatic Mixed Precision (AMP) training, choices=[True, False], True runs AMP check    (bool) 自动混合精度 (AMP) 训练，choices=[True, False]，True 运行 AMP 检查。
fraction: 1.0 # (float) dataset fraction to train on (default is 1.0, all images in train set)    (float) 要训练的数据集分数（默认值为 1.0，训练集中的所有图像）。
profile: False # (bool) profile ONNX and TensorRT speeds during training for loggers    (bool) 在训练期间为记录器分析 ONNX 和 TensorRT 速度。
freeze: None # (int | list, optional) freeze first n layers, or freeze list of layer indices during training    （int | list，可选）冻结前 n 层，或在训练期间冻结层索引列表。
multi_scale: False # (bool) Whether to use multiscale during training    （bool）是否在训练期间使用多尺度。
# Segmentation
overlap_mask: True # (bool) masks should overlap during training (segment train only)    (bool) 训练期间掩码应重叠（仅限分段训练）。
mask_ratio: 4 # (int) mask downsample ratio (segment train only)    (int) 掩码下采样率（仅限分段训练）。
# Classification
dropout: 0.0 # (float) use dropout regularization (classify train only)    (float) 使用 dropout 正则化（仅限分类训练）。

# Val/Test settings ----------------------------------------------------------------------------------------------------
val: True # (bool) validate/test during training    (bool) 在训练期间验证/测试。
split: val # (str) dataset split to use for validation, i.e. 'val', 'test' or 'train'    (str) 用于验证的数据集拆分，即"val"、"test"或"train"。
save_json: False # (bool) save results to JSON file    (bool) 将结果保存到 JSON 文件。
save_hybrid: False # (bool) save hybrid version of labels (labels + additional predictions)    (bool) 保存标签的混合版本（标签 + 附加预测）。
conf: # (float, optional) object confidence threshold for detection (default 0.25 predict, 0.001 val)    （float，可选）用于检测的对象置信度阈值（默认 0.25 预测，0.001 val）。
iou: 0.7 # (float) intersection over union (IoU) threshold for NMS    (float) NMS 的交并比 (IoU) 阈值。
max_det: 300 # (int) maximum number of detections per image    (int) 每个图像的最大检测次数。
half: False # (bool) use half precision (FP16)    (bool) 使用半精度（FP16）。
dnn: False # (bool) use OpenCV DNN for ONNX inference    (bool) 使用 OpenCV DNN 进行 ONNX 推理。
plots: True # (bool) save plots and images during train/val    (bool) 在训练/val 期间保存图和图像。

# Predict settings -----------------------------------------------------------------------------------------------------
source: # (str, optional) source directory for images or videos    （str，可选）图像或视频的源目录。
vid_stride: 1 # (int) video frame-rate stride    （int）视频帧速率步幅。
stream_buffer: False # (bool) buffer all streaming frames (True) or return the most recent frame (False)    （bool）缓冲所有流式传输帧（True）或返回最新帧（False）。
visualize: False # (bool) visualize model features    （bool）可视化模型特征。
augment: False # (bool) apply image augmentation to prediction sources    （bool）将图像增强应用于预测源。
agnostic_nms: False # (bool) class-agnostic NMS    （bool）类不可知 NMS。
classes: # (int | list[int], optional) filter results by class, i.e. classes=0, or classes=[0,2,3]    （int | list[int]，可选）按类别过滤结果，即 classes=0 或 classes=[0,2,3]。
retina_masks: False # (bool) use high-resolution segmentation masks    （bool）使用高分辨率分割掩码。
embed: # (list[int], optional) return feature vectors/embeddings from given layers    （list[int]，可选）从给定层返回特征向量/嵌入。

# Visualize settings ---------------------------------------------------------------------------------------------------
show: False # (bool) show predicted images and videos if environment allows    (bool) 如果环境允许，则显示预测的图像和视频。
save_frames: False # (bool) save predicted individual video frames    (bool) 保存预测的单个视频帧。
save_txt: False # (bool) save results as .txt file    (bool) 将结果保存为 .txt 文件。
save_conf: False # (bool) save results with confidence scores    (bool) 保存结果和置信度分数。
save_crop: False # (bool) save cropped images with results    (bool) 保存裁剪的图像和结果。
show_labels: True # (bool) show prediction labels, i.e. 'person'    (bool) 显示预测标签，即"person"。
show_conf: True # (bool) show prediction confidence, i.e. '0.99'    (bool) 显示预测置信度，即"0.99"。
show_boxes: True # (bool) show prediction boxes    (bool) 显示预测框。
line_width: # (int, optional) line width of the bounding boxes. Scaled to image size if None.    (int，可选) 边界框的线宽。如果为 None，则缩放到图像大小。

# Export settings ------------------------------------------------------------------------------------------------------
format: torchscript # (str) format to export to, choices at https://docs.ultralytics.com/modes/export/#export-formats    (str) 导出格式，可在 https://docs.ultralytics.com/modes/export/#export-formats 上选择。
keras: False # (bool) use Kera=s    (bool) 使用 Kera=s。
optimize: False # (bool) TorchScript: optimize for mobile    (bool) TorchScript：针对移动设备进行优化。
int8: False # (bool) CoreML/TF INT8 quantization    (bool) CoreML/TF INT8 量化。
dynamic: False # (bool) ONNX/TF/TensorRT: dynamic axes    (bool) ONNX/TF/TensorRT：动态轴。
simplify: True # (bool) ONNX: simplify model using `onnxslim`    (bool) ONNX：使用 `onnxslim` 简化模型。
opset: # (int, optional) ONNX: opset version    (int，可选) ONNX：opset 版本。
workspace: 4 # (int) TensorRT: workspace size (GB)    (int) TensorRT：工作区大小 (GB)。
nms: False # (bool) CoreML: add NMS    (bool) CoreML：添加 NMS。

# Hyperparameters ------------------------------------------------------------------------------------------------------
lr0: 0.01 # (float) initial learning rate (i.e. SGD=1E-2, Adam=1E-3)    (浮点数) 初始学习率（即 SGD=1E-2，Adam=1E-3）。
lrf: 0.01 # (float) final learning rate (lr0 * lrf)    (浮点数) 最终学习率 (lr0 * lrf)。
momentum: 0.937 # (float) SGD momentum/Adam beta1    (浮点数) SGD 动量/Adam beta1。
weight_decay: 0.0005 # (float) optimizer weight decay 5e-4    (浮点数) 优化器权重衰减 5e-4。
warmup_epochs: 3.0 # (float) warmup epochs (fractions ok)    (浮点数) 预热时期（可以分数）。
warmup_momentum: 0.8 # (float) warmup initial momentum    (浮点数) 预热初始动量。
warmup_bias_lr: 0.1 # (float) warmup initial bias lr    (浮点数) 预热初始偏差 lr。
box: 7.5 # (float) box loss gain    (浮点数) 框损失增益。
cls: 0.5 # (float) cls loss gain (scale with pixels)    (浮点数) cls 损失增益（按像素缩放）。
dfl: 1.5 # (float) dfl loss gain    (浮点数) dfl 损失增益。
pose: 12.0 # (float) pose loss gain    (浮点) 姿势损失增益。
kobj: 1.0 # (float) keypoint obj loss gain    (浮点) 关键点对象损失增益。
label_smoothing: 0.0 # (float) label smoothing (fraction)    (浮点) 标签平滑 (分数)。
nbs: 64 # (int) nominal batch size    (整数) 名义批量大小。
hsv_h: 0.015 # (float) image HSV-Hue augmentation (fraction)    (浮点) 图像 HSV-色调增强 (分数)。
hsv_s: 0.7 # (float) image HSV-Saturation augmentation (fraction)    (浮点) 图像 HSV-饱和度增强 (分数)。
hsv_v: 0.4 # (float) image HSV-Value augmentation (fraction)    (浮点) 图像 HSV-值增强 (分数)。
degrees: 0.0 # (float) image rotation (+/- deg)    (浮点) 图像旋转 (+/- 度)。
translate: 0.1 # (float) image translation (+/- fraction)    (浮点) 图像平移 (+/- 分数)。
scale: 0.5 # (float) image scale (+/- gain)    (浮点) 图像比例 (+/- 增益)。
shear: 0.0 # (float) image shear (+/- deg)    (浮点) 图像剪切 (+/- 度)。
perspective: 0.0 # (float) image perspective (+/- fraction), range 0-0.001    (浮点) 图像透视 (+/- 分数)，范围0-0.001。
flipud: 0.0 # (float) image flip up-down (probability)    (浮点数) 图像上下翻转 (概率)。
fliplr: 0.5 # (float) image flip left-right (probability)    (浮点数) 图像左右翻转 (概率)。
bgr: 0.0 # (float) image channel BGR (probability)    (浮点数) 图像通道 BGR (概率)。
mosaic: 1.0 # (float) image mosaic (probability)    (浮点数) 图像马赛克 (概率)。
mixup: 0.0 # (float) image mixup (probability)    (浮点数) 图像混合 (概率)。
copy_paste: 0.0 # (float) segment copy-paste (probability)    (浮点数) 片段复制粘贴 (概率)。
auto_augment: randaugment # (str) auto augmentation policy for classification (randaugment, autoaugment, augmix)    (str) 分类的自动增强策略 (randaugment, autoaugment, augmix)。
erasing: 0.4 # (float) probability of random erasing during classification training (0-0.9), 0 means no erasing, must be less than 1.0.    (浮点数) 分类训练期间随机擦除的概率 (0-0.9)，0 表示不擦除，必须小于 1.0。
crop_fraction: 1.0 # (float) image crop fraction for classification (0.1-1), 1.0 means no crop, must be greater than 0.    （浮点数）用于分类的图像裁剪分数（0.1-1），1.0 表示无裁剪，必须大于 0。

# Custom config.yaml ---------------------------------------------------------------------------------------------------
cfg: # (str, optional) for overriding defaults.yaml    (str，可选) 用于覆盖 defaults.yaml。

# Tracker settings ------------------------------------------------------------------------------------------------------
tracker: botsort.yaml # (str) tracker type, choices=[botsort.yaml, bytetrack.yaml]    (str) 跟踪器类型，choices=[botsort.yaml, bytetrack.yaml]。