trainer: name: supervised_segmentation train: seed: 42 deterministic: false epochs: 200 batch_size: 4 val_batch_size: 4 accum_steps: 1 amp: true num_workers: 4 pin_memory: true persistent_workers: true prefetch_factor: 2 device: cuda grad_clip: enabled: true max_norm: 1.0 norm_type: 2.0 metrics: task_mode: binary metrics: - name: dice - name: iou loss: name: dicece task_mode: binary params: include_background: true lambda_dice: 0.7 lambda_ce: 0.3 validation: enabled: true interval: 1 threshold: 0.5 early_stopping: true early_stopping_patience: 40 early_stopping_min_delta: 0.0 metrics: task_mode: binary metrics: - name: dice - name: iou dataset: dataset_name: BUSI root: data/BUSI split: train val_split: val image_size: [256, 256] in_channels: 3 num_classes: 1 model: in_channels: 3 encoder_channels: [32, 64, 128, 192] encoder_depths: [2, 2, 2, 2] decoder_channels: [128, 64, 32] stem_channels: 24 bottleneck_depth: 1 global_ratio: 2.0 wavelet_type: haar wavelet_level: 1 use_wavelet_branch: true use_global_branch_stage1: false ssm_d_state: 16 ssm_forward_type: v3 ssm_backend: auto use_frequency_refine: true low_freq_radius_h: 0.25 low_freq_radius_w: 0.25 learnable_low_freq_radius: true guide_mode: affine out_channels: null optimizer: name: adamw lr: 1.0e-4 weight_decay: 0.05 scheduler: name: cosine warmup: name: linear params: start_factor: 0.1 total_iters: 10 params: T_max: 190 eta_min: 1.0e-6 augmentation: train: random_flip: true random_rotate_90: true random_brightness_contrast: true brightness_limit: 0.15 contrast_limit: 0.15 random_gaussian_noise: true gaussian_noise_std: 0.03 val: {} checkpoint: dir: outputs/experiments/supervised/BUSI save: true save_last: true monitor: dice monitor_mode: max resume: null resume_strict: true resume_training: true logging: log_interval: 10 print_training_setup: true use_swanlab: true project: X_SSL_Net experiment_name: xnet_sup_busi swanlab_mode: null