1 месяц назад · 92bf26dc75
--- a/configs/segmentation/train_sup_us_template.yaml
+++ b/configs/segmentation/train_sup_us_template.yaml
@@ -3,9 +3,11 @@ trainer:
 
															 train:
														
 
															   seed: 42
														
 
															+  deterministic: false
														
 
															   epochs: 200
														
 
															   batch_size: 4
														
 
															   val_batch_size: 4
														
 
															+  accum_steps: 1
														
 
															   amp: true
														
 
															   num_workers: 4
														
 
															   pin_memory: true
														
@@ -30,6 +32,14 @@ metrics:
 
															     - name: dice
														
 
															     - name: iou
														
 
															+loss:
														
 
															+  name: dicece
														
 
															+  task_mode: binary
														
 
															+  params:
														
 
															+    include_background: true
														
 
															+    lambda_dice: 0.7
														
 
															+    lambda_ce: 0.3
														
 
															+
														
 
															 validation:
														
 
															   enabled: true
														
 
															   interval: 1
														
@@ -59,11 +69,6 @@ model:
 
															   model_name: swinv2_tiny_patch4_window8_256
														
 
															   load_weights: false
														
 
															   decoder_channels: [384, 192, 96, 96]
														
 
															-  fwta_wavelet: haar
														
 
															-  fwta_level: 1
														
 
															-  fwta_sigma_ratio: 0.35
														
 
															-  fwta_tau_fourier: 0.15
														
 
															-  fwta_gate_temperature: 1.0
														
 
															   use_multiscale_features: true
														
 
															   include_patch_embed: true
														
@@ -83,6 +88,17 @@ scheduler:
 
															     T_max: 190
														
 
															     eta_min: 1.0e-6
														
 
															+augmentation:
														
 
															+  train:
														
 
															+    random_flip: true
														
 
															+    random_rotate_90: true
														
 
															+    random_brightness_contrast: true
														
 
															+    brightness_limit: 0.15
														
 
															+    contrast_limit: 0.15
														
 
															+    random_gaussian_noise: true
														
 
															+    gaussian_noise_std: 0.03
														
 
															+  val: {}
														
 
															+
														
 
															 checkpoint:
														
 
															   dir: outputs/supervised_segmentation/train_sup_us_template
														
 
															   save: true
														
--- a/configs/segmentation/us_exp_sup_busi.yaml
+++ b/configs/segmentation/us_exp_sup_busi.yaml
@@ -3,9 +3,11 @@ trainer:
 
															 train:
														
 
															   seed: 42
														
 
															+  deterministic: false
														
 
															   epochs: 200
														
 
															   batch_size: 4
														
 
															   val_batch_size: 4
														
 
															+  accum_steps: 1
														
 
															   amp: true
														
 
															   num_workers: 4
														
 
															   pin_memory: true
														
@@ -23,6 +25,14 @@ metrics:
 
															     - name: dice
														
 
															     - name: iou
														
 
															+loss:
														
 
															+  name: dicece
														
 
															+  task_mode: binary
														
 
															+  params:
														
 
															+    include_background: true
														
 
															+    lambda_dice: 0.7
														
 
															+    lambda_ce: 0.3
														
 
															+
														
 
															 validation:
														
 
															   enabled: true
														
 
															   interval: 1
														
@@ -49,11 +59,6 @@ model:
 
															   model_name: swinv2_tiny_patch4_window8_256
														
 
															   load_weights: false
														
 
															   decoder_channels: [384, 192, 96, 96]
														
 
															-  fwta_wavelet: haar
														
 
															-  fwta_level: 1
														
 
															-  fwta_sigma_ratio: 0.35
														
 
															-  fwta_tau_fourier: 0.15
														
 
															-  fwta_gate_temperature: 1.0
														
 
															   use_multiscale_features: true
														
 
															   include_patch_embed: true
														
@@ -73,6 +78,17 @@ scheduler:
 
															     T_max: 190
														
 
															     eta_min: 1.0e-6
														
 
															+augmentation:
														
 
															+  train:
														
 
															+    random_flip: true
														
 
															+    random_rotate_90: true
														
 
															+    random_brightness_contrast: true
														
 
															+    brightness_limit: 0.15
														
 
															+    contrast_limit: 0.15
														
 
															+    random_gaussian_noise: true
														
 
															+    gaussian_noise_std: 0.03
														
 
															+  val: {}
														
 
															+
														
 
															 checkpoint:
														
 
															   dir: outputs/experiments/supervised/BUSI
														
 
															   save: true
														
--- a/configs/segmentation/us_exp_sup_busi_ablation.yaml
+++ b/configs/segmentation/us_exp_sup_busi_ablation.yaml
@@ -0,0 +1,108 @@
 
															+trainer:
														
 
															+  name: supervised_segmentation
														
 
															+
														
 
															+train:
														
 
															+  seed: 42
														
 
															+  deterministic: false
														
 
															+  epochs: 200
														
 
															+  batch_size: 4
														
 
															+  val_batch_size: 4
														
 
															+  accum_steps: 1
														
 
															+  amp: true
														
 
															+  num_workers: 4
														
 
															+  pin_memory: true
														
 
															+  persistent_workers: true
														
 
															+  prefetch_factor: 2
														
 
															+  device: cuda
														
 
															+  grad_clip:
														
 
															+    enabled: true
														
 
															+    max_norm: 1.0
														
 
															+    norm_type: 2.0
														
 
															+
														
 
															+metrics:
														
 
															+  task_mode: binary
														
 
															+  metrics:
														
 
															+    - name: dice
														
 
															+    - name: iou
														
 
															+
														
 
															+loss:
														
 
															+  name: dicece
														
 
															+  task_mode: binary
														
 
															+  params:
														
 
															+    include_background: true
														
 
															+    lambda_dice: 0.7
														
 
															+    lambda_ce: 0.3
														
 
															+
														
 
															+validation:
														
 
															+  enabled: true
														
 
															+  interval: 1
														
 
															+  threshold: 0.5
														
 
															+  early_stopping: true
														
 
															+  early_stopping_patience: 40
														
 
															+  early_stopping_min_delta: 0.0
														
 
															+  metrics:
														
 
															+    task_mode: binary
														
 
															+    metrics:
														
 
															+      - name: dice
														
 
															+      - name: iou
														
 
															+
														
 
															+dataset:
														
 
															+  dataset_name: BUSI
														
 
															+  root: data/BUSI
														
 
															+  split: train
														
 
															+  val_split: val
														
 
															+  image_size: [256, 256]
														
 
															+  in_channels: 3
														
 
															+  num_classes: 1
														
 
															+
														
 
															+model:
														
 
															+  model_name: swinv2_tiny_patch4_window8_256
														
 
															+  load_weights: false
														
 
															+  decoder_channels: [384, 192, 96, 96]
														
 
															+  use_multiscale_features: true
														
 
															+  include_patch_embed: true
														
 
															+
														
 
															+optimizer:
														
 
															+  name: adamw
														
 
															+  lr: 1.0e-4
														
 
															+  weight_decay: 0.05
														
 
															+
														
 
															+scheduler:
														
 
															+  name: cosine
														
 
															+  warmup:
														
 
															+    name: linear
														
 
															+    params:
														
 
															+      start_factor: 0.1
														
 
															+      total_iters: 10
														
 
															+  params:
														
 
															+    T_max: 190
														
 
															+    eta_min: 1.0e-6
														
 
															+
														
 
															+augmentation:
														
 
															+  train:
														
 
															+    random_flip: true
														
 
															+    random_rotate_90: true
														
 
															+    random_brightness_contrast: true
														
 
															+    brightness_limit: 0.15
														
 
															+    contrast_limit: 0.15
														
 
															+    random_gaussian_noise: true
														
 
															+    gaussian_noise_std: 0.03
														
 
															+  val: {}
														
 
															+
														
 
															+checkpoint:
														
 
															+  dir: outputs/experiments/supervised/BUSI_ablation
														
 
															+  save: true
														
 
															+  save_last: true
														
 
															+  monitor: dice
														
 
															+  monitor_mode: max
														
 
															+  resume: null
														
 
															+  resume_strict: true
														
 
															+  resume_training: true
														
 
															+
														
 
															+logging:
														
 
															+  log_interval: 10
														
 
															+  print_training_setup: true
														
 
															+  use_swanlab: true
														
 
															+  project: X_SSL_Net
														
 
															+  experiment_name: sup_busi_ablation
														
 
															+  swanlab_mode: null
														
--- a/lib/modules/__init__.py
+++ b/lib/modules/__init__.py
@@ -1,8 +1,7 @@
 
															 from .attentions_2d import CirculantAttention2d, ComplexLinear, WaveletAttentionGlobalBranch2d
														
 
															 from .blocks_2d import WaveletFFTBlock2d, WaveletFFTMRFFIModule2d
														
 
															 from .build_swinv2 import build_swinv2, build_swinv2_auto
														
 
															-from .decoder_2d import BoundaryRefineBlock2d, StructureAwareDecodeBlock2d, StructureAwareDecoder2d
														
 
															-from .fwta_2d import FourierWaveletTokenAggregation
														
 
															+from .decoder_2d import DecodeRefineBlock2d, SegmentationDecodeBlock2d, SegmentationDecoder2d
														
 
															 from .layers_2d import (
														
 
															     BNLinear1d,
														
 
															     Conv2dBN,
														
@@ -13,8 +12,8 @@ from .layers_2d import (
 
															     Residual,
														
 
															     Scale,
														
 
															 )
														
 
															-from .segmentation_2d import GlobalTokenConditioning2d, SegmentationNet2d
														
 
															-from .swinv2_fwta_encoder_2d import SwinV2FWTAEncoder2d
														
 
															+from .segmentation_2d import SegmentationModel2d
														
 
															+from .swinv2_encoder_2d import SwinV2Encoder2d
														
 
															 __all__ = [
														
 
															     "CirculantAttention2d",
														
@@ -24,10 +23,9 @@ __all__ = [
 
															     "WaveletFFTMRFFIModule2d",
														
 
															     "build_swinv2",
														
 
															     "build_swinv2_auto",
														
 
															-    "BoundaryRefineBlock2d",
														
 
															-    "StructureAwareDecodeBlock2d",
														
 
															-    "StructureAwareDecoder2d",
														
 
															-    "FourierWaveletTokenAggregation",
														
 
															+    "DecodeRefineBlock2d",
														
 
															+    "SegmentationDecodeBlock2d",
														
 
															+    "SegmentationDecoder2d",
														
 
															     "BNLinear1d",
														
 
															     "Conv2dBN",
														
 
															     "DWConv2dBNReLU",
														
@@ -36,7 +34,6 @@ __all__ = [
 
															     "PatchMerging2d",
														
 
															     "Residual",
														
 
															     "Scale",
														
 
															-    "GlobalTokenConditioning2d",
														
 
															-    "SegmentationNet2d",
														
 
															-    "SwinV2FWTAEncoder2d",
														
 
															+    "SegmentationModel2d",
														
 
															+    "SwinV2Encoder2d",
														
 
															 ]
														
--- a/lib/modules/decoder_2d.py
+++ b/lib/modules/decoder_2d.py
@@ -9,9 +9,9 @@ import torch.nn.functional as F
 
															 from .layers_2d import Conv2dBN
														
 
															-class BoundaryRefineBlock2d(nn.Module):
														
 
															+class DecodeRefineBlock2d(nn.Module):
														
 
															     """
														
 
															-    使用边界提示和稳定性图对解码特征做轻量细化。
														
 
															+    对解码后的融合特征做轻量残差细化。
														
 
															     """
														
 
															     def __init__(self, channels: int) -> None:
														
@@ -22,32 +22,13 @@ class BoundaryRefineBlock2d(nn.Module):
 
															             Conv2dBN(channels, channels, 3, 1, 1),
														
 
															         )
														
 
															-    def forward(
														
 
															-            self,
														
 
															-            x: torch.Tensor,
														
 
															-            boundary_hint: torch.Tensor | None = None,
														
 
															-            stability_map: torch.Tensor | None = None,
														
 
															-    ) -> torch.Tensor:
														
 
															-        modulator = 1.0
														
 
															-
														
 
															-        if stability_map is not None:
														
 
															-            stability_map = F.interpolate(
														
 
															-                stability_map, size=x.shape[-2:], mode="bilinear", align_corners=False
														
 
															-            )
														
 
															-            modulator = modulator + stability_map
														
 
															-
														
 
															-        if boundary_hint is not None:
														
 
															-            boundary_hint = F.interpolate(
														
 
															-                boundary_hint, size=x.shape[-2:], mode="bilinear", align_corners=False
														
 
															-            )
														
 
															-            modulator = modulator + boundary_hint
														
 
															-
														
 
															-        return x + self.refine(x * modulator)
														
 
															+    def forward(self, x: torch.Tensor) -> torch.Tensor:
														
 
															+        return x + self.refine(x)
														
 
															-class StructureAwareDecodeBlock2d(nn.Module):
														
 
															+class SegmentationDecodeBlock2d(nn.Module):
														
 
															     """
														
 
															-    单层结构感知解码块。
														
 
															+    单层解码块：上采样高层特征，与 skip 特征融合后细化。
														
 
															     """
														
 
															     def __init__(self, in_channels: int, skip_channels: int, out_channels: int) -> None:
														
@@ -66,31 +47,28 @@ class StructureAwareDecodeBlock2d(nn.Module):
 
															             Conv2dBN(out_channels, out_channels, 3, 1, 1),
														
 
															             nn.ReLU(inplace=True),
														
 
															         )
														
 
															-        self.refine = BoundaryRefineBlock2d(out_channels)
														
 
															+        self.refine = DecodeRefineBlock2d(out_channels)
														
 
															-    def forward(
														
 
															-            self,
														
 
															-            x: torch.Tensor,
														
 
															-            skip: torch.Tensor,
														
 
															-            stability_map: torch.Tensor | None = None,
														
 
															-            boundary_hint: torch.Tensor | None = None,
														
 
															-    ) -> torch.Tensor:
														
 
															+    def forward(self, x: torch.Tensor, skip: torch.Tensor) -> torch.Tensor:
														
 
															         x = F.interpolate(x, size=skip.shape[-2:], mode="bilinear", align_corners=False)
														
 
															         x = self.high_proj(x)
														
 
															         skip = self.skip_proj(skip)
														
 
															         x = self.fuse(torch.cat([x, skip], dim=1))
														
 
															-        x = self.refine(x, boundary_hint=boundary_hint, stability_map=stability_map)
														
 
															-        return x
														
 
															+        return self.refine(x)
														
 
															-class StructureAwareDecoder2d(nn.Module):
														
 
															+class SegmentationDecoder2d(nn.Module):
														
 
															     """
														
 
															-    第一版结构感知解码器骨架。
														
 
															+    纯净的多尺度解码器骨架。
														
 
															     输入特征默认按从浅到深排列，最后一个特征视为最深层输入。
														
 
															     """
														
 
															-    def __init__(self, encoder_channels: Sequence[int], decoder_channels: Sequence[int] | None = None) -> None:
														
 
															+    def __init__(
														
 
															+            self,
														
 
															+            encoder_channels: Sequence[int],
														
 
															+            decoder_channels: Sequence[int] | None = None,
														
 
															+    ) -> None:
														
 
															         super().__init__()
														
 
															         if len(encoder_channels) < 2:
														
 
															             raise ValueError("encoder_channels must contain at least two stages.")
														
@@ -107,17 +85,12 @@ class StructureAwareDecoder2d(nn.Module):
 
															         blocks = []
														
 
															         for skip_ch, out_ch in zip(skip_channels, decoder_channels):
														
 
															-            blocks.append(StructureAwareDecodeBlock2d(in_channels, skip_ch, out_ch))
														
 
															+            blocks.append(SegmentationDecodeBlock2d(in_channels, skip_ch, out_ch))
														
 
															             in_channels = out_ch
														
 
															         self.blocks = nn.ModuleList(blocks)
														
 
															         self.out_channels = in_channels
														
 
															-    def forward(
														
 
															-            self,
														
 
															-            features: Sequence[torch.Tensor],
														
 
															-            stability_map: torch.Tensor | None = None,
														
 
															-            boundary_hints: Sequence[torch.Tensor] | None = None,
														
 
															-    ) -> tuple[torch.Tensor, list[torch.Tensor]]:
														
 
															+    def forward(self, features: Sequence[torch.Tensor]) -> tuple[torch.Tensor, list[torch.Tensor]]:
														
 
															         if len(features) != len(self.encoder_channels):
														
 
															             raise ValueError(
														
 
															                 f"feature count mismatch: got {len(features)}, expected {len(self.encoder_channels)}"
														
@@ -127,13 +100,8 @@ class StructureAwareDecoder2d(nn.Module):
 
															         skips = list(reversed(features[:-1]))
														
 
															         decoder_features = []
														
 
															-        if boundary_hints is None:
														
 
															-            boundary_hints = [None] * len(self.blocks)
														
 
															-        elif len(boundary_hints) != len(self.blocks):
														
 
															-            raise ValueError("boundary_hints length must match decoder depth.")
														
 
															-
														
 
															-        for block, skip, boundary_hint in zip(self.blocks, skips, boundary_hints):
														
 
															-            x = block(x, skip, stability_map=stability_map, boundary_hint=boundary_hint)
														
 
															+        for block, skip in zip(self.blocks, skips):
														
 
															+            x = block(x, skip)
														
 
															             decoder_features.append(x)
														
 
															         return x, decoder_features
														
--- a/lib/modules/segmentation_2d.py
+++ b/lib/modules/segmentation_2d.py
@@ -8,9 +8,9 @@ import torch
 
															 import torch.nn as nn
														
 
															 import torch.nn.functional as F
														
 
															-from .decoder_2d import StructureAwareDecoder2d
														
 
															+from .decoder_2d import SegmentationDecoder2d
														
 
															 from .layers_2d import Conv2dBN
														
 
															-from .swinv2_fwta_encoder_2d import SwinV2FWTAEncoder2d
														
 
															+from .swinv2_encoder_2d import SwinV2Encoder2d
														
 
															 class SegmentationHead2d(nn.Module):
														
@@ -27,49 +27,9 @@ class SegmentationHead2d(nn.Module):
 
															         return F.interpolate(x, size=output_size, mode="bilinear", align_corners=False)
														
 
															-class BoundaryHead2d(nn.Module):
														
 
															-    def __init__(self, in_channels: int, out_channels: int = 1) -> None:
														
 
															-        super().__init__()
														
 
															-        self.block = nn.Sequential(
														
 
															-            Conv2dBN(in_channels, in_channels, 3, 1, 1),
														
 
															-            nn.ReLU(inplace=True),
														
 
															-            nn.Conv2d(in_channels, out_channels, kernel_size=1, bias=True),
														
 
															-        )
														
 
															-
														
 
															-    def forward(self, x: torch.Tensor, output_size: tuple[int, int]) -> torch.Tensor:
														
 
															-        x = self.block(x)
														
 
															-        return F.interpolate(x, size=output_size, mode="bilinear", align_corners=False)
														
 
															-
														
 
															-
														
 
															-class GlobalTokenConditioning2d(nn.Module):
														
 
															-    """
														
 
															-    使用 FWTA 更新后的全局前景 token 对解码特征做通道调制。
														
 
															+class SegmentationModel2d(nn.Module):
														
 
															     """
														
 
															-
														
 
															-    def __init__(self, token_channels: int, feature_channels: int) -> None:
														
 
															-        super().__init__()
														
 
															-        hidden_channels = max(feature_channels // 2, 32)
														
 
															-        self.gate = nn.Sequential(
														
 
															-            nn.LayerNorm(token_channels),
														
 
															-            nn.Linear(token_channels, hidden_channels),
														
 
															-            nn.GELU(),
														
 
															-            nn.Linear(hidden_channels, feature_channels),
														
 
															-            nn.Sigmoid(),
														
 
															-        )
														
 
															-
														
 
															-    def forward(self, x: torch.Tensor, global_token: torch.Tensor) -> tuple[torch.Tensor, torch.Tensor]:
														
 
															-        channel_gate = self.gate(global_token).unsqueeze(-1).unsqueeze(-1)
														
 
															-        return x * (1.0 + channel_gate), channel_gate
														
 
															-
														
 
															-
														
 
															-class SegmentationNet2d(nn.Module):
														
 
															-    """
														
 
															-    第一版超声分割主网络骨架。
														
 
															-
														
 
															-    当前职责：
														
 
															-    - 编码器输出多尺度特征和稳定性图
														
 
															-    - 结构感知解码器恢复分割特征
														
 
															-    - 同时输出分割图和边界图
														
 
															+    简化后的超声分割网络。
														
 
															     """
														
 
															     def __init__(
														
@@ -85,7 +45,7 @@ class SegmentationNet2d(nn.Module):
 
															             **encoder_kwargs: Any,
														
 
															     ) -> None:
														
 
															         super().__init__()
														
 
															-        self.encoder = SwinV2FWTAEncoder2d(
														
 
															+        self.encoder = SwinV2Encoder2d(
														
 
															             model_name=model_name,
														
 
															             config_path=config_path,
														
 
															             weight_path=weight_path,
														
@@ -93,46 +53,16 @@ class SegmentationNet2d(nn.Module):
 
															             load_weights=load_weights,
														
 
															             **encoder_kwargs,
														
 
															         )
														
 
															-        self.decoder = StructureAwareDecoder2d(
														
 
															+        self.decoder = SegmentationDecoder2d(
														
 
															             encoder_channels=self.encoder.stage_channels,
														
 
															             decoder_channels=decoder_channels,
														
 
															         )
														
 
															-        self.global_conditioning = GlobalTokenConditioning2d(
														
 
															-            token_channels=self.encoder.stage_channels[-1],
														
 
															-            feature_channels=self.decoder.out_channels,
														
 
															-        )
														
 
															         self.segmentation_head = SegmentationHead2d(self.decoder.out_channels, num_classes)
														
 
															-        self.boundary_head = BoundaryHead2d(self.decoder.out_channels, out_channels=1)
														
 
															-
														
 
															-    def forward(self, x: torch.Tensor) -> dict[str, torch.Tensor | list[torch.Tensor]]:
														
 
															-        encoder_outputs = self.encoder(x)
														
 
															-        features = encoder_outputs["features"]
														
 
															-        stability_map = encoder_outputs["stability_map"]
														
 
															-        decoder_out, decoder_features = self.decoder(
														
 
															-            features=features,
														
 
															-            stability_map=stability_map,
														
 
															-        )
														
 
															-        conditioned_decoder_out, global_channel_gate = self.global_conditioning(
														
 
															-            decoder_out,
														
 
															-            encoder_outputs["global_token"],
														
 
															-        )
														
 
															+    def forward(self, x: torch.Tensor) -> dict[str, torch.Tensor]:
														
 
															+        features = self.encoder(x)["features"]
														
 
															+        decoder_out, _ = self.decoder(features)
														
 
															         output_size = x.shape[-2:]
														
 
															-        seg_logits = self.segmentation_head(conditioned_decoder_out, output_size=output_size)
														
 
															-        boundary_logits = self.boundary_head(conditioned_decoder_out, output_size=output_size)
														
 
															-
														
 
															-        return {
														
 
															-            "seg_logits": seg_logits,
														
 
															-            "boundary_logits": boundary_logits,
														
 
															-            "stability_map": F.interpolate(
														
 
															-                stability_map, size=output_size, mode="bilinear", align_corners=False
														
 
															-            ),
														
 
															-            "encoder_features": features,
														
 
															-            "decoder_features": decoder_features,
														
 
															-            "conditioned_decoder_feature": conditioned_decoder_out,
														
 
															-            "deepest_feature": encoder_outputs["deepest_feature"],
														
 
															-            "global_token": encoder_outputs["global_token"],
														
 
															-            "global_channel_gate": global_channel_gate,
														
 
															-            "token_gate": encoder_outputs["token_gate"],
														
 
															-        }
														
 
															+        seg_logits = self.segmentation_head(decoder_out, output_size=output_size)
														
 
															+        return {"seg_logits": seg_logits}
														
--- a/lib/tools/__init__.py
+++ b/lib/tools/__init__.py
@@ -1,6 +1,4 @@
 
															-from .boundary import boundary_band_map, logits_to_boundary, logits_to_binary_mask, mask_to_boundary_map
														
 
															 from .loss import DEFAULT_TASK_LOSS, LOSS_REGISTRY, build_loss
														
 
															-from .loss import BinaryBoundaryLoss, MaskBoundaryConsistencyLoss
														
 
															 from .metrics import (
														
 
															     DEFAULT_METRIC_CONFIG,
														
 
															     METRIC_REGISTRY,
														
@@ -28,13 +26,7 @@ __all__ = [
 
															     "METRIC_REGISTRY",
														
 
															     "OPTIMIZER_REGISTRY",
														
 
															     "SCHEDULER_REGISTRY",
														
 
															-    "mask_to_boundary_map",
														
 
															-    "logits_to_binary_mask",
														
 
															-    "logits_to_boundary",
														
 
															-    "boundary_band_map",
														
 
															     "build_loss",
														
 
															-    "BinaryBoundaryLoss",
														
 
															-    "MaskBoundaryConsistencyLoss",
														
 
															     "build_metric",
														
 
															     "build_metrics",
														
 
															     "compute_metrics",
														
--- a/lib/trainers/supervised.py
+++ b/lib/trainers/supervised.py
@@ -6,53 +6,46 @@ from typing import Any
 
															 import torch
														
 
															 from torch.utils.data import DataLoader
														
 
															-from lib.modules import SegmentationNet2d
														
 
															-from lib.tools import (
														
 
															-    BinaryBoundaryLoss,
														
 
															-    MaskBoundaryConsistencyLoss,
														
 
															-    build_optimizer,
														
 
															-    build_scheduler,
														
 
															-    mask_to_boundary_map,
														
 
															-)
														
 
															+from lib.modules import SegmentationModel2d
														
 
															+from lib.tools import build_loss, build_optimizer, build_scheduler
														
 
															 from .base import BaseTrainer
														
 
															 class SupervisedSegmentationTrainer(BaseTrainer):
														
 
															     def __init__(self, cfg: dict[str, Any], args: Any | None = None) -> None:
														
 
															         super().__init__(cfg=cfg, args=args)
														
 
															-        self.model: SegmentationNet2d | None = None
														
 
															+        self.model: SegmentationModel2d | None = None
														
 
															         self.optimizer = None
														
 
															         self.scheduler = None
														
 
															         self.loader: DataLoader | None = None
														
 
															         self.val_loader: DataLoader | None = None
														
 
															         self.seg_loss = None
														
 
															-        self.boundary_loss = BinaryBoundaryLoss()
														
 
															-        self.consistency_loss = MaskBoundaryConsistencyLoss()
														
 
															     def build(self) -> None:
														
 
															         dataset_cfg = self.cfg["dataset"]
														
 
															         model_cfg = self.cfg["model"]
														
 
															         train_cfg = self.cfg["train"]
														
 
															-        self.model = SegmentationNet2d(
														
 
															+        self.model = SegmentationModel2d(
														
 
															             num_classes=dataset_cfg["num_classes"],
														
 
															             model_name=model_cfg["model_name"],
														
 
															             load_weights=model_cfg.get("load_weights", False),
														
 
															             decoder_channels=model_cfg.get("decoder_channels"),
														
 
															-            fwta_wavelet=model_cfg.get("fwta_wavelet", "haar"),
														
 
															-            fwta_level=model_cfg.get("fwta_level", 1),
														
 
															-            fwta_sigma_ratio=model_cfg.get("fwta_sigma_ratio", 0.35),
														
 
															-            fwta_tau_fourier=model_cfg.get("fwta_tau_fourier", 0.15),
														
 
															-            fwta_gate_temperature=model_cfg.get("fwta_gate_temperature", 1.0),
														
 
															+            use_multiscale_features=model_cfg.get("use_multiscale_features", True),
														
 
															+            include_patch_embed=model_cfg.get("include_patch_embed", True),
														
 
															         ).to(self.device)
														
 
															         self.optimizer = build_optimizer(self.model, self.cfg["optimizer"])
														
 
															         self.scheduler = build_scheduler(self.optimizer, self.cfg.get("scheduler"))
														
 
															+        loss_cfg = self.cfg.get("loss")
														
 
															+        if loss_cfg is not None:
														
 
															+            self.seg_loss = build_loss(loss_cfg)
														
 
															         self.loader = self._build_segmentation_loader(
														
 
															             split=str(dataset_cfg.get("split", "train")),
														
 
															             split_file=dataset_cfg.get("split_file"),
														
 
															             batch_size=self._resolve_batch_size("batch_size", 4),
														
 
															             shuffle=bool(train_cfg.get("shuffle", True)),
														
 
															+            augmentation_config=self.cfg.get("augmentation", {}).get("train"),
														
 
															         )
														
 
															         self.val_loader = self._build_val_loader(
														
 
															             batch_size=self._resolve_batch_size(
														
@@ -78,19 +71,17 @@ class SupervisedSegmentationTrainer(BaseTrainer):
 
															         with torch.autocast(device_type=self.device.type, enabled=self._amp_enabled()):
														
 
															             outputs = self.model(image)
														
 
															             seg_logits = outputs["seg_logits"]
														
 
															-            boundary_logits = outputs["boundary_logits"]
														
 
															-            seg_loss = torch.nn.functional.binary_cross_entropy_with_logits(seg_logits, mask)
														
 
															-            boundary_target = mask_to_boundary_map(mask)
														
 
															-            boundary_loss = self.boundary_loss(boundary_logits, boundary_target)
														
 
															-            consistency_loss = self.consistency_loss(seg_logits, boundary_logits)
														
 
															-            total_loss = seg_loss + boundary_loss + 0.1 * consistency_loss
														
 
															+            if self.seg_loss is None:
														
 
															+                seg_loss = torch.nn.functional.binary_cross_entropy_with_logits(seg_logits, mask)
														
 
															+            else:
														
 
															+                seg_loss = self.seg_loss(seg_logits, mask)
														
 
															+
														
 
															+            total_loss = seg_loss
														
 
															         losses = {
														
 
															             "total": total_loss,
														
 
															             "seg": seg_loss,
														
 
															-            "boundary": boundary_loss,
														
 
															-            "consistency": consistency_loss,
														
 
															         }
														
 
															         return outputs, losses
														
@@ -106,8 +97,6 @@ class SupervisedSegmentationTrainer(BaseTrainer):
 
															         metrics = self._build_validation_metrics()
														
 
															         total = 0.0
														
 
															         seg = 0.0
														
 
															-        boundary = 0.0
														
 
															-        consistency = 0.0
														
 
															         steps = 0
														
 
															         with torch.no_grad():
														
 
															             for batch in self.val_loader:
														
@@ -116,8 +105,6 @@ class SupervisedSegmentationTrainer(BaseTrainer):
 
															                 outputs, losses = self._compute_losses(image, mask)
														
 
															                 total += float(losses["total"].detach().cpu())
														
 
															                 seg += float(losses["seg"].detach().cpu())
														
 
															-                boundary += float(losses["boundary"].detach().cpu())
														
 
															-                consistency += float(losses["consistency"].detach().cpu())
														
 
															                 self._update_validation_metrics(
														
 
															                     metrics,
														
 
															                     logits=outputs["seg_logits"],
														
@@ -130,8 +117,6 @@ class SupervisedSegmentationTrainer(BaseTrainer):
 
															         val_metrics = {
														
 
															             "total": total / steps,
														
 
															             "seg": seg / steps,
														
 
															-            "boundary": boundary / steps,
														
 
															-            "consistency": consistency / steps,
														
 
															         }
														
 
															         val_metrics.update(self._compute_validation_metric_values(metrics))
														
 
															         return val_metrics
														
@@ -141,6 +126,7 @@ class SupervisedSegmentationTrainer(BaseTrainer):
 
															             raise RuntimeError("Trainer.build() must be called before train().")
														
 
															         epochs = int(self.cfg["train"].get("epochs", 1))
														
 
															+        accum_steps = self._accum_steps()
														
 
															         try:
														
 
															             self._print_training_setup(
														
 
															                 model_map={"model": self.model},
														
@@ -150,11 +136,10 @@ class SupervisedSegmentationTrainer(BaseTrainer):
 
															             )
														
 
															             for epoch in range(self.start_epoch, epochs):
														
 
															                 self.model.train()
														
 
															+                self.optimizer.zero_grad()
														
 
															                 train_metric_sums = {
														
 
															                     "total": 0.0,
														
 
															                     "seg": 0.0,
														
 
															-                    "boundary": 0.0,
														
 
															-                    "consistency": 0.0,
														
 
															                 }
														
 
															                 train_metrics: dict[str, float] | None = None
														
 
															                 end_time = time.perf_counter()
														
@@ -165,14 +150,17 @@ class SupervisedSegmentationTrainer(BaseTrainer):
 
															                     image = batch["image"].to(self.device)
														
 
															                     mask = batch["mask"].to(self.device)
														
 
															                     _, losses = self._compute_losses(image, mask)
														
 
															-                    self.optimizer.zero_grad()
														
 
															-                    self.grad_scaler.scale(losses["total"]).backward()
														
 
															+                    scaled_total_loss = losses["total"] / accum_steps
														
 
															+                    self.grad_scaler.scale(scaled_total_loss).backward()
														
 
															                     grad_norm = None
														
 
															-                    if self._grad_clip_enabled():
														
 
															-                        self.grad_scaler.unscale_(self.optimizer)
														
 
															-                        grad_norm = self._clip_gradients(self.model)
														
 
															-                    self.grad_scaler.step(self.optimizer)
														
 
															-                    self.grad_scaler.update()
														
 
															+                    should_step = (step % accum_steps == 0) or (step == num_steps)
														
 
															+                    if should_step:
														
 
															+                        if self._grad_clip_enabled():
														
 
															+                            self.grad_scaler.unscale_(self.optimizer)
														
 
															+                            grad_norm = self._clip_gradients(self.model)
														
 
															+                        self.grad_scaler.step(self.optimizer)
														
 
															+                        self.grad_scaler.update()
														
 
															+                        self.optimizer.zero_grad()
														
 
															                     train_metrics = self._detach_metrics(losses)
														
 
															                     if grad_norm is not None:
														
 
															                         train_metrics["grad_norm"] = grad_norm
														
--- a/tmp/docs/training/当前项目详解与纯文本架构流程图.md
+++ b/tmp/docs/training/当前项目详解与纯文本架构流程图.md
@@ -0,0 +1,822 @@
 
															+# 当前项目详解与纯文本架构流程图
														
 
															+
														
 
															+## 1. 当前项目定位
														
 
															+
														
 
															+当前项目的现役主路径已经收缩为一个纯净的超声分割全监督基线。
														
 
															+
														
 
															+现在真实生效的模型与训练链路只有一条：
														
 
															+
														
 
															+`输入图像 -> 纯 SwinV2 编码器 -> 纯分割解码器 -> 分割头 -> seg_logits -> 分割损失`
														
 
															+
														
 
															+当前主路径已经满足以下要求：
														
 
															+
														
 
															+1. 不调用 FWTA
														
 
															+2. 不调用 FWTA 编码器
														
 
															+3. 不存在边界分支
														
 
															+4. 不存在边界损失
														
 
															+5. 不存在一致性损失
														
 
															+6. 配置文件中不再使用 `aux_loss`
														
 
															+7. 实验脚本中不再做边界相关消融
														
 
															+
														
 
															+这份文档只描述当前真实主链，不再记录历史结构语义。
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 2. 当前项目一句话概述
														
 
															+
														
 
															+`X_SSL_Net` 当前可以理解为：
														
 
															+
														
 
															+`一个面向超声图像分割的纯单头 2D segmentation baseline，主干为 SwinV2 encoder + segmentation decoder。`
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 3. 当前主链总览
														
 
															+
														
 
															+### 3.1 当前训练入口
														
 
															+
														
 
															+训练统一从下面这个入口启动：
														
 
															+
														
 
															+`tools/train.py`
														
 
															+
														
 
															+它负责：
														
 
															+
														
 
															+1. 读取 YAML 配置
														
 
															+2. 接收命令行 `--set` 覆盖参数
														
 
															+3. 构建 trainer
														
 
															+4. 调用 `trainer.train()`
														
 
															+
														
 
															+### 3.2 当前 trainer
														
 
															+
														
 
															+当前正式 trainer 仍然叫：
														
 
															+
														
 
															+`SupervisedSegmentationTrainer`
														
 
															+
														
 
															+但它现在已经只做纯分割训练，不再处理任何边界辅助分支。
														
 
															+
														
 
															+### 3.3 当前模型
														
 
															+
														
 
															+当前现役模型是：
														
 
															+
														
 
															+`SegmentationModel2d`
														
 
															+
														
 
															+它的内部结构为：
														
 
															+
														
 
															+1. `SwinV2Encoder2d`
														
 
															+2. `SegmentationDecoder2d`
														
 
															+3. `SegmentationHead2d`
														
 
															+
														
 
															+最终只输出：
														
 
															+
														
 
															+1. `seg_logits`
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 4. 目录职责总览
														
 
															+
														
 
															+```text
														
 
															+X_SSL_Net/
														
 
															+|
														
 
															+|-- tools/
														
 
															+|   |-- train.py
														
 
															+|   |-- run_us_experiments.sh
														
 
															+|   `-- summarize_results.py
														
 
															+|
														
 
															+|-- configs/
														
 
															+|   |-- segmentation/
														
 
															+|   `-- swinv2/
														
 
															+|
														
 
															+|-- lib/
														
 
															+|   |-- trainers/
														
 
															+|   |-- modules/
														
 
															+|   |-- data/
														
 
															+|   `-- tools/
														
 
															+|
														
 
															+`-- tmp/docs/training/
														
 
															+```
														
 
															+
														
 
															+### 4.1 `tools/`
														
 
															+
														
 
															+1. `tools/train.py`
														
 
															+   统一训练启动入口
														
 
															+2. `tools/run_us_experiments.sh`
														
 
															+   纯分割实验脚本
														
 
															+3. `tools/summarize_results.py`
														
 
															+   汇总 `best.pth` 中的实验结果
														
 
															+
														
 
															+### 4.2 `configs/segmentation/`
														
 
															+
														
 
															+1. `train_sup_us_template.yaml`
														
 
															+   当前最核心的纯分割训练模板
														
 
															+2. `us_exp_sup_busi.yaml`
														
 
															+   BUSI 示例配置
														
 
															+3. `us_exp_sup_busi_ablation.yaml`
														
 
															+   目前内容已与普通纯分割配置对齐，不再承载边界消融语义
														
 
															+
														
 
															+### 4.3 `lib/trainers/`
														
 
															+
														
 
															+1. `builder.py`
														
 
															+   trainer 注册与构建
														
 
															+2. `base.py`
														
 
															+   训练公共底座
														
 
															+3. `supervised.py`
														
 
															+   当前纯分割训练流程实现
														
 
															+
														
 
															+### 4.4 `lib/modules/`
														
 
															+
														
 
															+1. `swinv2_encoder_2d.py`
														
 
															+   纯 SwinV2 编码器封装
														
 
															+2. `decoder_2d.py`
														
 
															+   当前纯分割解码器实现
														
 
															+3. `segmentation_2d.py`
														
 
															+   当前主模型封装
														
 
															+4. `build_swinv2.py`
														
 
															+   SwinV2 backbone 构建器
														
 
															+
														
 
															+### 4.5 `lib/data/`
														
 
															+
														
 
															+1. `builder.py`
														
 
															+   构建样本索引
														
 
															+2. `loaders.py`
														
 
															+   构建 dataset 与 dataloader
														
 
															+3. `datasets.py`
														
 
															+   真正读取 image 和 mask
														
 
															+4. `augment.py`
														
 
															+   数据增强
														
 
															+
														
 
															+### 4.6 `lib/tools/`
														
 
															+
														
 
															+当前主路径真正会用到的核心工具只有：
														
 
															+
														
 
															+1. `loss.py`
														
 
															+   主分割损失构建
														
 
															+2. `metrics.py`
														
 
															+   Dice / IoU 等验证指标
														
 
															+3. `optim.py`
														
 
															+   optimizer 和 scheduler 构建
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 5. 当前纯文本架构图
														
 
															+
														
 
															+### 5.1 训练系统总架构图
														
 
															+
														
 
															+```text
														
 
															++----------------------------------------------------------------------------------+
														
 
															+|                              当前纯分割训练系统                                  |
														
 
															++----------------------------------------------------------------------------------+
														
 
															+|                                                                                  |
														
 
															+|  tools/train.py                                                                  |
														
 
															+|      |                                                                           |
														
 
															+|      v                                                                           |
														
 
															+|  读取 YAML 配置 + 应用 --set 覆盖                                                |
														
 
															+|      |                                                                           |
														
 
															+|      v                                                                           |
														
 
															+|  build_trainer(cfg)                                                              |
														
 
															+|      |                                                                           |
														
 
															+|      v                                                                           |
														
 
															+|  SupervisedSegmentationTrainer                                                   |
														
 
															+|      |                                                                           |
														
 
															+|      +------------------- build() -------------------+                           |
														
 
															+|      |                                               |                           |
														
 
															+|      v                                               v                           |
														
 
															+|  build_dataloader()                            SegmentationModel2d               |
														
 
															+|      |                                               |                           |
														
 
															+|      v                                               v                           |
														
 
															+|  SegmentationRecordDataset                     SwinV2Encoder2d                   |
														
 
															+|      |                                               |                           |
														
 
															+|      v                                               v                           |
														
 
															+|  image, mask batch                            multi-scale features               |
														
 
															+|                                                        |                         |
														
 
															+|                                                        v                         |
														
 
															+|                                              SegmentationDecoder2d              |
														
 
															+|                                                        |                         |
														
 
															+|                                                        v                         |
														
 
															+|                                                decoded feature                   |
														
 
															+|                                                        |                         |
														
 
															+|                                                        v                         |
														
 
															+|                                                SegmentationHead2d                |
														
 
															+|                                                        |                         |
														
 
															+|                                                        v                         |
														
 
															+|                                                     seg_logits                   |
														
 
															+|                                                        |                         |
														
 
															+|                                                        v                         |
														
 
															+|                                                     seg_loss                     |
														
 
															+|                                                        |                         |
														
 
															+|                                                        v                         |
														
 
															+|                                            backward + optimizer.step()           |
														
 
															+|                                                        |                         |
														
 
															+|                                                        v                         |
														
 
															+|                                          validation / metric / checkpoint        |
														
 
															+|                                                                                  |
														
 
															++----------------------------------------------------------------------------------+
														
 
															+```
														
 
															+
														
 
															+### 5.2 模型内部结构图
														
 
															+
														
 
															+```text
														
 
															+Input Image [B, 3, H, W]
														
 
															+    |
														
 
															+    v
														
 
															+SwinV2Encoder2d
														
 
															+    |
														
 
															+    +-- feature_0  (可选 patch_embed 特征)
														
 
															+    +-- feature_1
														
 
															+    +-- feature_2
														
 
															+    +-- feature_3
														
 
															+    `-- feature_4
														
 
															+            |
														
 
															+            v
														
 
															+SegmentationDecoder2d
														
 
															+    |
														
 
															+    +-- Decode Block 1: deepest + skip_3
														
 
															+    +-- Decode Block 2: upsample + skip_2
														
 
															+    +-- Decode Block 3: upsample + skip_1
														
 
															+    `-- Decode Block 4: upsample + skip_0
														
 
															+            |
														
 
															+            v
														
 
															+decoded feature
														
 
															+    |
														
 
															+    v
														
 
															+SegmentationHead2d
														
 
															+    |
														
 
															+    v
														
 
															+seg_logits
														
 
															+    |
														
 
															+    v
														
 
															+上采样回输入分辨率
														
 
															+```
														
 
															+
														
 
															+### 5.3 数据系统结构图
														
 
															+
														
 
															+```text
														
 
															+dataset.root
														
 
															+    |
														
 
															+    v
														
 
															+build_dataset_index(dataset_name, root)
														
 
															+    |
														
 
															+    v
														
 
															+apply split
														
 
															+    |
														
 
															+    v
														
 
															+SegmentationRecordDataset
														
 
															+    |
														
 
															+    +-- 读取 image
														
 
															+    +-- 读取 mask
														
 
															+    +-- 应用 augmentation
														
 
															+    +-- resize image/mask
														
 
															+    |
														
 
															+    v
														
 
															+DataLoader
														
 
															+    |
														
 
															+    v
														
 
															+batch = {
														
 
															+    image,
														
 
															+    mask,
														
 
															+    dataset_name,
														
 
															+    sample_id,
														
 
															+    split,
														
 
															+    class_name,
														
 
															+    meta
														
 
															+}
														
 
															+```
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 6. 当前纯文本流程图
														
 
															+
														
 
															+### 6.1 启动流程图
														
 
															+
														
 
															+```text
														
 
															+[开始]
														
 
															+   |
														
 
															+   v
														
 
															+执行 tools/train.py --config xxx.yaml --set key=value ...
														
 
															+   |
														
 
															+   v
														
 
															+parse_args()
														
 
															+   |
														
 
															+   v
														
 
															+load_yaml_config()
														
 
															+   |
														
 
															+   v
														
 
															+apply_dotlist_overrides()
														
 
															+   |
														
 
															+   v
														
 
															+build_trainer(cfg)
														
 
															+   |
														
 
															+   v
														
 
															+trainer.build()
														
 
															+   |
														
 
															+   +--> 构建 model
														
 
															+   +--> 构建 optimizer
														
 
															+   +--> 构建 scheduler 与 seg_loss（配置了 loss 时通过 build_loss 构建）
														
 
															+   +--> 构建 train loader
														
 
															+   +--> 构建 val loader
														
 
															+   +--> 恢复 checkpoint（如配置）
														
 
															+   `--> 初始化 SwanLab（如启用）
														
 
															+   |
														
 
															+   v
														
 
															+trainer.train()
														
 
															+   |
														
 
															+   v
														
 
															+[进入 epoch 循环]
														
 
															+```
														
 
															+
														
 
															+### 6.2 单个 epoch 流程图
														
 
															+
														
 
															+```text
														
 
															+[epoch 开始]
														
 
															+   |
														
 
															+   v
														
 
															+model.train()
														
 
															+optimizer.zero_grad()
														
 
															+   |
														
 
															+   v
														
 
															+for batch in train_loader:
														
 
															+   |
														
 
															+   +--> 取 image, mask
														
 
															+   |
														
 
															+   +--> model(image)
														
 
															+   |      |
														
 
															+   |      `--> seg_logits
														
 
															+   |
														
 
															+   +--> 计算 seg_loss
														
 
															+   |
														
 
															+   +--> total_loss = seg_loss
														
 
															+   |
														
 
															+   +--> (total_loss / accum_steps).backward()
														
 
															+   |
														
 
															+   +--> 如果 step 是 accum_steps 的整数倍，或已是本 epoch 最后一个 step:
														
 
															+   |      |
														
 
															+   |      +--> 可选 gradient clipping
														
 
															+   |      +--> optimizer.step()
														
 
															+   |      +--> scaler.update()
														
 
															+   |      `--> optimizer.zero_grad()
														
 
															+   |
														
 
															+   `--> 记录 step 日志
														
 
															+   |
														
 
															+   v
														
 
															+epoch 结束后 scheduler.step()
														
 
															+   |
														
 
															+   v
														
 
															+如果需要验证:
														
 
															+   |
														
 
															+   +--> model.eval()
														
 
															+   +--> 遍历 val_loader
														
 
															+   +--> 统计 val loss
														
 
															+   `--> 统计 Dice / IoU
														
 
															+   |
														
 
															+   v
														
 
															+保存 checkpoint
														
 
															+   |
														
 
															+   v
														
 
															+判断 early stopping
														
 
															+```
														
 
															+
														
 
															+### 6.3 单次前向传播流程图
														
 
															+
														
 
															+```text
														
 
															+image
														
 
															+  |
														
 
															+  v
														
 
															+SegmentationModel2d.forward()
														
 
															+  |
														
 
															+  +--> features = encoder(image)["features"]
														
 
															+  |
														
 
															+  +--> decoder_out, _ = decoder(features)
														
 
															+  |
														
 
															+  `--> seg_logits = segmentation_head(decoder_out, output_size=input_size)
														
 
															+           |
														
 
															+           v
														
 
															+return {
														
 
															+  seg_logits
														
 
															+}
														
 
															+```
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 7. 当前模型链路详解
														
 
															+
														
 
															+### 7.1 `SegmentationModel2d`
														
 
															+
														
 
															+文件：`lib/modules/segmentation_2d.py`
														
 
															+
														
 
															+这是当前主模型封装。
														
 
															+
														
 
															+它的职责非常直接：
														
 
															+
														
 
															+1. 调用编码器提取多尺度特征
														
 
															+2. 调用解码器恢复高分辨率分割特征
														
 
															+3. 调用分割头输出 `seg_logits`
														
 
															+
														
 
															+它不再负责：
														
 
															+
														
 
															+1. 边界输出
														
 
															+2. 多分支辅助预测
														
 
															+3. 任何历史先验注入接口
														
 
															+
														
 
															+### 7.2 `SwinV2Encoder2d`
														
 
															+
														
 
															+文件：`lib/modules/swinv2_encoder_2d.py`
														
 
															+
														
 
															+职责：
														
 
															+
														
 
															+1. 构建 SwinV2 backbone
														
 
															+2. 输出多尺度特征列表
														
 
															+3. 支持是否包含 patch embed 特征
														
 
															+4. 支持是否输出多尺度特征
														
 
															+
														
 
															+当前主链只使用它的：
														
 
															+
														
 
															+1. `features`
														
 
															+
														
 
															+### 7.3 `SegmentationDecoder2d`
														
 
															+
														
 
															+文件：`lib/modules/decoder_2d.py`
														
 
															+
														
 
															+这是当前纯分割解码器。
														
 
															+
														
 
															+每层解码块 `SegmentationDecodeBlock2d` 的工作方式是：
														
 
															+
														
 
															+1. 对高层特征上采样
														
 
															+2. 对 skip 特征做通道映射
														
 
															+3. 拼接后卷积融合
														
 
															+4. 用 `DecodeRefineBlock2d` 做轻量残差细化
														
 
															+
														
 
															+当前已经没有：
														
 
															+
														
 
															+1. FWTA 注入接口
														
 
															+2. stability prior
														
 
															+3. saliency prior
														
 
															+4. boundary hint
														
 
															+
														
 
															+### 7.4 `SegmentationHead2d`
														
 
															+
														
 
															+文件：`lib/modules/segmentation_2d.py`
														
 
															+
														
 
															+职责：
														
 
															+
														
 
															+1. 接收解码器输出特征
														
 
															+2. 经过卷积块生成分割 logits
														
 
															+3. 上采样到输入分辨率
														
 
															+
														
 
															+最终输出：
														
 
															+
														
 
															+1. `seg_logits`
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 8. 当前训练器链路详解
														
 
															+
														
 
															+### 8.1 `SupervisedSegmentationTrainer`
														
 
															+
														
 
															+文件：`lib/trainers/supervised.py`
														
 
															+
														
 
															+虽然类名仍然是 `SupervisedSegmentationTrainer`，但当前实现已经是纯单头分割训练，不再包含边界分支、边界损失和一致性损失。
														
 
															+
														
 
															+### 8.2 `build()`
														
 
															+
														
 
															+`build()` 当前做的事：
														
 
															+
														
 
															+1. 构建 `SegmentationModel2d`
														
 
															+2. 构建 optimizer
														
 
															+3. 构建 scheduler
														
 
															+4. 构建主分割 loss
														
 
															+5. 构建 train loader
														
 
															+6. 构建 val loader
														
 
															+7. 恢复 checkpoint
														
 
															+8. 初始化日志系统
														
 
															+
														
 
															+### 8.3 `_compute_losses()`
														
 
															+
														
 
															+当前 loss 计算已经简化为：
														
 
															+
														
 
															+```text
														
 
															+outputs = model(image)
														
 
															+seg_logits = outputs["seg_logits"]
														
 
															+seg_loss = criterion(seg_logits, mask)
														
 
															+total_loss = seg_loss
														
 
															+```
														
 
															+
														
 
															+也就是：
														
 
															+
														
 
															+```text
														
 
															+total_loss = seg_loss
														
 
															+```
														
 
															+
														
 
															+### 8.4 `train()`
														
 
															+
														
 
															+当前训练循环做的事：
														
 
															+
														
 
															+1. 前向得到 `seg_logits`
														
 
															+2. 计算 `seg_loss`
														
 
															+3. backward
														
 
															+4. 可选梯度累计
														
 
															+5. 可选梯度裁剪
														
 
															+6. optimizer step
														
 
															+7. scheduler step
														
 
															+8. 验证集评估
														
 
															+9. checkpoint 与 early stopping
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 9. 当前数据系统详解
														
 
															+
														
 
															+### 9.1 当前输入输出格式
														
 
															+
														
 
															+`SegmentationRecordDataset` 返回：
														
 
															+
														
 
															+1. `image`
														
 
															+2. `mask`
														
 
															+3. `dataset_name`
														
 
															+4. `sample_id`
														
 
															+5. `split`
														
 
															+6. `class_name`
														
 
															+7. `meta`
														
 
															+
														
 
															+### 9.2 当前数据读取流程
														
 
															+
														
 
															+1. 读 RGB 图像，归一化到 `[0, 1]`
														
 
															+2. 读二值分割 mask
														
 
															+3. 对 image 和 mask 做联合增强
														
 
															+4. resize 到配置指定尺寸
														
 
															+5. 送入 DataLoader
														
 
															+
														
 
															+### 9.3 当前支持的数据集
														
 
															+
														
 
															+当前 `lib/data/builder.py` 支持：
														
 
															+
														
 
															+1. `BUS-UCLM`
														
 
															+2. `BUSI`
														
 
															+3. `BUS-BRA`
														
 
															+4. `BUS_UC`
														
 
															+5. `CCAUI`
														
 
															+6. `DDTI`
														
 
															+7. `OTU_2d`
														
 
															+8. `TN3K`
														
 
															+9. `TG3K`
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 10. 当前损失、指标与优化流程
														
 
															+
														
 
															+### 10.1 当前损失
														
 
															+
														
 
															+当前主路径只保留主分割损失。
														
 
															+
														
 
															+默认配置示例：
														
 
															+
														
 
															+```yaml
														
 
															+loss:
														
 
															+  name: dicece
														
 
															+  task_mode: binary
														
 
															+  params:
														
 
															+    include_background: true
														
 
															+    lambda_dice: 0.7
														
 
															+    lambda_ce: 0.3
														
 
															+```
														
 
															+
														
 
															+也就是说当前优化目标只围绕 mask 分割本身。
														
 
															+
														
 
															+### 10.2 当前指标
														
 
															+
														
 
															+当前验证指标通常为：
														
 
															+
														
 
															+1. `dice`
														
 
															+2. `iou`
														
 
															+
														
 
															+### 10.3 当前优化器
														
 
															+
														
 
															+默认配置：
														
 
															+
														
 
															+1. `adamw`
														
 
															+2. 支持 warmup + cosine scheduler
														
 
															+
														
 
															+### 10.4 当前 AMP
														
 
															+
														
 
															+当前仍支持：
														
 
															+
														
 
															+1. `torch.autocast`
														
 
															+2. `GradScaler`
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 11. 关键配置变量解释（中英对照）
														
 
															+
														
 
															+### 11.1 `trainer.name`
														
 
															+
														
 
															+1. 中文：训练器名称
														
 
															+2. English: trainer name
														
 
															+3. 作用：决定实例化哪个 trainer
														
 
															+4. 当前值：`supervised_segmentation`
														
 
															+
														
 
															+### 11.2 `train.seed`
														
 
															+
														
 
															+1. 中文：随机种子
														
 
															+2. English: random seed
														
 
															+3. 作用：固定随机数种子，控制训练过程中的随机性，便于复现实验结果
														
 
															+
														
 
															+### 11.3 `train.epochs`
														
 
															+
														
 
															+1. 中文：训练轮数
														
 
															+2. English: number of epochs
														
 
															+3. 作用：决定最大训练轮数
														
 
															+
														
 
															+### 11.4 `train.batch_size`
														
 
															+
														
 
															+1. 中文：训练 batch 大小
														
 
															+2. English: training batch size
														
 
															+3. 作用：控制每批样本数
														
 
															+
														
 
															+### 11.5 `train.val_batch_size`
														
 
															+
														
 
															+1. 中文：验证 batch 大小
														
 
															+2. English: validation batch size
														
 
															+3. 作用：控制验证批次大小
														
 
															+
														
 
															+### 11.6 `train.accum_steps`
														
 
															+
														
 
															+1. 中文：梯度累计步数
														
 
															+2. English: gradient accumulation steps
														
 
															+3. 作用：模拟更大有效 batch
														
 
															+
														
 
															+### 11.7 `train.amp`
														
 
															+
														
 
															+1. 中文：自动混合精度
														
 
															+2. English: automatic mixed precision
														
 
															+3. 作用：降低显存占用、提高训练吞吐
														
 
															+
														
 
															+### 11.8 `train.grad_clip.enabled`
														
 
															+
														
 
															+1. 中文：是否启用梯度裁剪
														
 
															+2. English: enable gradient clipping
														
 
															+3. 作用：提升训练稳定性
														
 
															+
														
 
															+### 11.9 `metrics.task_mode`
														
 
															+
														
 
															+1. 中文：指标任务模式
														
 
															+2. English: metric task mode
														
 
															+3. 作用：指定 binary 或 multiclass
														
 
															+
														
 
															+### 11.10 `loss.name`
														
 
															+
														
 
															+1. 中文：损失名称
														
 
															+2. English: loss name
														
 
															+3. 作用：指定分割损失类型
														
 
															+
														
 
															+### 11.11 `dataset.dataset_name`
														
 
															+
														
 
															+1. 中文：数据集名称
														
 
															+2. English: dataset name
														
 
															+3. 作用：决定用哪个数据集构建器
														
 
															+
														
 
															+### 11.12 `dataset.root`
														
 
															+
														
 
															+1. 中文：数据根目录
														
 
															+2. English: dataset root
														
 
															+3. 作用：决定从哪里读取数据
														
 
															+
														
 
															+### 11.13 `dataset.image_size`
														
 
															+
														
 
															+1. 中文：输入图像尺寸
														
 
															+2. English: input image size
														
 
															+3. 作用：控制 resize 大小
														
 
															+
														
 
															+### 11.14 `dataset.num_classes`
														
 
															+
														
 
															+1. 中文：分割类别数
														
 
															+2. English: number of classes
														
 
															+3. 作用：决定分割头输出通道数
														
 
															+
														
 
															+### 11.15 `model.model_name`
														
 
															+
														
 
															+1. 中文：backbone 名称
														
 
															+2. English: backbone model name
														
 
															+3. 作用：决定加载哪个 SwinV2 结构配置
														
 
															+
														
 
															+### 11.16 `model.decoder_channels`
														
 
															+
														
 
															+1. 中文：解码器通道数配置
														
 
															+2. English: decoder channel sizes
														
 
															+3. 作用：控制解码器每层输出维度
														
 
															+
														
 
															+### 11.17 `model.use_multiscale_features`
														
 
															+
														
 
															+1. 中文：是否使用多尺度特征
														
 
															+2. English: use multi-scale features
														
 
															+3. 作用：控制 encoder 是否输出多层特征给 decoder
														
 
															+
														
 
															+### 11.18 `model.include_patch_embed`
														
 
															+
														
 
															+1. 中文：是否包含 patch embed 特征
														
 
															+2. English: include patch embedding feature
														
 
															+3. 作用：控制最浅层特征是否进入解码链
														
 
															+
														
 
															+### 11.19 `optimizer.lr`
														
 
															+
														
 
															+1. 中文：学习率
														
 
															+2. English: learning rate
														
 
															+3. 作用：控制参数更新步长
														
 
															+
														
 
															+### 11.20 `checkpoint.monitor`
														
 
															+
														
 
															+1. 中文：监控指标
														
 
															+2. English: monitored metric
														
 
															+3. 作用：决定 best checkpoint 基于什么指标保存
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 12. 关键运行时变量解释（中英对照）
														
 
															+
														
 
															+### 12.1 `cfg`
														
 
															+
														
 
															+1. 中文：总配置字典
														
 
															+2. English: global config dictionary
														
 
															+3. 作用：控制整个训练流程
														
 
															+
														
 
															+### 12.2 `image`
														
 
															+
														
 
															+1. 中文：输入图像
														
 
															+2. English: input image
														
 
															+3. 典型形状：`[B, C, H, W]`
														
 
															+
														
 
															+### 12.3 `mask`
														
 
															+
														
 
															+1. 中文：真实分割掩膜
														
 
															+2. English: ground-truth mask
														
 
															+3. 典型形状：`[B, 1, H, W]`
														
 
															+
														
 
															+### 12.4 `features`
														
 
															+
														
 
															+1. 中文：编码器多尺度特征
														
 
															+2. English: multi-scale features
														
 
															+3. 作用：供 decoder 恢复空间细节
														
 
															+
														
 
															+### 12.5 `decoder_out`
														
 
															+
														
 
															+1. 中文：解码器输出特征
														
 
															+2. English: decoder output feature
														
 
															+3. 作用：作为分割头输入
														
 
															+
														
 
															+### 12.6 `seg_logits`
														
 
															+
														
 
															+1. 中文：分割 logits
														
 
															+2. English: segmentation logits
														
 
															+3. 作用：主预测结果
														
 
															+
														
 
															+### 12.7 `seg_loss`
														
 
															+
														
 
															+1. 中文：主分割损失
														
 
															+2. English: segmentation loss
														
 
															+3. 作用：训练优化目标
														
 
															+
														
 
															+### 12.8 `total_loss`
														
 
															+
														
 
															+1. 中文：总损失
														
 
															+2. English: total loss
														
 
															+3. 当前关系：`total_loss = seg_loss`
														
 
															+
														
 
															+### 12.9 `best_metric`
														
 
															+
														
 
															+1. 中文：最佳验证指标
														
 
															+2. English: best validation metric
														
 
															+3. 作用：控制 best checkpoint 与 early stopping
														
 
															+
														
 
															+### 12.10 `grad_scaler`
														
 
															+
														
 
															+1. 中文：混合精度梯度缩放器
														
 
															+2. English: gradient scaler
														
 
															+3. 作用：在 AMP 下对损失做动态缩放，避免半精度梯度下溢，保证训练稳定
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 13. 当前实验脚本的真实含义
														
 
															+
														
 
															+文件：`tools/run_us_experiments.sh`
														
 
															+
														
 
															+当前脚本只做纯分割实验组织。
														
 
															+
														
 
															+支持两种模式：
														
 
															+
														
 
															+1. 单个数据集训练
														
 
															+2. 所有数据集批量训练
														
 
															+
														
 
															+已经不再支持：
														
 
															+
														
 
															+1. 边界辅助损失消融
														
 
															+2. 一致性损失消融
														
 
															+3. FWTA 消融
														
 
															+
														
 
															+---
														
 
															+
														
 
															+## 14. 当前状态的最简结论
														
 
															+
														
 
															+当前项目已经完成主路径净化，可以用下面几句话概括：
														
 
															+
														
 
															+1. 当前主模型是 `SegmentationModel2d`。
														
 
															+2. 当前主结构是 `SwinV2Encoder2d + SegmentationDecoder2d + SegmentationHead2d`。
														
 
															+3. 当前训练只做单头分割，不再有边界分支。
														
 
															+4. 当前总损失就是主分割损失，不再有边界损失和一致性损失。
														
 
															+5. 当前配置文件与实验脚本已经去掉 `aux_loss` 和相关消融入口。
														
 
															+6. 当前现役主链不再调用 FWTA，也不再对外保留 FWTA 语义。
														
 
															+
														
--- a/tools/summarize_results.py
+++ b/tools/summarize_results.py
@@ -34,6 +34,10 @@ def _infer_ratio(ckpt: dict[str, Any], path: Path) -> str:
 
															     return "-"
														
 
															+def _infer_ablation_case(ckpt: dict[str, Any], path: Path) -> str:
														
 
															+    return "-"
														
 
															+
														
 
															+
														
 
															 def _extract_metric(metrics: dict[str, Any], *names: str) -> float | None:
														
 
															     for name in names:
														
 
															         value = metrics.get(name)
														
@@ -50,6 +54,7 @@ def collect_rows(outputs_dir: Path) -> list[dict[str, Any]]:
 
															         row = {
														
 
															             "dataset": _infer_dataset(ckpt, best_path),
														
 
															             "mode": _infer_mode(best_path),
														
 
															+            "ablation_case": _infer_ablation_case(ckpt, best_path),
														
 
															             "ratio": _infer_ratio(ckpt, best_path),
														
 
															             "epoch": ckpt.get("epoch"),
														
 
															             "best_metric": ckpt.get("best_metric"),
														
@@ -63,7 +68,7 @@ def collect_rows(outputs_dir: Path) -> list[dict[str, Any]]:
 
															 def write_csv(rows: list[dict[str, Any]], path: Path) -> None:
														
 
															     path.parent.mkdir(parents=True, exist_ok=True)
														
 
															-    fieldnames = ["dataset", "mode", "ratio", "epoch", "best_metric", "dice", "iou", "checkpoint"]
														
 
															+    fieldnames = ["dataset", "mode", "ablation_case", "ratio", "epoch", "best_metric", "dice", "iou", "checkpoint"]
														
 
															     with path.open("w", encoding="utf-8", newline="") as handle:
														
 
															         writer = csv.DictWriter(handle, fieldnames=fieldnames)
														
 
															         writer.writeheader()
														
@@ -75,16 +80,16 @@ def write_markdown(rows: list[dict[str, Any]], path: Path) -> None:
 
															     lines = [
														
 
															         "# 实验结果汇总",
														
 
															         "",
														
 
															-        "| dataset | mode | ratio | epoch | best_metric | dice | iou | checkpoint |",
														
 
															-        "| --- | --- | --- | --- | --- | --- | --- | --- |",
														
 
															+        "| dataset | mode | ablation_case | ratio | epoch | best_metric | dice | iou | checkpoint |",
														
 
															+        "| --- | --- | --- | --- | --- | --- | --- | --- | --- |",
														
 
															     ]
														
 
															     for row in rows:
														
 
															         lines.append(
														
 
															-            f"| {row['dataset']} | {row['mode']} | {row['ratio']} | {row['epoch']} | "
														
 
															+            f"| {row['dataset']} | {row['mode']} | {row['ablation_case']} | {row['ratio']} | {row['epoch']} | "
														
 
															             f"{row['best_metric']} | {row['dice']} | {row['iou']} | {row['checkpoint']} |"
														
 
															         )
														
 
															     if not rows:
														
 
															-        lines.append("| - | - | - | - | - | - | - | - |")
														
 
															+        lines.append("| - | - | - | - | - | - | - | - | - |")
														
 
															     path.write_text("\n".join(lines) + "\n", encoding="utf-8")
														
@@ -103,7 +108,13 @@ def main() -> None:
 
															     write_csv(rows, csv_path)
														
 
															     write_markdown(rows, md_path)
														
 
															-    print({"num_results": len(rows), "csv": str(csv_path), "markdown": str(md_path)})
														
 
															+    print(
														
 
															+        {
														
 
															+            "num_results": len(rows),
														
 
															+            "csv": str(csv_path),
														
 
															+            "markdown": str(md_path),
														
 
															+        }
														
 
															+    )
														
 
															 if __name__ == "__main__":