Xinchi/fuser #75

Open · wants to merge 9 commits into main
2 changes: 1 addition & 1 deletion configs/wan_t2v_dist.json
@@ -10,6 +10,6 @@
"sample_shift": 8,
"enable_cfg": true,
"cpu_offload": false,
"parallel_attn_type": "ulysses",
"parallel_attn_type": "pipefusion",
"parallel_vae": true
}
9 changes: 9 additions & 0 deletions lightx2v/dist/wrappers/distrifusion/cache.py
@@ -0,0 +1,9 @@
class DistriFusionKVCacheManager:
def __init__(self):
pass

def update_cache(self):
pass

def get_cache(self):
pass
91 changes: 91 additions & 0 deletions lightx2v/dist/wrappers/distrifusion/comm.py
@@ -0,0 +1,91 @@
import torch
import torch.distributed as dist
from loguru import logger


class DistriFusionCommManager:
def __init__(self):
self.verbose = True

self.device = "cuda"

self.rank = dist.get_rank()
self.world_size = dist.get_world_size()

self.torch_dtype = None
self.numel = 0
self.numel_dict = {}

self.buffer_list = None

self.starts = []
self.ends = []
self.shapes = []

self.idx_queue = []

self.handles = None

    def register_tensor(
        self, shape: tuple[int, ...] | list[int], torch_dtype: torch.dtype, layer_type: str | None = None
    ) -> int:
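        # Reserve the [start, end) slice for this tensor in the flat per-rank buffer and return its index.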
if self.torch_dtype is None:
self.torch_dtype = torch_dtype
else:
assert self.torch_dtype == torch_dtype
self.starts.append(self.numel)
numel = 1
for dim in shape:
numel *= dim
self.numel += numel
if layer_type is not None:
if layer_type not in self.numel_dict:
self.numel_dict[layer_type] = 0
self.numel_dict[layer_type] += numel

self.ends.append(self.numel)
self.shapes.append(shape)
return len(self.starts) - 1

def create_buffer(self):
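        # Allocate one flat buffer per rank; each registered tensor occupies its [start, end) slice.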
if self.rank == 0 and self.verbose:
logger.info(
f"Create buffer with {self.numel / 1e6:.3f}M parameters for {len(self.starts)} tensors on each device."
)
for layer_type, numel in self.numel_dict.items():
logger.info(f" {layer_type}: {numel / 1e6:.3f}M parameters")

self.buffer_list = [
torch.empty(self.numel, dtype=self.torch_dtype, device=self.device) for _ in range(self.world_size)
]
        self.handles = [None for _ in range(len(self.starts))]

def get_buffer_list(self, idx: int) -> list[torch.Tensor]:
buffer_list = [t[self.starts[idx] : self.ends[idx]].view(self.shapes[idx]) for t in self.buffer_list]
return buffer_list

def communicate(self):
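        # One async all_gather over the contiguous slice spanning all currently queued tensors.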
start = self.starts[self.idx_queue[0]]
end = self.ends[self.idx_queue[-1]]
tensor = self.buffer_list[self.rank][start:end]
buffer_list = [t[start:end] for t in self.buffer_list]
handle = dist.all_gather(buffer_list, tensor, async_op=True)
for i in self.idx_queue:
self.handles[i] = handle
self.idx_queue = []

def enqueue(self, idx: int, tensor: torch.Tensor):
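        # Wrapping back to index 0 means a new pass has started: flush whatever is still queued.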
if idx == 0 and len(self.idx_queue) > 0:
self.communicate()
assert len(self.idx_queue) == 0 or self.idx_queue[-1] == idx - 1
self.idx_queue.append(idx)
self.buffer_list[self.rank][self.starts[idx] : self.ends[idx]].copy_(tensor.flatten())

def clear(self):
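        # Flush any remaining queued tensors, then wait on all outstanding all_gather handles.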
if len(self.idx_queue) > 0:
self.communicate()
if self.handles is not None:
for i in range(len(self.handles)):
if self.handles[i] is not None:
self.handles[i].wait()
self.handles[i] = None
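A minimal usage sketch for DistriFusionCommManager (illustrative, not part of this PR; it assumes torch.distributed is already initialized, e.g. via torchrun, and the per-layer activations are made up):

import torch

from lightx2v.dist.wrappers.distrifusion.comm import DistriFusionCommManager


def gather_activations(activations: list[torch.Tensor]) -> list[list[torch.Tensor]]:
    # One tensor per layer, produced on this rank; all layers are assumed to
    # share one dtype (the manager asserts this).
    manager = DistriFusionCommManager()
    indices = [
        manager.register_tensor(tuple(t.shape), t.dtype, layer_type=f"layer_{i}")
        for i, t in enumerate(activations)
    ]
    manager.create_buffer()

    # Stage each local tensor; enqueue() batches contiguous indices and issues
    # one async all_gather when the index wraps back to 0 (or on clear()).
    for idx, t in zip(indices, activations):
        manager.enqueue(idx, t)
    manager.clear()  # flush the queue and wait on the outstanding handles

    # get_buffer_list(idx) returns one view per rank of gathered tensor idx.
    return [manager.get_buffer_list(idx) for idx in indices]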
8 changes: 8 additions & 0 deletions lightx2v/dist/wrappers/distrifusion/infer.py
@@ -0,0 +1,8 @@
from lightx2v.models.networks.wan.infer.transformer_infer import (
WanTransformerInfer,
)


class DistriFusionWanTransformerInferWrapper:
def __init__(self, transformer_infer: WanTransformerInfer, config):
pass
30 changes: 30 additions & 0 deletions lightx2v/dist/wrappers/distrifusion/model.py
@@ -0,0 +1,30 @@
from lightx2v.models.networks.wan.model import WanModel
from lightx2v.dist.wrappers.distrifusion.infer import DistriFusionWanTransformerInferWrapper
from lightx2v.dist.wrappers.distrifusion.weights import DistriFusionWanTransformerWeightsWrapper


class DistriFusionWanModelWrapper:
def __init__(self, model: WanModel, config):
self.model = model
self.config = config

self._wrap_transformer(self.model, self.config)

    def __getattr__(self, name: str):
        # Only invoked when normal attribute lookup fails, so delegate to the wrapped model.
        return getattr(self.model, name)

def __delattr__(self, name: str):
if name in self.__dict__:
del self.__dict__[name]
else:
del self.model.__dict__[name]

def _wrap_transformer(self, model, config):
model.transformer_weights = DistriFusionWanTransformerWeightsWrapper(model.transformer_weights, config)
model.transformer_infer = DistriFusionWanTransformerInferWrapper(model.transformer_infer, config)

def infer(self, inputs, is_warmup=True):
pass
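A toy sketch of the attribute delegation this wrapper relies on (the stand-in model below is hypothetical; the real WanModel constructor and config are not shown, and the names used are the ones imported at the top of model.py):

class _ToyWanModel:
    def __init__(self):
        self.transformer_weights = object()
        self.transformer_infer = object()
        self.scheduler = "a scheduler"


wrapped = DistriFusionWanModelWrapper(_ToyWanModel(), config={})
# Attributes missing on the wrapper fall through __getattr__ to the wrapped model:
assert wrapped.scheduler == "a scheduler"
# _wrap_transformer() has replaced the transformer modules with DistriFusion wrappers:
assert isinstance(wrapped.transformer_infer, DistriFusionWanTransformerInferWrapper)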
17 changes: 17 additions & 0 deletions lightx2v/dist/wrappers/distrifusion/runner.py
@@ -0,0 +1,17 @@
from lightx2v.dist.wrappers.distrifusion.model import DistriFusionWanModelWrapper
from lightx2v.models.runners.wan.wan_runner import WanRunner


class DistriFusionWanRunnerWrapper:
def __init__(self, runner: WanRunner, config):
self.runner = runner
self.config = config

    def __getattr__(self, name: str):
        # Only invoked when normal attribute lookup fails, so delegate to the wrapped runner.
        return getattr(self.runner, name)

def _wrap(self, runner, config):
runner.model = DistriFusionWanModelWrapper(runner.model, config)
self.runner.run = self.run
9 changes: 9 additions & 0 deletions lightx2v/dist/wrappers/distrifusion/weights.py
@@ -0,0 +1,9 @@
import torch.distributed as dist
from lightx2v.models.networks.wan.weights.transformer_weights import (
WanTransformerWeights,
)


class DistriFusionWanTransformerWeightsWrapper:
def __init__(self, transformer_weights: WanTransformerWeights, config):
pass