
add pp validation for schedule #568

Open

H-Huang wants to merge 2 commits into base: gh/H-Huang/16/base

Changes from 1 commit

12 changes: 12 additions & 0 deletions torchtitan/parallelisms/pipelining_utils.py
@@ -41,6 +41,18 @@ def build_pipeline_schedule(job_config, stages, loss_fn):
     if n_microbatches is None:
         n_microbatches = job_config.experimental.pipeline_parallel_degree
 
+    # Validation that the stages are compatible with the schedule
+    if issubclass(schedule_class, PipelineScheduleSingle):

Contributor:
hm, shouldn't this validation actually go inside of PipelineSchedule* __init__ functions?

H-Huang (Member Author), Sep 5, 2024:
Hm, yeah, for PipelineScheduleMulti's __init__ we do check that len(stages) > 2. I guess the issue I ran into was due to this line below:

    stages if looped_schedule else stages[0],

I accidentally commented out the schedule config, so it defaulted to a single-stage schedule, but the stages were still cut as if it were a "looped schedule". Since only stages[0] is picked up in the line above, the schedule was created without error, but it later caused a hang at runtime.
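
A toy reconstruction of that failure mode (the stage values and variable names below are illustrative stand-ins, not the real torchtitan/PyTorch objects): when the model is cut into multiple stages per rank but the config falls back to a single-stage schedule, the stages[0] branch silently drops the extra stages, so construction succeeds and the mismatch only shows up later as a hang.

    # Hypothetical stand-ins for the pipeline stages built on this rank
    # (the real objects would be PipelineStage instances).
    stages = ["stage_0_on_this_rank", "stage_1_on_this_rank"]  # cut for a looped schedule

    # The accidentally-defaulted config picks a single-stage schedule,
    # so looped_schedule ends up False.
    looped_schedule = False

    # The line quoted above: only stages[0] survives; stages[1] is silently dropped.
    schedule_arg = stages if looped_schedule else stages[0]
    print(schedule_arg)  # "stage_0_on_this_rank" -- no error here, the hang comes later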

H-Huang (Member Author):
If we wanted to be more consistent, we could just support passing in a list of stages for both single and multi schedules; then all of the validation could be done in PyTorch.
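
Not part of the diff: a rough sketch of that suggestion, assuming (hypothetically) that both PipelineScheduleSingle and PipelineScheduleMulti accepted a list of stages, so the caller never special-cases stages[0] and the length checks live upstream in the schedules' __init__ methods (the loss_fn kwarg is assumed from build_pipeline_schedule's signature). The tail of build_pipeline_schedule would then be just:

    # Hypothetical unified call: always pass the full list of stages and let
    # the schedule's __init__ validate it; no `stages[0]` special case.
    return schedule_class(
        stages,
        n_microbatches=n_microbatches,
        loss_fn=loss_fn,
    )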

(diff continued)

+        if len(stages) != 1:
+            raise ValueError(
+                f"PipelineScheduleSingle requires exactly one stage, got {len(stages)}"
+            )
+    elif issubclass(schedule_class, PipelineScheduleMulti):
+        if len(stages) < 2:
+            raise ValueError(
+                f"PipelineScheduleMulti requires at least two stages, got {len(stages)}"
+            )
+
     return schedule_class(
         stages if looped_schedule else stages[0],
         n_microbatches=n_microbatches,
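
For illustration, a self-contained rerun of the added checks, with stub classes standing in for the real PyTorch schedule classes so it runs without torch (class names and stage strings here are hypothetical). The misconfiguration described in the thread now fails fast with a ValueError instead of hanging:

    # Stub schedule classes standing in for torch.distributed.pipelining's
    # PipelineScheduleSingle / PipelineScheduleMulti, only to exercise the checks.
    class PipelineScheduleSingle: ...
    class PipelineScheduleMulti: ...

    def validate(schedule_class, stages):
        # Same logic as the validation block added in this PR.
        if issubclass(schedule_class, PipelineScheduleSingle):
            if len(stages) != 1:
                raise ValueError(
                    f"PipelineScheduleSingle requires exactly one stage, got {len(stages)}"
                )
        elif issubclass(schedule_class, PipelineScheduleMulti):
            if len(stages) < 2:
                raise ValueError(
                    f"PipelineScheduleMulti requires at least two stages, got {len(stages)}"
                )

    validate(PipelineScheduleSingle, ["stage0"])           # passes
    validate(PipelineScheduleMulti, ["stage0", "stage1"])  # passes
    try:
        # The scenario from the thread: stages cut for a looped schedule,
        # but a single-stage schedule selected by the config.
        validate(PipelineScheduleSingle, ["stage0", "stage1"])
    except ValueError as e:
        print(e)  # PipelineScheduleSingle requires exactly one stage, got 2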