ai-dynamo
diff --git a/‎.github/labeler.yml‎
Lines changed: 6 additions & 0 deletions b/‎.github/labeler.yml‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎.github/workflows/generate-allure-report.yml‎
Lines changed: 5 additions & 46 deletions b/‎.github/workflows/generate-allure-report.yml‎
Lines changed: 5 additions & 46 deletions
diff --git a/‎components/src/dynamo/common/protocols/image_protocol.py‎
Lines changed: 3 additions & 0 deletions b/‎components/src/dynamo/common/protocols/image_protocol.py‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎components/src/dynamo/sglang/protocol.py‎
Lines changed: 9 additions & 13 deletions b/‎components/src/dynamo/sglang/protocol.py‎
Lines changed: 9 additions & 13 deletions
diff --git a/‎components/src/dynamo/sglang/request_handlers/image_diffusion/image_diffusion_handler.py‎
Lines changed: 28 additions & 10 deletions b/‎components/src/dynamo/sglang/request_handlers/image_diffusion/image_diffusion_handler.py‎
Lines changed: 28 additions & 10 deletions
diff --git a/‎components/src/dynamo/sglang/tests/test_sglang_image_diffusion_handler.py‎
Lines changed: 57 additions & 2 deletions b/‎components/src/dynamo/sglang/tests/test_sglang_image_diffusion_handler.py‎
Lines changed: 57 additions & 2 deletions
diff --git a/‎deploy/operator/internal/controller/dynamographdeployment_controller.go‎
Lines changed: 22 additions & 0 deletions b/‎deploy/operator/internal/controller/dynamographdeployment_controller.go‎
Lines changed: 22 additions & 0 deletions
diff --git a/‎deploy/operator/internal/discovery/resource.go‎
Lines changed: 1 addition & 1 deletion b/‎deploy/operator/internal/discovery/resource.go‎
Lines changed: 1 addition & 1 deletion
@@ -94,6 +94,12 @@ documentation:
           - '**/*.md'
           - '**/*.rst'
 
+xpu:
+  - changed-files:
+      - any-glob-to-any-file:
+          - '**/xpu/**'
+          - '**/*xpu*'
+
 multimodal:
   - changed-files:
       - any-glob-to-any-file:
 
@@ -94,15 +94,6 @@ jobs:
         run: |
           git fetch origin gh-pages:gh-pages 2>/dev/null || echo "No gh-pages branch yet"
 
-          # Restore history for Allure 3 report (primary, at allure/${SUBDIR}/)
-          # Allure 3 uses history.jsonl (not history/*.json like Allure 2)
-          if git show "gh-pages:allure/${SUBDIR}/history.jsonl" 2>/dev/null; then
-            git show "gh-pages:allure/${SUBDIR}/history.jsonl" > allure-v3-history.jsonl
-            echo "Restored Allure 3 history.jsonl from gh-pages/allure/${SUBDIR}"
-          else
-            echo "No previous Allure 3 history found"
-          fi
-
           # Restore history for Allure 2 report (at allure/v2/${SUBDIR}/)
           if git show "gh-pages:allure/v2/${SUBDIR}/history" 2>/dev/null; then
             mkdir -p allure-results/history
@@ -119,20 +110,6 @@ jobs:
         run: |
           ./allure2-cli/bin/allure generate allure-results -o allure-report --clean
 
-      - name: Generate Allure 3 Report
-        if: steps.check-results.outputs.has_results == 'true'
-        run: |
-          mkdir -p allure-v3-workspace/allure-results
-          # Copy results but exclude Allure 2 history dir to avoid format confusion
-          rsync -a --exclude='history' allure-results/ allure-v3-workspace/allure-results/
-          # Restore Allure 3 history.jsonl into the workspace
-          if [ -f allure-v3-history.jsonl ]; then
-            cp allure-v3-history.jsonl allure-v3-workspace/history.jsonl
-          fi
-          # historyPath requires a config file
-          echo 'export default { historyPath: "./history.jsonl" };' > allure-v3-workspace/allurerc.mjs
-          npx allure generate --config="${GITHUB_WORKSPACE}/allure-v3-workspace/allurerc.mjs" --cwd allure-v3-workspace -o allure-report-v3
-
       - name: Generate unified dashboard
         if: steps.check-results.outputs.has_results == 'true'
         env:
@@ -149,18 +126,18 @@ jobs:
           for dir in pr post-merge nightly release; do
             if [ "$dir" = "$SUBDIR" ]; then continue; fi
             if git show "gh-pages:dashboard-results/${dir}" 2>/dev/null; then
-              mkdir -p "unified-workspace/allure-results/${dir}-imported"
               git archive gh-pages "dashboard-results/${dir}" | tar -x -C /tmp/
-              cp -r "/tmp/dashboard-results/${dir}/"* "unified-workspace/allure-results/${dir}-imported/" 2>/dev/null || true
+              cp -r "/tmp/dashboard-results/${dir}/"* "unified-workspace/allure-results/" 2>/dev/null || true
             fi
           done
 
-          # Restore unified dashboard history for trend charts
+          # Restore unified dashboard history for trend charts (or seed empty file)
           if git show "gh-pages:allure/history.jsonl" 2>/dev/null; then
             git show "gh-pages:allure/history.jsonl" > unified-workspace/history.jsonl
             echo "Restored unified dashboard history from gh-pages"
           else
             echo "No previous unified dashboard history found"
+            touch unified-workspace/history.jsonl
           fi
 
           # Generate unified dashboard using allurerc.mjs
@@ -189,23 +166,6 @@ jobs:
             git checkout --orphan gh-pages
           fi
 
-          # One-time cleanup: remove old path layout from before allure/ prefix migration
-          for old_dir in allure-all pre-merge pre-merge-v2 post-merge post-merge-v2 nightly nightly-v2 release release-v2; do
-            if [ -d "$old_dir" ]; then
-              echo "Removing legacy directory: $old_dir"
-              rm -rf "$old_dir"
-            fi
-          done
-
-          # Deploy Allure 3 report (primary)
-          mkdir -p "allure/${SUBDIR}"
-          rm -rf "allure/${SUBDIR}/"*
-          cp -r "${GITHUB_WORKSPACE}/allure-report-v3/"* "allure/${SUBDIR}/"
-          # Persist Allure 3 history.jsonl for trend charts
-          if [ -f "${GITHUB_WORKSPACE}/allure-v3-workspace/history.jsonl" ]; then
-            cp "${GITHUB_WORKSPACE}/allure-v3-workspace/history.jsonl" "allure/${SUBDIR}/history.jsonl"
-          fi
-
           # Deploy Allure 2 report
           mkdir -p "allure/v2/${SUBDIR}"
           rm -rf "allure/v2/${SUBDIR}/"*
@@ -216,7 +176,7 @@ jobs:
           rm -rf "dashboard-results/${SUBDIR}/"*
           rsync -a --exclude='history' "${GITHUB_WORKSPACE}/allure-results/" "dashboard-results/${SUBDIR}/"
 
-          # Deploy unified dashboard (overwrites report files, preserves subdirs)
+          # Deploy unified dashboard (per-workflow tabs generated by allurerc.mjs plugins)
           mkdir -p allure
           cp -r "${GITHUB_WORKSPACE}/allure-all-report/"* allure/
           # Persist history.jsonl for trend charts
@@ -248,6 +208,5 @@ jobs:
         run: |
           echo "## Allure Reports" >> $GITHUB_STEP_SUMMARY
           echo "" >> $GITHUB_STEP_SUMMARY
-          echo "- [Allure Report](https://ai-dynamo.github.io/dynamo/allure/${SUBDIR}/)" >> $GITHUB_STEP_SUMMARY
+          echo "- [Allure Dashboard](https://ai-dynamo.github.io/dynamo/allure/)" >> $GITHUB_STEP_SUMMARY
           echo "- [Allure 2 Report](https://ai-dynamo.github.io/dynamo/allure/v2/${SUBDIR}/)" >> $GITHUB_STEP_SUMMARY
-          echo "- [Unified Dashboard](https://ai-dynamo.github.io/dynamo/allure/)" >> $GITHUB_STEP_SUMMARY
@@ -65,6 +65,9 @@ class NvCreateImageRequest(BaseModel):
     moderation: Optional[str] = None
     """Content moderation level: auto or low."""
 
+    input_reference: Optional[str] = None
+    """Optional image reference that guides generation (for I2I)."""
+
     nvext: Optional[ImageNvExt] = None
     """NVIDIA extensions."""
 
 
@@ -7,6 +7,7 @@
 from sglang.srt.entrypoints.openai.protocol import ChatCompletionRequest
 
 from dynamo.common.multimodal import TransferRequest
+from dynamo.common.protocols.image_protocol import ImageNvExt
 
 TokenIdType = int
 
@@ -143,18 +144,13 @@ class DisaggSglangMultimodalRequest(BaseModel):
 # ============================================================================
 
 
-class NvExt(BaseModel):
-    """NVIDIA extensions for image generation"""
-
-    negative_prompt: Optional[str] = None
-    num_inference_steps: Optional[int] = 50
-    guidance_scale: float = 7.5
-    seed: Optional[int] = None
-    annotations: Optional[list[str]] = None
-
-
 class CreateImageRequest(BaseModel):
-    """OpenAI /v1/images/generations compatible request"""
+    """OpenAI /v1/images/generations and /v1/images/edits compatible request.
+
+    Generation params (seed, guidance_scale, num_inference_steps, negative_prompt)
+    are specified under ``nvext``.  SGLang-specific defaults (guidance_scale=7.5,
+    num_inference_steps=50) are applied in the handler, not the model.
+    """
 
     prompt: str
     model: str  # e.g. "stabilityai/stable-diffusion-3.5-medium"
@@ -163,9 +159,9 @@ class CreateImageRequest(BaseModel):
     quality: Optional[str] = "standard"  # standard, hd
     response_format: Optional[str] = "url"  # url or b64_json
     user: Optional[str] = None
+    input_reference: Optional[str] = None  # For I2I/TI2I - image path/url
 
-    # NVIDIA extensions nested under nvext
-    nvext: Optional[NvExt] = None
+    nvext: Optional[ImageNvExt] = None
 
 
 class ImageData(BaseModel):
 
@@ -14,16 +14,19 @@
 from PIL import Image
 
 from dynamo._core import Context
+from dynamo.common.protocols.image_protocol import ImageNvExt
 from dynamo.common.storage import upload_to_fs
 from dynamo.common.utils.otel_tracing import build_trace_headers
 from dynamo.sglang.args import Config
-from dynamo.sglang.protocol import CreateImageRequest, ImageData, ImagesResponse, NvExt
+from dynamo.sglang.protocol import CreateImageRequest, ImageData, ImagesResponse
 from dynamo.sglang.publisher import DynamoSglangPublisher
 from dynamo.sglang.request_handlers.handler_base import BaseGenerativeHandler
 
 logger = logging.getLogger(__name__)
 
 MAX_NUM_INFERENCE_STEPS = 50
+DEFAULT_NUM_INFERENCE_STEPS = 50
+DEFAULT_GUIDANCE_SCALE = 7.5
 
 
 class ImageDiffusionWorkerHandler(BaseGenerativeHandler):
@@ -92,11 +95,17 @@ async def generate(
         try:
             req = CreateImageRequest(**request)
 
-            # get extra parameters
-            nvext = req.nvext or NvExt()
-            nvext.num_inference_steps = min(
-                nvext.num_inference_steps or 50, MAX_NUM_INFERENCE_STEPS
-            )
+            nvext = req.nvext or ImageNvExt()
+
+            # Apply SGLang-specific defaults for unset values
+            raw_steps = nvext.num_inference_steps or DEFAULT_NUM_INFERENCE_STEPS
+            if raw_steps > MAX_NUM_INFERENCE_STEPS:
+                logger.warning(
+                    f"num_inference_steps={raw_steps} exceeds max "
+                    f"{MAX_NUM_INFERENCE_STEPS}, clamping"
+                )
+            num_inference_steps = min(raw_steps, MAX_NUM_INFERENCE_STEPS)
+            guidance_scale = nvext.guidance_scale or DEFAULT_GUIDANCE_SCALE
 
             width, height = self._parse_size(req.size)
 
@@ -105,9 +114,10 @@ async def generate(
                 negative_prompt=nvext.negative_prompt,
                 width=width,
                 height=height,
-                num_inference_steps=nvext.num_inference_steps,
-                guidance_scale=nvext.guidance_scale,
+                num_inference_steps=num_inference_steps,
+                guidance_scale=guidance_scale,
                 seed=nvext.seed,
+                input_reference=req.input_reference,
             )
 
             context_id = context.id()
@@ -145,6 +155,7 @@ async def _generate_images(
         guidance_scale: float,
         seed: Optional[int],
         negative_prompt: Optional[str] = None,
+        input_reference: Optional[str] = None,
     ) -> list[bytes]:
         """Generate images using SGLang DiffGenerator"""
         args = {
@@ -155,8 +166,15 @@ async def _generate_images(
             "num_inference_steps": num_inference_steps,
             "save_output": False,  # We handle saving ourselves
             "guidance_scale": guidance_scale,
-            "seed": seed if seed else random.randint(0, 1000000),
+            "seed": seed if seed is not None else random.randint(0, 1000000),
         }
+
+        # Add image_path for I2I/TI2I if provided
+        if input_reference is not None:
+            if not input_reference.strip():
+                raise ValueError("input_reference must be a non-empty string")
+            args["image_path"] = input_reference
+
         result = await asyncio.to_thread(
             self.generator.generate,
             sampling_params_kwargs=args,
@@ -175,7 +193,7 @@ async def _generate_images(
         for img in images:
             if isinstance(img, bytes):
                 image_bytes_list.append(img)
-            elif Image is not None and isinstance(img, Image.Image):
+            elif isinstance(img, Image.Image):
                 # Convert PIL Image to bytes
                 buf = io.BytesIO()
                 img.save(buf, format="PNG")
 
@@ -6,7 +6,7 @@
 import base64
 import io
 from types import SimpleNamespace
-from unittest.mock import MagicMock, Mock, patch
+from unittest.mock import AsyncMock, MagicMock, Mock, patch
 
 import pytest
 from PIL import Image
@@ -347,7 +347,7 @@ async def test_generate_with_nvext(self, handler, mock_context):
         """Test that nvext parameters are passed to the generator."""
         test_image = Image.new("RGB", (256, 256), color="yellow")
 
-        handler._generate_images = Mock(return_value=[test_image.tobytes()])
+        handler._generate_images = AsyncMock(return_value=[test_image.tobytes()])
 
         request = {
             "prompt": "A yellow square",
@@ -382,4 +382,59 @@ async def test_generate_with_nvext(self, handler, mock_context):
             guidance_scale=7.5,
             seed=42,
             negative_prompt="negative",
+            input_reference=None,
         )
+
+    @pytest.mark.asyncio
+    async def test_generate_i2i_passes_image_path(
+        self, handler, mock_context, tmp_path
+    ):
+        """Test that input_reference is passed as image_path to the generator."""
+        test_image = Image.new("RGB", (256, 256), color="green")
+
+        handler.generator.generate = Mock(
+            return_value=SimpleNamespace(frames=[test_image])
+        )
+
+        input_ref = str(tmp_path / "test_input.png")
+        request = {
+            "prompt": "Transform this image",
+            "model": "test-model",
+            "size": "256x256",
+            "response_format": "b64_json",
+            "input_reference": input_ref,
+        }
+
+        results = []
+        async for result in handler.generate(request, mock_context):
+            results.append(result)
+
+        # Verify image_path was passed to the generator
+        call_args = handler.generator.generate.call_args
+        sampling_params = call_args[1]["sampling_params_kwargs"]
+        assert sampling_params["image_path"] == input_ref
+
+    @pytest.mark.asyncio
+    async def test_generate_t2i_no_image_path(self, handler, mock_context):
+        """Test that image_path is NOT passed when input_reference is absent."""
+        test_image = Image.new("RGB", (256, 256), color="red")
+
+        handler.generator.generate = Mock(
+            return_value=SimpleNamespace(frames=[test_image])
+        )
+
+        request = {
+            "prompt": "A red square",
+            "model": "test-model",
+            "size": "256x256",
+            "response_format": "b64_json",
+        }
+
+        results = []
+        async for result in handler.generate(request, mock_context):
+            results.append(result)
+
+        # Verify image_path was NOT passed
+        call_args = handler.generator.generate.call_args
+        sampling_params = call_args[1]["sampling_params_kwargs"]
+        assert "image_path" not in sampling_params
@@ -326,6 +326,13 @@ func (r *DynamoGraphDeploymentReconciler) reconcileResources(ctx context.Context
 		return ReconcileResult{}, fmt.Errorf("failed to reconcile EPP resources: %w", err)
 	}
 
+	// Reconcile the wait-for-leader ConfigMap for multinode mp deployments
+	err = r.reconcileWaitLeaderConfigMap(ctx, dynamoDeployment)
+	if err != nil {
+		logger.Error(err, "Failed to reconcile wait-leader ConfigMap")
+		return ReconcileResult{}, fmt.Errorf("failed to reconcile wait-leader ConfigMap: %w", err)
+	}
+
 	// Determine if any service is multinode
 	hasMultinode := dynamoDeployment.HasAnyMultinodeService()
 
@@ -1582,6 +1589,21 @@ func (r *DynamoGraphDeploymentReconciler) reconcileEPPResources(ctx context.Cont
 	return nil
 }
 
+// reconcileWaitLeaderConfigMap syncs the ConfigMap built by
+// dynamo.GenerateWaitLeaderConfigMap (the wait-for-leader Python script) for
+// DGDs that have at least one multinode service, and does nothing otherwise.
+// The ConfigMap is only mounted by vLLM mp worker pods (via UpdatePodSpec);
+// for other backends it is inert.
+func (r *DynamoGraphDeploymentReconciler) reconcileWaitLeaderConfigMap(ctx context.Context, dgd *nvidiacomv1alpha1.DynamoGraphDeployment) error {
+	if !dgd.HasAnyMultinodeService() {
+		// No multinode service in this DGD: nothing to sync.
+		return nil
+	}
+
+	waitLeaderCM := dynamo.GenerateWaitLeaderConfigMap(dgd.Name, dgd.Namespace)
+	generate := func(context.Context) (*corev1.ConfigMap, bool, error) {
+		return waitLeaderCM, false, nil
+	}
+	if _, _, err := commoncontroller.SyncResource(ctx, r, dgd, generate); err != nil {
+		return err
+	}
+	return nil
+}
+
 func (r *DynamoGraphDeploymentReconciler) FinalizeResource(ctx context.Context, dynamoDeployment *nvidiacomv1alpha1.DynamoGraphDeployment) error {
 	// for now doing nothing
 	return nil
 
@@ -55,7 +55,7 @@ func GetK8sDiscoveryRole(dgdName string, namespace string) *rbacv1.Role {
 		Rules: []rbacv1.PolicyRule{
 			{
 				APIGroups: []string{apiGroupCore},
-				Resources: []string{"endpoints"},
+				Resources: []string{"endpoints", "pods"},
 				Verbs:     []string{"get", "list", "watch"},
 			},
 			{
| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
| | | `@@ -55,7 +55,7 @@ func GetK8sDiscoveryRole(dgdName string, namespace string) *rbacv1.Role {` |
| 55 | 55 | `Rules: []rbacv1.PolicyRule{` |
| 56 | 56 | `{` |
| 57 | 57 | `APIGroups: []string{apiGroupCore},` |
| 58 | | `- Resources: []string{"endpoints"},` |
| | 58 | `+ Resources: []string{"endpoints", "pods"},` |
| 59 | 59 | `Verbs: []string{"get", "list", "watch"},` |
| 60 | 60 | `},` |
| 61 | 61 | `{` |
`61`	`61`	`{`