@@ -201,38 +201,77 @@ def test_get_args_from_recipe_compute(
     )
     assert mock_gpu_args.call_count == 0
     assert mock_trainium_args.call_count == 0
-    assert args is None
-
-@pytest.mark.parametrize(
-    "test_case",
-    [
-        {
-            "model_type": "llama_v3",
-            "script": "llama_pretrain.py",
-            "model_base_name": "llama_v3",
-        },
-        {
-            "model_type": "mistral",
-            "script": "mistral_pretrain.py",
-            "model_base_name": "mistral",
-        },
-        {
-            "model_type": "deepseek_llamav3",
-            "script": "deepseek_pretrain.py",
-            "model_base_name": "deepseek",
-        },
-        {
-            "model_type": "deepseek_qwenv2",
-            "script": "deepseek_pretrain.py",
-            "model_base_name": "deepseek",
-        },
-    ],
+
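+# Each case pairs a recipe model_type with the base model name and pretrain
+# script the helper is expected to derive from it.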
+@pytest.mark.parametrize(
+    "test_case",
+    [
+        {
+            "model_type": "llama_v3",
+            "model_base_name": "llama",
+            "script": "llama_pretrain.py",
+        },
+        {
+            "model_type": "mistral",
+            "model_base_name": "mistral",
+            "script": "mistral_pretrain.py",
+        },
+        {
+            "model_type": "deepseek_llamav3",
+            "model_base_name": "deepseek",
+            "script": "deepseek_pretrain.py",
+        },
+        {
+            "model_type": "deepseek_qwenv2",
+            "model_base_name": "deepseek",
+            "script": "deepseek_pretrain.py",
+        },
+    ],
+)
+def test_get_trainining_recipe_gpu_model_name_and_script(test_case):
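+    # The helper now takes only model_type and derives the script itself.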
+    model_base_name, script = _get_trainining_recipe_gpu_model_name_and_script(
+        test_case["model_type"]
     )
-def test_get_trainining_recipe_gpu_model_name_and_script(test_case):
-    model_type = test_case["model_type"]
-    script = test_case["script"]
-    model_base_name, script = _get_trainining_recipe_gpu_model_name_and_script(
-        model_type, script
-    )
-    assert model_base_name == test_case["model_base_name"]
-    assert script == test_case["script"]
+    assert model_base_name == test_case["model_base_name"]
+    assert script == test_case["script"]
+
+
+def test_get_args_from_recipe_with_evaluation(temporary_recipe):
+    import os
+    from tempfile import NamedTemporaryFile
+    from sagemaker.train.configs import SourceCode
+
+    # Create a recipe with evaluation config
+    recipe_data = {
+        "trainer": {"num_nodes": 1},
+        "model": {"model_type": "llama_v3"},
+        "evaluation": {"task": "gen_qa"},
+        "processor": {"lambda_arn": "arn:aws:lambda:us-east-1:123456789012:function:MyFunc"},
+    }
+
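+    # Write the recipe to a temporary YAML file for _get_args_from_recipe to load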
+    with NamedTemporaryFile(mode="w", suffix=".yaml", delete=False) as f:
+        yaml.dump(recipe_data, f)
+        recipe_path = f.name
+
+    try:
+        compute = Compute(instance_type="ml.p4d.24xlarge", instance_count=1)
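+        # Stub GPU arg construction so no real recipe resolution happens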
+        with patch("sagemaker.train.sm_recipes.utils._configure_gpu_args") as mock_gpu:
+            mock_source = SourceCode()
+            mock_source.source_dir = "/tmp/test"
+            mock_gpu.return_value = {"source_code": mock_source, "hyperparameters": {}}
+            with patch("sagemaker.train.sm_recipes.utils.OmegaConf.save"):
+                args, _ = _get_args_from_recipe(
+                    training_recipe=recipe_path,
+                    compute=compute,
+                    region_name="us-west-2",
+                    recipe_overrides=None,
+                    requirements=None,
+                )
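+        # The processor's lambda_arn should be propagated into hyperparameters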
+        assert args["hyperparameters"]["lambda_arn"] == "arn:aws:lambda:us-east-1:123456789012:function:MyFunc"
+    finally:
+        os.unlink(recipe_path)