You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@airflow.apache.org by on...@apache.org on 2023/08/31 02:32:09 UTC

[airflow] branch main updated: Raise max runtime for sagemaker jobs in system test (#33942)

This is an automated email from the ASF dual-hosted git repository.

onikolas pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/airflow.git


The following commit(s) were added to refs/heads/main by this push:
     new ba31c68094 Raise max runtime for sagemaker jobs in system test (#33942)
ba31c68094 is described below

commit ba31c680945c14ea5e431b1b2bac6c8bfcc55543
Author: Raphaël Vandon <va...@amazon.com>
AuthorDate: Wed Aug 30 19:32:02 2023 -0700

    Raise max runtime for sagemaker jobs in system test (#33942)
    
    We've had several occurrences recently of training jobs being terminated before finishing because of this limit.
    When this happens, the outputs are not produced, and the test fails.
    Thus it makes sense to give it a bit more time to complete.
---
 tests/system/providers/amazon/aws/example_sagemaker.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/system/providers/amazon/aws/example_sagemaker.py b/tests/system/providers/amazon/aws/example_sagemaker.py
index c71740f1ca..90211004b4 100644
--- a/tests/system/providers/amazon/aws/example_sagemaker.py
+++ b/tests/system/providers/amazon/aws/example_sagemaker.py
@@ -255,7 +255,7 @@ def set_up(env_id, role_arn):
         "ProcessingResources": {
             "ClusterConfig": resource_config,
         },
-        "StoppingCondition": {"MaxRuntimeInSeconds": 60},
+        "StoppingCondition": {"MaxRuntimeInSeconds": 300},
         "AppSpecification": {
             "ImageUri": ecr_repository_uri,
         },
@@ -294,7 +294,7 @@ def set_up(env_id, role_arn):
         "ExperimentConfig": {"ExperimentName": experiment_name},
         "ResourceConfig": resource_config,
         "RoleArn": role_arn,
-        "StoppingCondition": {"MaxRuntimeInSeconds": 60},
+        "StoppingCondition": {"MaxRuntimeInSeconds": 300},
         "TrainingJobName": training_job_name,
     }
     model_trained_weights = (
@@ -357,7 +357,7 @@ def set_up(env_id, role_arn):
             "OutputDataConfig": {"S3OutputPath": f"s3://{bucket_name}/{training_output_s3_key}"},
             "ResourceConfig": resource_config,
             "RoleArn": role_arn,
-            "StoppingCondition": {"MaxRuntimeInSeconds": 60},
+            "StoppingCondition": {"MaxRuntimeInSeconds": 300},
         },
     }
     transform_config = {