@@ -88,7 +88,7 @@ def test_sdk_e2e_with_gang_scheduling(job_namespace):
88
88
logging .info (TRAINING_CLIENT .list_jobs (job_namespace ))
89
89
90
90
try :
91
- utils .verify_job_e2e (TRAINING_CLIENT , JOB_NAME , job_namespace , wait_timeout = 9000 )
91
+ utils .verify_job_e2e (TRAINING_CLIENT , JOB_NAME , job_namespace , wait_timeout = 900 )
92
92
except Exception as e :
93
93
utils .print_job_results (TRAINING_CLIENT , JOB_NAME , job_namespace )
94
94
TRAINING_CLIENT .delete_job (JOB_NAME , job_namespace )
@@ -123,7 +123,7 @@ def test_sdk_e2e(job_namespace):
123
123
logging .info (TRAINING_CLIENT .list_jobs (job_namespace ))
124
124
125
125
try :
126
- utils .verify_job_e2e (TRAINING_CLIENT , JOB_NAME , job_namespace , wait_timeout = 9000 )
126
+ utils .verify_job_e2e (TRAINING_CLIENT , JOB_NAME , job_namespace , wait_timeout = 900 )
127
127
except Exception as e :
128
128
utils .print_job_results (TRAINING_CLIENT , JOB_NAME , job_namespace )
129
129
TRAINING_CLIENT .delete_job (JOB_NAME , job_namespace )
@@ -156,5 +156,5 @@ def generate_container() -> V1Container:
156
156
return V1Container (
157
157
name = CONTAINER_NAME ,
158
158
image = os .getenv ("JAX_JOB_IMAGE" , "docker.io/kubeflow/jaxjob-dist-spmd-mnist:latest" ),
159
- # resources=V1ResourceRequirements(limits={"memory": "4Gi ", "cpu": "1.6 "}),
159
+ resources = V1ResourceRequirements (limits = {"memory" : "3Gi " , "cpu" : "1.2 " }),
160
160
)
0 commit comments