diff --git a/samples/core/xgboost_training_cm/xgboost_training_cm.py b/samples/core/xgboost_training_cm/xgboost_training_cm.py index 8705c806f5b0..01bf3a989497 100644 --- a/samples/core/xgboost_training_cm/xgboost_training_cm.py +++ b/samples/core/xgboost_training_cm/xgboost_training_cm.py @@ -209,17 +209,17 @@ def xgb_train_pipeline( project='{{kfp-project-id}}', diagnostic_mode='HALT_ON_ERROR', rounds=5, - workers=1, ): output_template = str(output) + '/' + dsl.RUN_ID_PLACEHOLDER + '/data' region='us-central1' - quota_check=[{'region':region,'metric':'CPUS','quota_needed':1.0}] + workers=2 + quota_check=[{'region':region,'metric':'CPUS','quota_needed':12.0}] train_data='gs://ml-pipeline-playground/sfpd/train.csv' eval_data='gs://ml-pipeline-playground/sfpd/eval.csv' schema='gs://ml-pipeline-playground/sfpd/schema.json' true_label='ACTION' target='resolution' - required_apis='storage-api.googleapis.com, dataproc.googleapis.com' + required_apis='dataproc.googleapis.com' cluster_name='xgb-%s' % dsl.RUN_ID_PLACEHOLDER # Current GCP pyspark/spark op do not provide outputs as return values, instead, diff --git a/test/sample-test/configs/xgboost_training_cm.config.yaml b/test/sample-test/configs/xgboost_training_cm.config.yaml index 999777646eb0..7f218ae62170 100644 --- a/test/sample-test/configs/xgboost_training_cm.config.yaml +++ b/test/sample-test/configs/xgboost_training_cm.config.yaml @@ -17,6 +17,5 @@ arguments: output: project: ml-pipeline-test rounds: 5 - workers: 2 diagnostic_mode: False test_timeout: 3600 # xgboost needs extra time, 60 * 60 secs