From bf33dd2e5f57f240679c603caa5965719714faf5 Mon Sep 17 00:00:00 2001 From: Julius von Kohout <45896133+juliusvonkohout@users.noreply.github.com> Date: Sun, 20 Jul 2025 21:59:55 +0200 Subject: [PATCH 1/4] Switch to large Oracle runners Signed-off-by: Julius von Kohout <45896133+juliusvonkohout@users.noreply.github.com> --- .github/workflows/full_kubeflow_integration_test.yaml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/full_kubeflow_integration_test.yaml b/.github/workflows/full_kubeflow_integration_test.yaml index 3fee19a864..72ad31cef4 100644 --- a/.github/workflows/full_kubeflow_integration_test.yaml +++ b/.github/workflows/full_kubeflow_integration_test.yaml @@ -20,8 +20,9 @@ jobs: name: Kubeflow Installation and Testing if: ${{ github.repository == 'kubeflow/manifests' }} runs-on: - labels: ubuntu-latest-16-cores - timeout-minutes: 60 + labels: oracle-vm-16cpu-64gb-x86-64 + # labels: ubuntu-latest-16-cores + timeout-minutes: 30 steps: - name: Checkout uses: actions/checkout@v4 From cf88b3cafda578ee28bf21acda5cfbf6605cbc04 Mon Sep 17 00:00:00 2001 From: Julius von Kohout <45896133+juliusvonkohout@users.noreply.github.com> Date: Mon, 21 Jul 2025 10:06:14 +0200 Subject: [PATCH 2/4] Update full_kubeflow_integration_test.yaml Signed-off-by: Julius von Kohout <45896133+juliusvonkohout@users.noreply.github.com> --- .github/workflows/full_kubeflow_integration_test.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/full_kubeflow_integration_test.yaml b/.github/workflows/full_kubeflow_integration_test.yaml index 72ad31cef4..cac595e241 100644 --- a/.github/workflows/full_kubeflow_integration_test.yaml +++ b/.github/workflows/full_kubeflow_integration_test.yaml @@ -22,7 +22,7 @@ jobs: runs-on: labels: oracle-vm-16cpu-64gb-x86-64 # labels: ubuntu-latest-16-cores - timeout-minutes: 30 + timeout-minutes: 45 steps: - name: Checkout uses: actions/checkout@v4 From
2b12d5d57bd62aef2df843d44b353c5c2fecece2 Mon Sep 17 00:00:00 2001 From: Julius von Kohout <45896133+juliusvonkohout@users.noreply.github.com> Date: Mon, 21 Jul 2025 10:56:18 +0200 Subject: [PATCH 3/4] Update training_operator_test.sh Signed-off-by: Julius von Kohout <45896133+juliusvonkohout@users.noreply.github.com> --- tests/training_operator_test.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/training_operator_test.sh b/tests/training_operator_test.sh index 8a8c99bb11..d78468da97 100755 --- a/tests/training_operator_test.sh +++ b/tests/training_operator_test.sh @@ -12,4 +12,4 @@ kubectl get pods -n $KF_PROFILE --show-labels kubectl wait --for=condition=Ready pod -l training.kubeflow.org/replica-type=worker -n $KF_PROFILE --timeout=180s -kubectl wait --for=condition=Succeeded pytorchjob/pytorch-simple -n $KF_PROFILE --timeout=450s \ No newline at end of file +kubectl wait --for=condition=Succeeded pytorchjob/pytorch-simple -n $KF_PROFILE --timeout=600s From 5cb49d3df617aee35ffad06c051ffb188abb2cf6 Mon Sep 17 00:00:00 2001 From: Julius von Kohout <45896133+juliusvonkohout@users.noreply.github.com> Date: Mon, 21 Jul 2025 11:23:53 +0200 Subject: [PATCH 4/4] Update full_kubeflow_integration_test.yaml Signed-off-by: Julius von Kohout <45896133+juliusvonkohout@users.noreply.github.com> --- .github/workflows/full_kubeflow_integration_test.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/full_kubeflow_integration_test.yaml b/.github/workflows/full_kubeflow_integration_test.yaml index cac595e241..2ee6bcf703 100644 --- a/.github/workflows/full_kubeflow_integration_test.yaml +++ b/.github/workflows/full_kubeflow_integration_test.yaml @@ -106,7 +106,7 @@ jobs: run: chmod u+x tests/*.sh && ./tests/spark_install.sh - name: Wait for All Pods to be Ready - run: kubectl wait --for=condition=Ready pods --all --all-namespaces --timeout 60s --field-selector=status.phase!=Succeeded + run: kubectl wait 
--for=condition=Ready pods --all --all-namespaces --timeout 90s --field-selector=status.phase!=Succeeded - name: Port-forward the istio-ingress gateway run: ./tests/port_forward_gateway.sh