diff --git a/.github/workflows/e2e-test-tune-api.yaml b/.github/workflows/e2e-test-tune-api.yaml index 329b2ae6173..68426f23bed 100644 --- a/.github/workflows/e2e-test-tune-api.yaml +++ b/.github/workflows/e2e-test-tune-api.yaml @@ -68,10 +68,12 @@ jobs: - name: Fetch Experiment Pod Logs if: always() # Run this step even if previous steps fail run: | + kubectl get pods -n default POD_NAME=$(kubectl get pods -n default --no-headers -o custom-columns=":metadata.name" | grep tune-example-2) echo "Fetching logs for pod: $POD_NAME" kubectl describe pod $POD_NAME -n default kubectl logs $POD_NAME -n default + kubectl get events -n default | grep "tune-example-2" strategy: fail-fast: false diff --git a/test/e2e/v1beta1/scripts/gh-actions/run-e2e-tune-api.py b/test/e2e/v1beta1/scripts/gh-actions/run-e2e-tune-api.py index 1a5f9eed99d..9e327ac6adf 100644 --- a/test/e2e/v1beta1/scripts/gh-actions/run-e2e-tune-api.py +++ b/test/e2e/v1beta1/scripts/gh-actions/run-e2e-tune-api.py @@ -14,7 +14,7 @@ from verify import verify_experiment_results -# Experiment timeout is 40 min. -EXPERIMENT_TIMEOUT = 60 * 40 +# Experiment timeout is 15 min. +EXPERIMENT_TIMEOUT = 60 * 15 # The default logging config. logging.basicConfig(level=logging.INFO) @@ -197,6 +197,7 @@ def run_e2e_experiment_create_by_tune_with_external_model( logging.info("---------------------------------------------------------------") logging.info(f"E2E is failed for Experiment created by tune: {exp_namespace}/{exp_name}-2") get_experiment_pods_logs(katib_client, f"{exp_name}-2", exp_namespace) + get_experiment_pods_logs(katib_client, "katib-controller", "kubeflow") raise e finally: # Delete the Experiment.