Create EKS cluster, deploy CKF and run bundle test #16
Workflow file for this run
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: Create EKS cluster, deploy CKF and run bundle test | |
on: | |
workflow_dispatch: # This event allows manual triggering from the Github UI | |
inputs: | |
uats_branch: | |
description: 'Branch to run the UATs from e.g. main or track/1.8. By default, the workflow uses 1.8.' | |
required: false | |
default: '"1.8"' | |
secrets: | |
BUNDLE_KUBEFLOW_EKS_AWS_ACCESS_KEY_ID: | |
required: true | |
BUNDLE_KUBEFLOW_EKS_AWS_SECRET_ACCESS_KEY: | |
required: true | |
schedule: | |
- cron: "23 0 * * 2" | |
jobs: | |
deploy-ckf-to-eks: | |
runs-on: ubuntu-22.04 | |
env: | |
UATS_BRANCH: ${{ inputs.uats_branch }} | |
PYTHON_VERSION: "3.8" | |
steps: | |
- name: Checkout repository | |
uses: actions/checkout@v2 | |
# Remove once https://github.com/canonical/bundle-kubeflow/issues/761 | |
# is resolved and applied to uats repository. | |
- name: Install python ${{ env.PYTHON_VERSION }} | |
run: | | |
sudo add-apt-repository ppa:deadsnakes/ppa -y | |
sudo apt update -y | |
sudo apt install python${{ env.PYTHON_VERSION }} python${{ env.PYTHON_VERSION }}-distutils python${{ env.PYTHON_VERSION }}-venv -y | |
- name: Install CLI tools | |
run: | | |
wget https://bootstrap.pypa.io/get-pip.py | |
python${{ env.PYTHON_VERSION }} get-pip.py | |
python${{ env.PYTHON_VERSION }} -m pip install tox | |
sudo snap install charmcraft --classic | |
# We need to install form binrary because of this https://bugs.launchpad.net/juju/+bug/2007848 | |
curl -LO https://launchpad.net/juju/3.5/3.5.0/+download/juju-3.5.0-linux-amd64.tar.xz | |
tar xf juju-3.5.0-linux-amd64.tar.xz | |
sudo install -o root -g root -m 0755 juju /usr/local/bin/juju | |
juju version | |
- name: Configure AWS Credentials | |
env: | |
AWS_ACCESS_KEY_ID: ${{ secrets.BUNDLE_KUBEFLOW_EKS_AWS_ACCESS_KEY_ID }} | |
AWS_SECRET_ACCESS_KEY: ${{ secrets.BUNDLE_KUBEFLOW_EKS_AWS_SECRET_ACCESS_KEY }} | |
run: | | |
aws configure set aws_access_key_id $AWS_ACCESS_KEY_ID | |
aws configure set aws_secret_access_key $AWS_SECRET_ACCESS_KEY | |
aws configure set default.region eu-central-1 | |
- name: Install kubectl | |
run: | | |
sudo snap install kubectl --classic --channel=1.24/stable | |
mkdir ~/.kube | |
kubectl version --client | |
- name: Install eksctl | |
run: | | |
sudo apt-get update | |
sudo apt-get install -y unzip | |
curl --silent --location "https://github.com/weaveworks/eksctl/releases/latest/download/eksctl_$(uname -s)_amd64.tar.gz" | tar xz -C /tmp | |
sudo mv /tmp/eksctl /usr/local/bin | |
eksctl version | |
- name: Create cluster | |
run: | | |
eksctl create cluster -f .github/cluster.yaml | |
kubectl get nodes | |
- name: Setup juju | |
run: | | |
juju add-k8s kubeflow --client | |
juju bootstrap kubeflow kubeflow-controller | |
juju add-model kubeflow | |
- name: Test bundle deployment | |
run: | | |
tox -vve test_bundle_deployment-1.8 -- --model kubeflow --keep-models -vv -s | |
- name: Run Kubeflow UATs | |
run: | | |
git clone https://github.com/canonical/charmed-kubeflow-uats.git ~/charmed-kubeflow-uats | |
cd ~/charmed-kubeflow-uats | |
git checkout ${{ env.UATS_BRANCH }} | |
tox -e kubeflow-remote | |
# On failure, capture debugging resources | |
- name: Save debug artifacts | |
uses: canonical/kubeflow-ci/actions/dump-charm-debug-artifacts@main | |
if: always() | |
# On failure, capture debugging resources | |
- name: Get juju status | |
run: juju status | |
if: failure() | |
- name: Get juju debug logs | |
run: juju debug-log --replay --no-tail | |
if: failure() | |
- name: Get all kubernetes resources | |
run: kubectl get all -A | |
if: failure() | |
- name: Get logs from pods with status = Pending | |
run: kubectl -n kubeflow get pods | tail -n +2 | grep Pending | awk '{print $1}' | xargs -n1 kubectl -n kubeflow logs --all-containers=true --tail 100 | |
if: failure() | |
- name: Get logs from pods with status = Failed | |
run: kubectl -n kubeflow get pods | tail -n +2 | grep Failed | awk '{print $1}' | xargs -n1 kubectl -n kubeflow logs --all-containers=true --tail 100 | |
if: failure() | |
- name: Get logs from pods with status = CrashLoopBackOff | |
run: kubectl -n kubeflow get pods | tail -n +2 | grep CrashLoopBackOff | awk '{print $1}' | xargs -n1 kubectl -n kubeflow logs --all-containers=true --tail 100 | |
if: failure() | |
- name: Delete EKS cluster | |
if: always() | |
run: | | |
eksctl delete cluster --region eu-central-1 --name=kubeflow-test | |
delete-unattached-volumes: | |
if: always() | |
uses: ./.github/workflows/delete-aws-volumes.yaml | |
secrets: inherit | |
with: | |
region: eu-central-1 | |
needs: [deploy-ckf-to-eks] |