name: "Evaluation tests"
run-name: "Evaluation tests"
# Required repository secrets:
# - AICORE_SECRET
# - COMPANION_CONFIGMAP
# - GARDENER_TEST_CLUSTER_URL
# - GARDENER_TEST_CLUSTER_AUTH_TOKEN
# - GARDENER_TEST_CLUSTER_CA_DATA
# - HANA_DB
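# The AICORE_SECRET and COMPANION_CONFIGMAP secrets are expected to contain base64-encoded
# Kubernetes manifests (they are decoded with 'base64 -d' and applied below). A minimal sketch
# of how they could be populated, assuming the GitHub CLI (file names illustrative):
#   base64 -w0 aicore-secret.yaml | gh secret set AICORE_SECRET
#   base64 -w0 companion-configmap.yaml | gh secret set COMPANION_CONFIGMAP
# The AI Core secret manifest is expected to expose stringData keys such as clientid, clientsecret,
# auth_url, base_url, resource_group, configuration_id_gpt4_mini, and deployment_id_gpt4_mini,
# which the evaluation job below reads with yq.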
on:
  pull_request_target:
    types: [labeled, opened, synchronize, reopened, ready_for_review]
    branches:
      - main
    paths-ignore:
      - ".github/**"
      - ".reuse/**"
      - "LICENSES/**"
      - "config/**"
      - "data/**"
      - "docs/**"
      - "scripts/**"
      - "tests/**"
      - "**/*.md"
      - "doc_indexer/**"
      - CODEOWNERS
      - LICENSE
# Global environment variables.
env:
  DOCKER_TIMEOUT: 30
  K3D_VERSION: "v5.7.2" # Required K3d version.
  REPOSITORY_FULL_NAME: "${{ github.repository }}" # <owner>/<repository-name>.
  GITHUB_EVENT_ACTION: "${{ github.event.action }}"
  IMAGE_NAME: "europe-docker.pkg.dev/kyma-project/dev/kyma-companion:PR-${{ github.event.number }}"
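  # For example, for pull request 1234 this resolves to
  # europe-docker.pkg.dev/kyma-project/dev/kyma-companion:PR-1234.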
jobs:
  wait-for-build:
    name: Wait for image build job
    runs-on: ubuntu-latest
    if: contains(github.event.pull_request.labels.*.name, 'evaluation requested')
    steps:
      - name: Checkout code
        uses: actions/checkout@v4
        with:
          ref: main
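          # This job checks out 'main' rather than the PR head; with pull_request_target the workflow
          # has access to repository secrets, so only scripts from the trusted base branch run here.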
      - name: Set up Python
        uses: actions/setup-python@v5
        with:
          python-version: "3.10"
          cache: "pip"
      - name: Install requirements
        run: |
          pip install -r ./scripts/python/wait-for-commit-check/requirements.txt
      - name: Wait for build
        env:
          GITHUB_TOKEN: ${{ github.token }}
          # Note: 'github.event.pull_request.head.sha' is not the same as 'github.sha' on pull requests.
          GIT_REF: ${{ github.event.pull_request.head.sha }}
          REPOSITORY_FULL_NAME: "${{ github.repository }}"
          # The reusable image-builder workflow from neighbors appends the "Build image" suffix to the check run name.
          GIT_CHECK_RUN_NAME: "build / Build image"
          INTERVAL: 60
          TIMEOUT: 900
        run: |
          python ./scripts/python/wait-for-commit-check/run.py
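        # run.py is assumed to poll the GitHub Checks API for GIT_REF until the check run named in
        # GIT_CHECK_RUN_NAME succeeds, roughly equivalent to repeatedly running:
        #   gh api "repos/${REPOSITORY_FULL_NAME}/commits/${GIT_REF}/check-runs" \
        #     --jq '.check_runs[] | select(.name == "build / Build image") | .conclusion'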
  evaluation-tests:
    name: Run evaluation tests
    needs: wait-for-build
    runs-on: ubuntu-latest
    steps:
      - name: Checkout code
        uses: actions/checkout@v4
        with:
          ref: ${{ github.event.pull_request.head.ref }}
          repository: ${{ github.event.pull_request.head.repo.full_name }}
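          # This checks out the PR head (including forks, via head.repo.full_name). The run is gated by
          # the 'evaluation requested' label through the wait-for-build job this job depends on.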
      - name: K3d Setup - Install Kubectl CLI
        run: |
          curl -LO "https://storage.googleapis.com/kubernetes-release/release/$(curl -s https://storage.googleapis.com/kubernetes-release/release/stable.txt)/bin/linux/amd64/kubectl"
          chmod +x ./kubectl
          mv ./kubectl /usr/local/bin/kubectl
          kubectl version --client
      - name: K3d Setup - Install K3d CLI
        id: install-k3d
        run: |
          curl -s https://raw.githubusercontent.com/k3d-io/k3d/main/install.sh | TAG=${K3D_VERSION} bash
          k3d --version
          k3d_version=$(k3d --version | cut -d " " -f 3 | head -1 | xargs)
          if [ "$k3d_version" != "${K3D_VERSION}" ]; then
            echo "K3d version is not correct. Expected: ${K3D_VERSION}, got: $k3d_version"
            exit 1
          fi
          echo "K3d version is correct: $k3d_version"
      - name: K3d Setup - Provision K3d cluster
        run: |
          echo "::group::K3d - Provision"
          k3d cluster create test-cluster --verbose --agents=1 -p 9080:80@loadbalancer -p 9443:443@loadbalancer -p "32000:32000@agent:0"
          echo "::endgroup::"
      - name: K3d Setup - Verify K3d context
        run: |
          echo "::group::K3d - Context"
          context_name=$(kubectl config current-context)
          if [ "$context_name" != "k3d-test-cluster" ]; then
            echo "K3d context is not correct. Expected: k3d-test-cluster, got: $context_name"
            exit 1
          fi
          echo "K3d context is correct"
          echo "::endgroup::"
      - name: Redis Setup - Deploy Redis using Helm
        run: |
          kubectl create namespace redis
          helm repo add redis-stack https://redis-stack.github.io/helm-redis-stack/
          echo "Installing Redis using Helm..."
          helm install --wait redis-stack redis-stack/redis-stack --set auth.enabled=false -n redis
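        # Assumption: the companion reaches Redis through the chart's default in-cluster Service,
        # e.g. redis-stack.redis.svc.cluster.local:6379; the actual endpoint comes from the ConfigMap below.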
      - name: Companion Deploy - Create namespace
        run: |
          kubectl apply -f scripts/k8s/companion-namespace.yaml
      - name: Companion Deploy - Create secret
        run: |
          echo "${{ secrets.AICORE_SECRET }}" | base64 -d > scripts/k8s/aicore-secret.yaml
          kubectl apply -f scripts/k8s/aicore-secret.yaml
          rm -f scripts/k8s/aicore-secret.yaml
      - name: Companion Deploy - Create ConfigMap
        run: |
          echo "${{ secrets.COMPANION_CONFIGMAP }}" | base64 -d > scripts/k8s/companion-configmap.yaml
          kubectl apply -f scripts/k8s/companion-configmap.yaml
          rm -f scripts/k8s/companion-configmap.yaml
      - name: Companion Deploy - Update image name in Deployment
        run: |
          sed -i "s|example.com/ai-backend:stable|${{ env.IMAGE_NAME }}|g" scripts/k8s/companion-deployment.yaml
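        # After this substitution the Deployment pulls the PR image defined in IMAGE_NAME, for example
        # (illustrative): image: europe-docker.pkg.dev/kyma-project/dev/kyma-companion:PR-1234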
      - name: Companion Deploy - Create Deployment and NodePort Service
        run: |
          kubectl apply -f scripts/k8s/companion-deployment.yaml
      - name: Companion Deploy - Wait for deployment
        run: |
          echo "Waiting for backend pods (label: app=ai-backend) to be ready..."
          kubectl wait --for=condition=Ready pod -l 'app=ai-backend' -n ai-core --timeout=300s
          sleep 30
      - name: Companion Deploy - Test reachability through NodePort
        run: |
          curl --fail http://localhost:32000/readyz
      - name: Companion Deploy - Debug information
        if: failure()
        run: |
          kubectl get deploy -n ai-core
          kubectl get pod -n ai-core
          kubectl logs -n ai-core -l app=ai-backend
      - name: Evaluation Tests Setup - Extract project Python version
        working-directory: tests/blackbox
        id: python-version
        run: |
          ./../../scripts/shell/extract-python-version.sh
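        # extract-python-version.sh is assumed to publish the project's Python version to the workflow
        # environment, roughly: echo "PYTHON_VERSION=3.12" >> "$GITHUB_ENV" (version illustrative);
        # the setup-python step below reads it via env.PYTHON_VERSION.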
      - name: Evaluation Tests Setup - Install Python
        uses: actions/setup-python@v5
        with:
          python-version: ${{ env.PYTHON_VERSION }}
      - name: Evaluation Tests Setup - Install Poetry
        working-directory: tests/blackbox
        run: |
          curl -sSL https://install.python-poetry.org | python3 -
          echo "$HOME/.local/bin" >> $GITHUB_PATH
      - name: Evaluation Tests Setup - Install dependencies
        working-directory: tests/blackbox
        run: poetry install
      - name: Evaluation Tests Setup - Prepare test configurations
        id: eval-tests-configs
        env:
          AICORE_SECRET: ${{ secrets.AICORE_SECRET }}
          HANA_DB_SECRET: ${{ secrets.HANA_DB }}
        run: |
          # AI Core configurations.
          echo "${AICORE_SECRET}" | base64 -d > aicore-secret.yaml
          echo "AICORE_CLIENT_ID=$(yq eval '.stringData.clientid' aicore-secret.yaml)" >> $GITHUB_OUTPUT
          echo "AICORE_CLIENT_SECRET=$(yq eval '.stringData.clientsecret' aicore-secret.yaml)" >> $GITHUB_OUTPUT
          echo "AICORE_AUTH_URL=$(yq eval '.stringData.auth_url' aicore-secret.yaml)" >> $GITHUB_OUTPUT
          echo "AICORE_BASE_URL=$(yq eval '.stringData.base_url' aicore-secret.yaml)" >> $GITHUB_OUTPUT
          echo "AICORE_RESOURCE_GROUP=$(yq eval '.stringData.resource_group' aicore-secret.yaml)" >> $GITHUB_OUTPUT
          echo "AICORE_CONFIGURATION_ID_GPT4_MINI=$(yq eval '.stringData.configuration_id_gpt4_mini' aicore-secret.yaml)" >> $GITHUB_OUTPUT
          echo "AICORE_DEPLOYMENT_ID_GPT4_MINI=$(yq eval '.stringData.deployment_id_gpt4_mini' aicore-secret.yaml)" >> $GITHUB_OUTPUT
          # Cleanup.
          rm -f aicore-secret.yaml
      - name: Run Evaluation Tests
        working-directory: tests/blackbox
        env:
          LOG_LEVEL: "DEBUG"
          TEST_DATA_PATH: "./data"
          COMPANION_API_URL: "http://localhost:32000"
          # Gardener test cluster configurations.
          TEST_CLUSTER_URL: ${{ secrets.GARDENER_TEST_CLUSTER_URL }}
          TEST_CLUSTER_CA_DATA: ${{ secrets.GARDENER_TEST_CLUSTER_CA_DATA }}
          TEST_CLUSTER_AUTH_TOKEN: ${{ secrets.GARDENER_TEST_CLUSTER_AUTH_TOKEN }}
          # AI Core configurations.
          AICORE_CLIENT_ID: ${{ steps.eval-tests-configs.outputs.AICORE_CLIENT_ID }}
          AICORE_CLIENT_SECRET: ${{ steps.eval-tests-configs.outputs.AICORE_CLIENT_SECRET }}
          AICORE_AUTH_URL: ${{ steps.eval-tests-configs.outputs.AICORE_AUTH_URL }}
          AICORE_BASE_URL: ${{ steps.eval-tests-configs.outputs.AICORE_BASE_URL }}
          AICORE_RESOURCE_GROUP: ${{ steps.eval-tests-configs.outputs.AICORE_RESOURCE_GROUP }}
          AICORE_CONFIGURATION_ID_GPT4_MINI: ${{ steps.eval-tests-configs.outputs.AICORE_CONFIGURATION_ID_GPT4_MINI }}
          AICORE_DEPLOYMENT_ID_GPT4_MINI: ${{ steps.eval-tests-configs.outputs.AICORE_DEPLOYMENT_ID_GPT4_MINI }}
        run: |
          poetry run python src/run_evaluation.py
      - name: Evaluation Tests - Debug information
        if: failure()
        run: |
          kubectl get deploy -n ai-core
          kubectl get pod -n ai-core
          kubectl logs -n ai-core -l app=ai-backend