Model Test #25

Workflow file for this run

.github/workflows/model_test.yml at e7c068d

	# Copyright (c) 2024 Intel Corporation
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.

	name: Model Test

	on:
	workflow_dispatch:

	# If there is a new commit, the previous jobs will be canceled
	concurrency:
	group: ${{ github.workflow }}-${{ github.event.pull_request.number \|\| github.ref }}
	cancel-in-progress: true
	permissions: write-all
	env:
	OUT_SCRIPT_PATH: ${{ github.workspace }}/.github/workflows/scripts/models
	SCRIPT_PATH: /GenAIEval/.github/workflows/scripts
	DOCKER_NAME: "genaieval"
	DOCKER_TAG: "latest"
	CONTAINER_NAME: "modelTest"


	jobs:
	Evaluation-Workflow:
	runs-on: aise-cluster
	strategy:
	matrix:
	include:
	- modelName: "opt-125m"
	datasets: "piqa"
	device: "cpu"
	tasks: "text-generation"
	fail-fast: true

	steps:
	- name: Clean Up Working Directory
	run: sudo rm -rf ${{github.workspace}}/*

	- name: Load environment variables
	if: ${{ matrix.device }} == "cpu"
	run:
	cat ~/actions-runner4/.env >> $GITHUB_ENV

	- name: Checkout out Repo
	uses: actions/checkout@v4
	with:
	submodules: "recursive"
	fetch-tags: true
	# We need this because GitHub needs to clone the branch to pipeline
	- name: Docker Build
	run: \|
	docker build -f ${{ github.workspace }}/.github/workflows/docker/common.dockerfile --build-arg http_proxy="${{ env.HTTP_PROXY_IMAGE_BUILD }}" --build-arg https_proxy="${{ env.HTTPS_PROXY_IMAGE_BUILD }}" -t ${{ env.DOCKER_NAME }}:${{ env.DOCKER_TAG }} .

	- name: Docker Run
	run: \|
	if [[ $(docker ps -a \| grep -i '${{ env.CONTAINER_NAME }}'$) ]]; then
	docker stop ${{ env.CONTAINER_NAME }}
	docker rm -vf ${{ env.CONTAINER_NAME }} \|\| true
	fi
	docker run -dit --disable-content-trust --privileged --name=${{ env.CONTAINER_NAME }} -v /dev/shm:/dev/shm \
	-v ${{ github.workspace }}:/GenAIEval \
	-e http_proxy="${{ env.HTTP_PROXY_IMAGE_BUILD }}" -e https_proxy="${{ env.HTTPS_PROXY_IMAGE_BUILD }}" \
	${{ env.DOCKER_NAME }}:${{ env.DOCKER_TAG }}

	- name: Binary build
	run: \|
	docker exec ${{ env.CONTAINER_NAME }} \
	bash -c "cd /GenAIEval && pip install -r requirements.txt && python setup.py install"

	#- name: Download Reference Artifact
	# id: download-artifact
	# uses: dawidd6/action-download-artifact@v3.1.2
	# with:
	# workflow: model_test.yml
	# name: ${{ matrix.device }}-${{ matrix.modelName }}
	# run_id: ${{ vars.ModelTest_REF_ID }}
	# path: ${{ github.workspace }}/${{ matrix.device }}_${{ matrix.modelName }}_refer_log
	# name_is_regexp: true
	# repo: ${{ github.repository }}
	# check_artifacts: false
	# search_artifacts: false
	# skip_unpack: false
	# if_no_artifact_found: warn

	- name: Evaluation
	run: \|
	docker exec ${{ env.CONTAINER_NAME }} \
	bash -c "cd /GenAIEval/.github/workflows/scripts/models \
	&& bash model_test.sh --model=${{ matrix.modelName }} --device=${{ matrix.device }} --datasets=${{ matrix.datasets }} --tasks=${{ matrix.tasks }}"

	- name: Collect Log
	run: \|
	docker exec ${{ env.CONTAINER_NAME }} \
	bash -c "cd /GenAIEval/.github/workflows/scripts/models \
	&& bash -x collect_log.sh --model=${{ matrix.modelName }} \
	--device=${{ matrix.device }} \
	--datasets=${{ matrix.datasets }} \
	--tasks=${{ matrix.tasks }}"

	- name: Publish pipeline artifact
	uses: actions/upload-artifact@v4
	if: ${{ !cancelled() }}
	with:
	name: ${{ matrix.device }}-${{ matrix.tasks }}-${{ matrix.modelName }}-${{ matrix.datasets }}
	path: \|
	${{ github.workspace }}/${{ matrix.device }}-${{ matrix.tasks }}-${{ matrix.modelName }}-${{ matrix.datasets }}.log
	${{ github.workspace }}/summary.log
	if-no-files-found: ignore # 'warn' or 'ignore' are also available, defaults to `warn`
	retention-days: 60 # 1 <= retention-days <= 90

	Genreate-Report:
	runs-on: ubuntu-latest
	needs: [Evaluation-Workflow]
	steps:
	- name: Checkout out Repo
	uses: actions/checkout@v4

	- name: Download Summary Log
	uses: actions/download-artifact@v4
	with:
	path: ${{ env.OUT_SCRIPT_PATH }}/log
	- name: Display structure of downloaded files
	run: ls -R
	- name: Analysis Summary
	run: \|
	cd ${{ env.OUT_SCRIPT_PATH }}
	ls -R

	- name: Download Reference Artifact
	id: download-artifact
	uses: dawidd6/action-download-artifact@v3.1.2
	with:
	workflow: model-test.yml
	name: FinalReport
	run_id: ${{ vars.ModelTest_REF_ID }}
	path: ${{ env.OUT_SCRIPT_PATH }}
	name_is_regexp: true
	repo: ${{ github.repository }}
	check_artifacts: false
	search_artifacts: false
	skip_unpack: false
	if_no_artifact_found: warn

	- name: Display structure of downloaded files
	run: cd ${{ env.OUT_SCRIPT_PATH }}/log && ls -R

	- name: Generate report
	run: \|
	echo "------ Generating final report.html ------"
	cd ${{ env.OUT_SCRIPT_PATH }}
	mkdir -p generated
	/usr/bin/bash generate_report.sh
	env:
	RUN_DISPLAY_URL: https://https://github.com/opea-project/GenAIEval/actions/runs/${{ github.run_id }}
	BUILD_NUMBER: ${{ github.run_id }}
	JOB_STATUS: succeed

	- name: Publish Report
	uses: actions/upload-artifact@v4
	if: ${{ !cancelled() }}
	with:
	name: FinalReport
	path: ${{ env.OUT_SCRIPT_PATH }}/generated

	- name: Specify performance regression
	if: ${{ !cancelled() }}
	run: \|
	if [ ${{ env.is_perf_reg }} == 'true' ]; then
	echo "[Performance Regression] Some model performance regression occurred, please check artifacts and reports."
	exit 1
	fi

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Model Test #25

Workflow file

Model Test #25

Jobs

Run details

Workflow file for this run