.github/workflows/continuous_batching.yml

Add CB CI tests #1

Workflow file for this run

.github/workflows/continuous_batching.yml at ee1fa38

	on:
	pull_request:
	paths:
	- .github/workflows/continuous_batching.yml
	- src/**
	- samples/**
	- thirdparty/openvino_tokenizers
	- "!**.md"
	permissions: read-all # Required by https://github.com/ossf/scorecard/blob/e23b8ad91fd6a64a0a971ca4fc0a4d1650725615/docs/checks.md#token-permissions
	concurrency:
	group: ${{ github.workflow }}-${{ github.ref }}
	cancel-in-progress: true

	env:
	l_ov_centos_link: https://storage.openvinotoolkit.org/repositories/openvino/packages/nightly/2024.3.0-15805-6138d624dc1/l_openvino_toolkit_centos7_2024.3.0.dev20240626_x86_64.tgz
	l_ov_link: https://storage.openvinotoolkit.org/repositories/openvino/packages/nightly/2024.3.0-15805-6138d624dc1/l_openvino_toolkit_ubuntu20_2024.3.0.dev20240626_x86_64.tgz
	w_ov_link: https://storage.openvinotoolkit.org/repositories/openvino/packages/nightly/2024.3.0-15805-6138d624dc1/w_openvino_toolkit_windows_2024.3.0.dev20240626_x86_64.zip
	m_ov_link: https://storage.openvinotoolkit.org/repositories/openvino/packages/nightly/2024.3.0-15805-6138d624dc1/m_openvino_toolkit_macos_12_6_2024.3.0.dev20240626_x86_64.tgz
	jobs:
	cpp-continuous-batching-ubuntu:
	runs-on: ubuntu-20.04-8-cores
	steps:
	- uses: actions/checkout@v4
	with:
	submodules: recursive
	- uses: actions/setup-python@v4
	with:
	python-version: 3.8
	- name: Install OpenVINO
	run: \|
	mkdir ./ov/
	curl ${{ env.l_ov_link }} \| tar --directory ./ov/ --strip-components 1 -xz
	sudo ./ov/install_dependencies/install_openvino_dependencies.sh
	- name: Download, convert and build
	run: \|
	source ./ov/setupvars.sh
	python -m pip install --upgrade-strategy eager -r ./samples/requirements.txt --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	python -m pip install ./thirdparty/openvino_tokenizers/[transformers] --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	optimum-cli export openvino --trust-remote-code --weight-format fp16 --model TinyLlama/TinyLlama-1.1B-Chat-v1.0 TinyLlama-1.1B-Chat-v1.0
	cmake -DCMAKE_BUILD_TYPE=Release -DENABLE_CONTINUOUS_BATCHING=ON -DENABLE_APPS=ON -DENABLE_PYTHON=ON -S ./ -B ./build/
	cmake --build ./build/ --config Release -j
	- name: Run gtests
	run: \|
	source ./ov/setupvars.sh
	./build/src/cpp/continuous_batching/tests_continuous_batching
	- name: Run accuracy_sample
	run: >
	source ./ov/setupvars.sh
	&& timeout 50s ./build/samples/cpp/accuracy_sample/accuracy_sample -m ./TinyLlama-1.1B-Chat-v1.0/ -n 5
	- name: Run throughput_benchmark
	run: \|
	wget -q https://huggingface.co/datasets/anon8231489123/ShareGPT_Vicuna_unfiltered/resolve/main/ShareGPT_V3_unfiltered_cleaned_split.json
	source ./ov/setupvars.sh
	timeout 150s ./build/samples/cpp/throughput_benchmark/throughput_benchmark -n 10 --dynamic_split_fuse -m ./TinyLlama-1.1B-Chat-v1.0/ --dataset ./ShareGPT_V3_unfiltered_cleaned_split.json --cache_size 1

	continuous_batching_python_lib_ubuntu:
	# A tokenizers' dependency fails to compile on ubuntu-20 n CenOS7 env.
	runs-on: ubuntu-22.04
	env:
	# A tokenizers' dependency fails to compile with Ninja in CenOS7 env.
	CMAKE_GENERATOR: Unix Makefiles
	CMAKE_BUILD_PARALLEL_LEVEL: null
	steps:
	- uses: actions/checkout@v4
	with:
	submodules: recursive
	- uses: actions/setup-python@v4
	with:
	python-version: 3.8
	- run: mkdir ./ov/
	# Install CentOS7 instead of Ubuntu to match PyPI distribution ABI.
	- run: curl ${{ env.l_ov_centos_link }} \| tar --directory ./ov/ --strip-components 1 -xz
	- run: sudo ./ov/install_dependencies/install_openvino_dependencies.sh
	- run: source ./ov/setupvars.sh && cmake -DCMAKE_BUILD_TYPE=Release -DENABLE_CONTINUOUS_BATCHING=ON -DENABLE_APPS=ON -DENABLE_PYTHON=ON -S ./ -B ./build/
	- run: source ./ov/setupvars.sh && cmake --build ./build/ --config Release -j
	- run: source ./ov/setupvars.sh && python -m pip install ./thirdparty/openvino_tokenizers/[transformers] -r ./tests/python_tests/requirements.txt --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly --upgrade-strategy eager
	- run: source ./ov/setupvars.sh && PYTHONPATH=./build/:$PYTHONPATH python -m pytest ./tests/python_tests/continuous_batching/test_sampling.py -m precommit
	- run: source ./ov/setupvars.sh && PYTHONPATH=./build/:$PYTHONPATH python -m pytest ./tests/python_tests/continuous_batching/test_preemption.py -m precommit
	- run: source ./ov/setupvars.sh && python -m pip install .
	- run: python -m pytest ./tests/python_tests/continuous_batching/test_sampling.py -m precommit
	- run: python -m pytest ./tests/python_tests/continuous_batching/test_preemption.py -m precommit

	cpp-continuous-batching-windows:
	runs-on: windows-latest
	defaults:
	run:
	shell: cmd
	steps:
	- uses: actions/checkout@v4
	with:
	submodules: recursive
	- uses: actions/setup-python@v4
	with:
	python-version: 3.8
	- run: curl --output ov.zip ${{ env.w_ov_link }}
	- run: unzip -d ov ov.zip
	- run: dirs=(ov/) && mv ov//* ov && rmdir "${dirs[@]}"
	shell: bash
	- name: Download, convert and build
	run: \|
	call .\ov\setupvars.bat
	python -m pip install --upgrade-strategy eager -r ./samples/requirements.txt --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	python -m pip install ./thirdparty/openvino_tokenizers/[transformers] --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	optimum-cli export openvino --trust-remote-code --weight-format fp16 --model TinyLlama/TinyLlama-1.1B-Chat-v1.0 TinyLlama-1.1B-Chat-v1.0
	cmake -DCMAKE_BUILD_TYPE=Release -DENABLE_CONTINUOUS_BATCHING=ON -DENABLE_APPS=ON -S ./ -B ./build/
	cmake --build ./build/ --config Release -j
	- name: Run gtests
	run: \|
	set PATH=.\build\openvino_genai\;%PATH%
	call .\ov\setupvars.bat
	.\build\src\cpp\continuous_batching\Release\tests_continuous_batching.exe
	- name: Run accuracy_sample
	run: \|
	set PATH=.\build\openvino_genai\;%PATH%
	call .\ov\setupvars.bat
	.\build\samples\cpp\accuracy_sample\Release\accuracy_sample.exe -m .\TinyLlama-1.1B-Chat-v1.0\ -n 5
	- name: Run throughput_benchmark
	run: \|
	curl -o .\ShareGPT_V3_unfiltered_cleaned_split.json -s -L "https://huggingface.co/datasets/anon8231489123/ShareGPT_Vicuna_unfiltered/resolve/main/ShareGPT_V3_unfiltered_cleaned_split.json"
	set PATH=.\build\openvino_genai\;%PATH%
	call .\ov\setupvars.bat
	.\build\samples\cpp\throughput_benchmark\Release\throughput_benchmark.exe -n 2 --dynamic_split_fuse -m .\TinyLlama-1.1B-Chat-v1.0\ --dataset .\ShareGPT_V3_unfiltered_cleaned_split.json --cache_size 1

	cpp-continuous-batching-macos:
	runs-on: macos-12
	steps:
	- uses: actions/checkout@v4
	with:
	submodules: recursive
	- uses: actions/setup-python@v4
	with:
	python-version: 3.8
	- name: Install OpenVINO
	run: \|
	mkdir ./ov/
	curl ${{ env.m_ov_link }} \| tar --directory ./ov/ --strip-components 1 -xz
	brew install coreutils scons
	- name: Download, convert and build
	run: \|
	source ./ov/setupvars.sh
	python -m pip install --upgrade-strategy eager -r ./samples/requirements.txt --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	python -m pip install ./thirdparty/openvino_tokenizers/[transformers] --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	optimum-cli export openvino --trust-remote-code --weight-format fp16 --model TinyLlama/TinyLlama-1.1B-Chat-v1.0 TinyLlama-1.1B-Chat-v1.0
	cmake -DCMAKE_BUILD_TYPE=Release -DENABLE_CONTINUOUS_BATCHING=ON -DENABLE_APPS=ON -S ./ -B ./build/
	cmake --build ./build/ --config Release -j
	- name: Run gtests
	run: \|
	source ./ov/setupvars.sh
	./build/src/cpp/continuous_batching/tests_continuous_batching
	- name: Run accuracy_sample
	run: >
	source ./ov/setupvars.sh
	&& timeout 120s ./build/samples/cpp/accuracy_sample/accuracy_sample -m ./TinyLlama-1.1B-Chat-v1.0/ -n 5
	- name: Run throughput_benchmark
	run: \|
	wget -q https://huggingface.co/datasets/anon8231489123/ShareGPT_Vicuna_unfiltered/resolve/main/ShareGPT_V3_unfiltered_cleaned_split.json
	source ./ov/setupvars.sh
	./build/samples/cpp/throughput_benchmark/throughput_benchmark -n 5 --dynamic_split_fuse -m ./TinyLlama-1.1B-Chat-v1.0/ --dataset ./ShareGPT_V3_unfiltered_cleaned_split.json --cache_size 1

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Add CB CI tests #1

Workflow file

Add CB CI tests #1

Jobs

Run details

Workflow file for this run