.github/workflows/continuous_batching_cpp.yml

Add CB CI tests #10

Workflow file for this run

.github/workflows/continuous_batching_cpp.yml at f1b3cb8

	on:
	pull_request:
	paths:
	- .github/workflows/continuous_batching_cpp.yml
	- src/**
	- samples/**
	- thirdparty/openvino_tokenizers
	- "!**.md"
	permissions: read-all # Required by https://github.com/ossf/scorecard/blob/e23b8ad91fd6a64a0a971ca4fc0a4d1650725615/docs/checks.md#token-permissions
	concurrency:
	group: ${{ github.workflow }}-${{ github.ref }}
	cancel-in-progress: true

	env:
	l_ov_link: https://storage.openvinotoolkit.org/repositories/openvino/packages/nightly/2024.3.0-15805-6138d624dc1/l_openvino_toolkit_ubuntu20_2024.3.0.dev20240626_x86_64.tgz
	w_ov_link: https://storage.openvinotoolkit.org/repositories/openvino/packages/nightly/2024.3.0-15805-6138d624dc1/w_openvino_toolkit_windows_2024.3.0.dev20240626_x86_64.zip
	m_ov_link: https://storage.openvinotoolkit.org/repositories/openvino/packages/nightly/2024.3.0-15805-6138d624dc1/m_openvino_toolkit_macos_12_6_2024.3.0.dev20240626_x86_64.tgz
	jobs:
	cpp-accuracy-sample-ubuntu:
	runs-on: ubuntu-20.04-8-cores
	steps:
	- uses: actions/checkout@v4
	with:
	submodules: recursive
	- uses: actions/setup-python@v4
	with:
	python-version: 3.8
	- name: Install OpenVINO
	run: \|
	mkdir ./ov/
	curl ${{ env.l_ov_link }} \| tar --directory ./ov/ --strip-components 1 -xz
	sudo ./ov/install_dependencies/install_openvino_dependencies.sh
	- name: Download, convert and build
	run: \|
	source ./ov/setupvars.sh
	python -m pip install --upgrade-strategy eager -r ./samples/requirements.txt --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	python -m pip install ./thirdparty/openvino_tokenizers/[transformers] --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	optimum-cli export openvino --trust-remote-code --weight-format fp16 --model TinyLlama/TinyLlama-1.1B-Chat-v1.0 TinyLlama-1.1B-Chat-v1.0
	cmake -DCMAKE_BUILD_TYPE=Release -DENABLE_CONTINUOUS_BATCHING=ON -DENABLE_APPS=ON -S ./ -B ./build/
	cmake --build ./build/ --config Release -j
	- name: Run gtests
	run: \|
	source ./ov/setupvars.sh
	./build/src/cpp/continuous_batching/tests_continuous_batching
	- name: Run accuracy_sample
	run: >
	source ./ov/setupvars.sh
	&& timeout 25s ./build/samples/cpp/accuracy_sample/accuracy_sample -m ./TinyLlama-1.1B-Chat-v1.0/ -n 5
	- name: Run throughput_benchmark
	run: \|
	wget -q https://huggingface.co/datasets/anon8231489123/ShareGPT_Vicuna_unfiltered/resolve/main/ShareGPT_V3_unfiltered_cleaned_split.json
	source ./ov/setupvars.sh
	timeout 50s ./build/samples/cpp/throughput_benchmark/throughput_benchmark -n 10 --dynamic_split_fuse -m ./TinyLlama-1.1B-Chat-v1.0/

	cpp-accuracy-sample-windows:
	runs-on: windows-latest
	defaults:
	run:
	shell: cmd
	steps:
	- uses: actions/checkout@v4
	with:
	submodules: recursive
	- uses: actions/setup-python@v4
	with:
	python-version: 3.8
	- run: curl --output ov.zip ${{ env.w_ov_link }}
	- run: unzip -d ov ov.zip
	- run: dirs=(ov/) && mv ov//* ov && rmdir "${dirs[@]}"
	shell: bash
	- name: Download, convert and build
	run: \|
	call .\ov\setupvars.bat
	python -m pip install --upgrade-strategy eager -r ./samples/requirements.txt --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	python -m pip install ./thirdparty/openvino_tokenizers/[transformers] --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	optimum-cli export openvino --trust-remote-code --weight-format fp16 --model TinyLlama/TinyLlama-1.1B-Chat-v1.0 TinyLlama-1.1B-Chat-v1.0
	cmake -DCMAKE_BUILD_TYPE=Release -DENABLE_CONTINUOUS_BATCHING=ON -DENABLE_APPS=ON -S ./ -B ./build/
	cmake --build ./build/ --config Release -j
	- run: >
	set PATH=.\build\openvino_genai\;%PATH%
	&& call .\ov\setupvars.bat
	&& .\build\samples\cpp\accuracy_sample\Release\accuracy_sample.exe -m .\TinyLlama-1.1B-Chat-v1.0\ -n 5
	# - run: \|
	# echo import transformers > ref.py
	# echo predictions = open('cpp.txt', 'r').read() >> ref.py
	# echo tokenizer = transformers.AutoTokenizer.from_pretrained('TinyLlama/TinyLlama-1.1B-Chat-v1.0', trust_remote_code=True) >> ref.py
	# echo tokenized = tokenizer('69', return_tensors='pt') >> ref.py
	# echo for beam in transformers.AutoModelForCausalLM.from_pretrained('TinyLlama/TinyLlama-1.1B-Chat-v1.0', trust_remote_code=True).generate(**tokenized, max_new_tokens=100, do_sample=False): >> ref.py
	# echo ref = tokenizer.decode(beam[tokenized['input_ids'].numel():], skip_special_tokens=True) >> ref.py
	# echo idx = predictions.find(ref) >> ref.py
	# echo if -1 == idx: >> ref.py
	# echo raise RuntimeError(f'Missing "{ref=}" from predictions') >> ref.py
	# echo predictions = predictions[:idx] + predictions[idx + len(ref):] >> ref.py
	# - run: python ref.py
	# - run: >
	# set PATH=.\build\openvino_genai\;%PATH%
	# && set "PYTHONPATH=./build/"
	# && call .\ov\setupvars.bat
	# && python samples\python\greedy_causal_lm\greedy_causal_lm.py .\TinyLlama-1.1B-Chat-v1.0\ 69 > .\py.txt
	# - run: fc .\cpp.txt .\py.txt

	cpp-accuracy-sample-macos:
	runs-on: macos-12
	steps:
	- uses: actions/checkout@v4
	with:
	submodules: recursive
	- uses: actions/setup-python@v4
	with:
	python-version: 3.8
	- name: Install OpenVINO
	run: \|
	mkdir ./ov/
	curl ${{ env.m_ov_link }} \| tar --directory ./ov/ --strip-components 1 -xz
	brew install coreutils scons
	- name: Download, convert and build
	run: \|
	source ./ov/setupvars.sh
	python -m pip install --upgrade-strategy eager -r ./samples/requirements.txt --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	python -m pip install ./thirdparty/openvino_tokenizers/[transformers] --pre --extra-index-url https://storage.openvinotoolkit.org/simple/wheels/nightly
	optimum-cli export openvino --trust-remote-code --weight-format fp16 --model TinyLlama/TinyLlama-1.1B-Chat-v1.0 TinyLlama-1.1B-Chat-v1.0
	cmake -DCMAKE_BUILD_TYPE=Release -DENABLE_CONTINUOUS_BATCHING=ON -DENABLE_APPS=ON -S ./ -B ./build/
	cmake --build ./build/ --config Release -j
	- run: >
	source ./ov/setupvars.sh
	&& ./build/samples/cpp/accuracy_sample/accuracy_sample -m ./TinyLlama-1.1B-Chat-v1.0/ -n 5

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Add CB CI tests #10

Workflow file

Add CB CI tests #10

Jobs

Run details

Workflow file for this run