A load testing tool for LLM streaming APIs.
git clone https://github.com/twaka/loadllm.git
cd loadllm
npm install
npm run build
chmod +x dist/cli.js
export OPENAI_API_BASE="http://localhost:8000/v1" # OpenAI-compatible endpoint to test
export OPENAI_API_KEY="sk-your-key" # API key for the endpoint

- Run a test with 3 concurrent virtual users for 60 seconds using the gpt-oss-20b model:

dist/cli.js -m gpt-oss-20b -c 3 -d 60
