diff --git a/tests/integration/results/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/experiment.yaml b/tests/integration/results/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/experiment.yaml
new file mode 100644
index 0000000..cec812c
--- /dev/null
+++ b/tests/integration/results/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/experiment.yaml
@@ -0,0 +1,6 @@
+comment: 1x 1x RTX A5000
+experiment: vllm_16g
+experiment_hash: exp_hash_v1:a37636
+run_id: vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000
+slug: 1x_1x_rtx_a5000
+timestamp: 2024-08-27_14-21-55
diff --git a/tests/integration/results/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/output.yaml b/tests/integration/results/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/output.yaml
new file mode 100644
index 0000000..80115b9
--- /dev/null
+++ b/tests/integration/results/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/output.yaml
@@ -0,0 +1,8 @@
+Count to 1000, skip unpopular numbers: 47e766e6b9c4a9530cca0163f395f6bf814a5977b1543e330c7cf9985e68b3f9304c9b58901989b36647313fb3279a276fcbd9abc107f3a84d982ed8713b0c7e
+Describe justice system in UK vs USA in 2000-5000 words: 331a2d29206403d9a76027eb005c9d5e202bcc26d49dc7dd31a4026b612bbafca22264f75cb22548174bdc4675b7a8acb5892d3dd8203b81991bc3fb25995d6b
+Describe schooling system in UK vs USA in 2000-5000 words: 0621808e3ca6777d55024775b4b01ca1b7fa452f713137c72be02ba8c30683b5d19dfb6241ef1605e10d1b90b541f08e15df632e77960ff15b370163fb814d0b
+Explain me some random problem for me in 2000-5000 words: 9f05037cdf6126545027c496e06b7a86b987364e1e07664948b2a5190ff955f7e81c2d3f792752b621f7180e46a6c5c5f379be579f7aeb89ed87722cfaa41f5d
+Tell me entire history of USA: 318fd13f7cbee849f351f5919364f34a8fcafe202050d91d630b3c10523075516d9eaff838f808e3c0ba785dcf857fa03a8a5308b002ffb323a74d4d04f5e3f4
+Write a ballad. Pick a random theme.: 1d5e78e142e62ddeb914053bec41f9987a5b3d9cdf2fd39ac4835460c2b003fa3991799ed0fb9bd4ad068b6a2d63b19c80ebc2e99c29286205c8db71b361929b
+Write an epic story about a dragon and a knight: b5901ec5d261c379acec9180c658e024b5665b3b9a1c52202647a68f7f125467e65a35b3e941e8c7a669689b73cfce49273eacd3e59fd2d3d5c8a0c0686dd9fb
+Write an essay about being a Senior developer.: a6068b4300b724b84ee1ba949824a4647430b745162e21acb85cc4bb9704dc8316ad04d740e18c8c666a4dabf2eee98d3c443b7cb350e6f1441f4c42de5a2f25
diff --git a/tests/integration/results/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/run.local.log b/tests/integration/results/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/run.local.log
new file mode 100644
index 0000000..d11f01a
--- /dev/null
+++ b/tests/integration/results/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/run.local.log
@@ -0,0 +1,15 @@
+2024-08-27 14:21:55,507 - __main__ - INFO - Starting experiment vllm_16g with comment: 1x 1x RTX A5000
+2024-08-27 14:21:55,510 - __main__ - INFO - Local log file: /home/rooter/dev/bac/deterministic-ml/tests/integration/results/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/run.local.log
+2024-08-27 14:21:55,644 - paramiko.transport - INFO - Connected (version 2.0, client OpenSSH_8.9p1)
+2024-08-27 14:21:55,891 - paramiko.transport - INFO - Auth banner: b'Welcome to vast.ai. If authentication fails, try again after a few seconds, and double check your ssh key.\nHave fun!\n'
+2024-08-27 14:21:55,896 - paramiko.transport - INFO - Authentication (publickey) successful!
+2024-08-27 14:21:55,899 - __main__ - INFO - Syncing files to remote
+2024-08-27 14:21:56,106 - tools.ssh - INFO - Command: 'mkdir -p ~/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/output' stdout: '' stderr: '' status_code: 0
+2024-08-27 14:21:59,804 - __main__ - INFO - Setting up remote environment
+2024-08-27 14:23:02,082 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n curl -LsSf https://astral.sh/uv/install.sh | sh\n export PATH=$HOME/.cargo/bin:$PATH\n \n cd ~/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000\n uv venv -p python3.11 --python-preference managed\n source .venv/bin/activate \n uv pip install ./deterministic_ml*.whl pyyaml -r vllm_16g/requirements.txt\n ' stdout: "installing to /root/.cargo/bin\n uv\n uvx\neverything's installed!\n\nTo add $HOME/.cargo/bin to your PATH, either restart your shell or run:\n\n source $HOME/.cargo/env (sh, bash, zsh)\n source $HOME/.cargo/env.fish (fish)\n" stderr: "+ curl -LsSf https://astral.sh/uv/install.sh\n+ sh\ndownloading uv 0.3.4 x86_64-unknown-linux-gnu\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ cd /root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000\n+ uv venv -p python3.11 --python-preference managed\nUsing Python 3.11.9\nCreating virtualenv at: .venv\nActivate with: source .venv/bin/activate\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' 
nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_14-21-55_1x_1x_rtx_a5000 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-21-55_1x_1x_rtx_a5000\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_14-21-55_1x_1x_rtx_a5000) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ uv pip install ./deterministic_ml-0.1.dev7+ge44d014.d20240827-py3-none-any.whl pyyaml -r vllm_16g/requirements.txt\nResolved 124 packages in 2.08s\nPrepared 124 packages in 39.29s\nInstalled 124 packages in 10.29s\n + aiohappyeyeballs==2.4.0\n + aiohttp==3.10.5\n + aiosignal==1.3.1\n + annotated-types==0.7.0\n + anyio==4.4.0\n + attrs==24.2.0\n + audioread==3.0.1\n + certifi==2024.7.4\n + cffi==1.17.0\n + charset-normalizer==3.3.2\n + click==8.1.7\n + cloudpickle==3.0.0\n + datasets==2.21.0\n + decorator==5.1.1\n + deterministic-ml==0.1.dev7+ge44d014.d20240827 (from file:///root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/deterministic_ml-0.1.dev7+ge44d014.d20240827-py3-none-any.whl)\n + dill==0.3.8\n + diskcache==5.6.3\n + distro==1.9.0\n + fastapi==0.112.2\n + filelock==3.15.4\n + frozenlist==1.4.1\n + fsspec==2024.6.1\n + gguf==0.9.1\n + h11==0.14.0\n + httpcore==1.0.5\n + httptools==0.6.1\n + httpx==0.27.1\n + huggingface-hub==0.24.6\n + idna==3.8\n + importlib-metadata==8.4.0\n + interegular==0.3.3\n + jinja2==3.1.4\n + jiter==0.5.0\n + joblib==1.4.2\n + jsonschema==4.23.0\n + jsonschema-specifications==2023.12.1\n + lark==1.2.2\n + lazy-loader==0.4\n + librosa==0.10.2.post1\n + llvmlite==0.43.0\n + lm-format-enforcer==0.10.6\n + markupsafe==2.1.5\n + mpmath==1.3.0\n + msgpack==1.0.8\n + msgspec==0.18.6\n + multidict==6.0.5\n + multiprocess==0.70.16\n + nest-asyncio==1.6.0\n + networkx==3.3\n + numba==0.60.0\n + numpy==1.26.4\n + nvidia-cublas-cu12==12.1.3.1\n + nvidia-cuda-cupti-cu12==12.1.105\n + nvidia-cuda-nvrtc-cu12==12.1.105\n + nvidia-cuda-runtime-cu12==12.1.105\n + nvidia-cudnn-cu12==9.1.0.70\n + nvidia-cufft-cu12==11.0.2.54\n + nvidia-curand-cu12==10.3.2.106\n + nvidia-cusolver-cu12==11.4.5.107\n + nvidia-cusparse-cu12==12.1.0.106\n + nvidia-ml-py==12.560.30\n + nvidia-nccl-cu12==2.20.5\n + nvidia-nvjitlink-cu12==12.6.20\n + nvidia-nvtx-cu12==12.1.105\n + openai==1.42.0\n + outlines==0.0.46\n + packaging==24.1\n + pandas==2.2.2\n + pillow==10.4.0\n + platformdirs==4.2.2\n + pooch==1.8.2\n + prometheus-client==0.20.0\n + prometheus-fastapi-instrumentator==7.0.0\n + protobuf==5.27.3\n + psutil==6.0.0\n + py-cpuinfo==9.0.0\n + pyairports==2.1.1\n + pyarrow==17.0.0\n + pycountry==24.6.1\n + pycparser==2.22\n + pydantic==2.8.2\n + pydantic-core==2.20.1\n + python-dateutil==2.9.0.post0\n + python-dotenv==1.0.1\n + pytz==2024.1\n + pyyaml==6.0.2\n + pyzmq==26.2.0\n + ray==2.34.0\n + referencing==0.35.1\n + regex==2024.7.24\n + requests==2.32.3\n + rpds-py==0.20.0\n + safetensors==0.4.4\n + scikit-learn==1.5.1\n + scipy==1.14.1\n + sentencepiece==0.2.0\n + setuptools==73.0.1\n + six==1.16.0\n + sniffio==1.3.1\n + 
soundfile==0.12.1\n + soxr==0.5.0\n + starlette==0.38.2\n + sympy==1.13.2\n + threadpoolctl==3.5.0\n + tiktoken==0.7.0\n + tokenizers==0.19.1\n + torch==2.4.0\n + torchvision==0.19.0\n + tqdm==4.66.5\n + transformers==4.44.2\n + triton==3.0.0\n + typing-extensions==4.12.2\n + tzdata==2024.1\n + urllib3==2.2.2\n + uvicorn==0.30.6\n + uvloop==0.20.0\n + vllm==0.5.5\n + vllm-flash-attn==2.6.1\n + watchfiles==0.23.0\n + websockets==13.0\n + xformers==0.0.27.post2\n + xxhash==3.5.0\n + yarl==1.9.4\n + zipp==3.20.1\n" status_code: 0
+2024-08-27 14:23:02,091 - __main__ - INFO - Gathering system info
+2024-08-27 14:23:06,086 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m deterministic_ml._internal.sysinfo > ~/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_14-21-55_1x_1x_rtx_a5000 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-21-55_1x_1x_rtx_a5000\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_14-21-55_1x_1x_rtx_a5000) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0
+2024-08-27 14:23:06,090 - __main__ - INFO - Running experiment code on remote
+2024-08-27 14:26:53,904 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_16g ~/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/output | tee ~/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/output/stdout.txt' stdout: "gpu_count=1\nStarting model loading\nINFO 08-27 12:23:17 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3-mini-4k-instruct', speculative_config=None, tokenizer='microsoft/Phi-3-mini-4k-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, rope_scaling=None, rope_theta=None, tokenizer_revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=4096, download_dir=None, load_format=LoadFormat.AUTO, 
tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3-mini-4k-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-27 12:23:20 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:23:20 selector.py:116] Using XFormers backend.\nINFO 08-27 12:23:21 model_runner.py:879] Starting to load model microsoft/Phi-3-mini-4k-instruct...\nINFO 08-27 12:23:21 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:23:21 selector.py:116] Using XFormers backend.\nINFO 08-27 12:23:22 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-27 12:24:34 model_runner.py:890] Loading model weights took 7.1183 GB\nINFO 08-27 12:24:35 gpu_executor.py:121] # GPU blocks: 2004, # CPU blocks: 682\nmodel loading took 80.13 seconds\nStarting 8 responses generation\n8 responses generation took 134.87 seconds\n{'Count to 1000, skip unpopular numbers': '47e766e6b9c4a9530cca0163f395f6bf814a5977b1543e330c7cf9985e68b3f9304c9b58901989b36647313fb3279a276fcbd9abc107f3a84d982ed8713b0c7e',\n 'Describe justice system in UK vs USA in 2000-5000 words': '331a2d29206403d9a76027eb005c9d5e202bcc26d49dc7dd31a4026b612bbafca22264f75cb22548174bdc4675b7a8acb5892d3dd8203b81991bc3fb25995d6b',\n 'Describe schooling system in UK vs USA in 2000-5000 words': '0621808e3ca6777d55024775b4b01ca1b7fa452f713137c72be02ba8c30683b5d19dfb6241ef1605e10d1b90b541f08e15df632e77960ff15b370163fb814d0b',\n 'Explain me some random problem for me in 2000-5000 words': '9f05037cdf6126545027c496e06b7a86b987364e1e07664948b2a5190ff955f7e81c2d3f792752b621f7180e46a6c5c5f379be579f7aeb89ed87722cfaa41f5d',\n 'Tell me entire history of USA': '318fd13f7cbee849f351f5919364f34a8fcafe202050d91d630b3c10523075516d9eaff838f808e3c0ba785dcf857fa03a8a5308b002ffb323a74d4d04f5e3f4',\n 'Write a ballad. 
Pick a random theme.': '1d5e78e142e62ddeb914053bec41f9987a5b3d9cdf2fd39ac4835460c2b003fa3991799ed0fb9bd4ad068b6a2d63b19c80ebc2e99c29286205c8db71b361929b',\n 'Write an epic story about a dragon and a knight': 'b5901ec5d261c379acec9180c658e024b5665b3b9a1c52202647a68f7f125467e65a35b3e941e8c7a669689b73cfce49273eacd3e59fd2d3d5c8a0c0686dd9fb',\n 'Write an essay about being a Senior developer.': 'a6068b4300b724b84ee1ba949824a4647430b745162e21acb85cc4bb9704dc8316ad04d740e18c8c666a4dabf2eee98d3c443b7cb350e6f1441f4c42de5a2f25'}\n" stderr: '+ cd /root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-27_14-21-55_1x_1x_rtx_a5000 \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-21-55_1x_1x_rtx_a5000\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ PS1=\'(2024-08-27_14-21-55_1x_1x_rtx_a5000) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_16g /root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/output\n+ tee /root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/output/stdout.txt\n/root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_fwd")\n/root/experiments/vllm_16g/2024-08-27_14-21-55_1x_1x_rtx_a5000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:344: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. 
Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00 ~/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_14-30-01_1x_1x_rtx_a5000 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-30-01_1x_1x_rtx_a5000\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_14-30-01_1x_1x_rtx_a5000) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0
+2024-08-27 14:30:12,293 - __main__ - INFO - Running experiment code on remote
+2024-08-27 14:32:48,675 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_16g ~/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/output | tee ~/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/output/stdout.txt' stdout: "gpu_count=1\nStarting model loading\nINFO 08-27 12:30:23 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3-mini-4k-instruct', speculative_config=None, tokenizer='microsoft/Phi-3-mini-4k-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, rope_scaling=None, rope_theta=None, tokenizer_revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=4096, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3-mini-4k-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-27 12:30:23 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:30:23 
selector.py:116] Using XFormers backend.\nINFO 08-27 12:30:24 model_runner.py:879] Starting to load model microsoft/Phi-3-mini-4k-instruct...\nINFO 08-27 12:30:24 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:30:24 selector.py:116] Using XFormers backend.\nINFO 08-27 12:30:25 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-27 12:30:29 model_runner.py:890] Loading model weights took 7.1183 GB\nINFO 08-27 12:30:31 gpu_executor.py:121] # GPU blocks: 2004, # CPU blocks: 682\nmodel loading took 9.64 seconds\nStarting 8 responses generation\n8 responses generation took 134.12 seconds\n{'Count to 1000, skip unpopular numbers': '47e766e6b9c4a9530cca0163f395f6bf814a5977b1543e330c7cf9985e68b3f9304c9b58901989b36647313fb3279a276fcbd9abc107f3a84d982ed8713b0c7e',\n 'Describe justice system in UK vs USA in 2000-5000 words': '331a2d29206403d9a76027eb005c9d5e202bcc26d49dc7dd31a4026b612bbafca22264f75cb22548174bdc4675b7a8acb5892d3dd8203b81991bc3fb25995d6b',\n 'Describe schooling system in UK vs USA in 2000-5000 words': '0621808e3ca6777d55024775b4b01ca1b7fa452f713137c72be02ba8c30683b5d19dfb6241ef1605e10d1b90b541f08e15df632e77960ff15b370163fb814d0b',\n 'Explain me some random problem for me in 2000-5000 words': '9f05037cdf6126545027c496e06b7a86b987364e1e07664948b2a5190ff955f7e81c2d3f792752b621f7180e46a6c5c5f379be579f7aeb89ed87722cfaa41f5d',\n 'Tell me entire history of USA': '318fd13f7cbee849f351f5919364f34a8fcafe202050d91d630b3c10523075516d9eaff838f808e3c0ba785dcf857fa03a8a5308b002ffb323a74d4d04f5e3f4',\n 'Write a ballad. Pick a random theme.': '1d5e78e142e62ddeb914053bec41f9987a5b3d9cdf2fd39ac4835460c2b003fa3991799ed0fb9bd4ad068b6a2d63b19c80ebc2e99c29286205c8db71b361929b',\n 'Write an epic story about a dragon and a knight': 'b5901ec5d261c379acec9180c658e024b5665b3b9a1c52202647a68f7f125467e65a35b3e941e8c7a669689b73cfce49273eacd3e59fd2d3d5c8a0c0686dd9fb',\n 'Write an essay about being a Senior developer.': 'a6068b4300b724b84ee1ba949824a4647430b745162e21acb85cc4bb9704dc8316ad04d740e18c8c666a4dabf2eee98d3c443b7cb350e6f1441f4c42de5a2f25'}\n" stderr: '+ cd /root/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-27_14-30-01_1x_1x_rtx_a5000 \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-30-01_1x_1x_rtx_a5000\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' 
-z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ PS1=\'(2024-08-27_14-30-01_1x_1x_rtx_a5000) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_16g /root/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/output\n+ tee /root/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/output/stdout.txt\n/root/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_fwd")\n/root/experiments/vllm_16g/2024-08-27_14-30-01_1x_1x_rtx_a5000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:344: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00 ~/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' 
nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_14-39-44_1x_1x_rtx_a5000 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-39-44_1x_1x_rtx_a5000\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_14-39-44_1x_1x_rtx_a5000) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0
+2024-08-27 14:39:59,370 - __main__ - INFO - Running experiment code on remote
+2024-08-27 14:42:36,467 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_16g ~/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/output | tee ~/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/output/stdout.txt' stdout: "gpu_count=1\nStarting model loading\nINFO 08-27 12:40:10 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3-mini-4k-instruct', speculative_config=None, tokenizer='microsoft/Phi-3-mini-4k-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, rope_scaling=None, rope_theta=None, tokenizer_revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=4096, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3-mini-4k-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-27 12:40:10 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:40:10 selector.py:116] Using XFormers backend.\nINFO 08-27 12:40:11 model_runner.py:879] Starting to load model microsoft/Phi-3-mini-4k-instruct...\nINFO 08-27 12:40:12 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:40:12 selector.py:116] Using XFormers backend.\nINFO 08-27 12:40:12 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-27 12:40:16 model_runner.py:890] Loading model weights took 7.1183 GB\nINFO 08-27 12:40:18 gpu_executor.py:121] # GPU blocks: 2004, # CPU blocks: 682\nmodel loading took 9.59 seconds\nStarting 8 responses generation\n8 responses generation took 134.79 seconds\n{'Count to 1000, skip unpopular numbers': '47e766e6b9c4a9530cca0163f395f6bf814a5977b1543e330c7cf9985e68b3f9304c9b58901989b36647313fb3279a276fcbd9abc107f3a84d982ed8713b0c7e',\n 'Describe justice system in UK vs USA in 2000-5000 words': 
'331a2d29206403d9a76027eb005c9d5e202bcc26d49dc7dd31a4026b612bbafca22264f75cb22548174bdc4675b7a8acb5892d3dd8203b81991bc3fb25995d6b',\n 'Describe schooling system in UK vs USA in 2000-5000 words': '0621808e3ca6777d55024775b4b01ca1b7fa452f713137c72be02ba8c30683b5d19dfb6241ef1605e10d1b90b541f08e15df632e77960ff15b370163fb814d0b',\n 'Explain me some random problem for me in 2000-5000 words': '9f05037cdf6126545027c496e06b7a86b987364e1e07664948b2a5190ff955f7e81c2d3f792752b621f7180e46a6c5c5f379be579f7aeb89ed87722cfaa41f5d',\n 'Tell me entire history of USA': '318fd13f7cbee849f351f5919364f34a8fcafe202050d91d630b3c10523075516d9eaff838f808e3c0ba785dcf857fa03a8a5308b002ffb323a74d4d04f5e3f4',\n 'Write a ballad. Pick a random theme.': '1d5e78e142e62ddeb914053bec41f9987a5b3d9cdf2fd39ac4835460c2b003fa3991799ed0fb9bd4ad068b6a2d63b19c80ebc2e99c29286205c8db71b361929b',\n 'Write an epic story about a dragon and a knight': 'b5901ec5d261c379acec9180c658e024b5665b3b9a1c52202647a68f7f125467e65a35b3e941e8c7a669689b73cfce49273eacd3e59fd2d3d5c8a0c0686dd9fb',\n 'Write an essay about being a Senior developer.': 'a6068b4300b724b84ee1ba949824a4647430b745162e21acb85cc4bb9704dc8316ad04d740e18c8c666a4dabf2eee98d3c443b7cb350e6f1441f4c42de5a2f25'}\n" stderr: '+ cd /root/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-27_14-39-44_1x_1x_rtx_a5000 \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-39-44_1x_1x_rtx_a5000\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ PS1=\'(2024-08-27_14-39-44_1x_1x_rtx_a5000) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_16g /root/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/output\n+ tee /root/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/output/stdout.txt\n/root/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. 
Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_fwd")\n/root/experiments/vllm_16g/2024-08-27_14-39-44_1x_1x_rtx_a5000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:344: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00 ~/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_14-44-48_1x_1x_rtx_a5000 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-44-48_1x_1x_rtx_a5000\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_14-44-48_1x_1x_rtx_a5000) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0
+2024-08-27 14:45:54,056 - __main__ - INFO - Running experiment code on remote
+2024-08-27 14:49:04,620 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_16g ~/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/output | tee ~/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/output/stdout.txt' stdout: "gpu_count=1\nStarting model loading\nINFO 08-27 12:46:05 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3-mini-4k-instruct', speculative_config=None, tokenizer='microsoft/Phi-3-mini-4k-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, rope_scaling=None, rope_theta=None, tokenizer_revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=4096, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), 
observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3-mini-4k-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-27 12:46:06 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:46:06 selector.py:116] Using XFormers backend.\nINFO 08-27 12:46:08 model_runner.py:879] Starting to load model microsoft/Phi-3-mini-4k-instruct...\nINFO 08-27 12:46:08 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:46:08 selector.py:116] Using XFormers backend.\nINFO 08-27 12:46:09 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-27 12:47:20 model_runner.py:890] Loading model weights took 7.1183 GB\nINFO 08-27 12:47:21 gpu_executor.py:121] # GPU blocks: 2233, # CPU blocks: 682\nmodel loading took 78.82 seconds\nStarting 8 responses generation\n8 responses generation took 99.26 seconds\n{'Count to 1000, skip unpopular numbers': '47e766e6b9c4a9530cca0163f395f6bf814a5977b1543e330c7cf9985e68b3f9304c9b58901989b36647313fb3279a276fcbd9abc107f3a84d982ed8713b0c7e',\n 'Describe justice system in UK vs USA in 2000-5000 words': '331a2d29206403d9a76027eb005c9d5e202bcc26d49dc7dd31a4026b612bbafca22264f75cb22548174bdc4675b7a8acb5892d3dd8203b81991bc3fb25995d6b',\n 'Describe schooling system in UK vs USA in 2000-5000 words': '0621808e3ca6777d55024775b4b01ca1b7fa452f713137c72be02ba8c30683b5d19dfb6241ef1605e10d1b90b541f08e15df632e77960ff15b370163fb814d0b',\n 'Explain me some random problem for me in 2000-5000 words': '9f05037cdf6126545027c496e06b7a86b987364e1e07664948b2a5190ff955f7e81c2d3f792752b621f7180e46a6c5c5f379be579f7aeb89ed87722cfaa41f5d',\n 'Tell me entire history of USA': '318fd13f7cbee849f351f5919364f34a8fcafe202050d91d630b3c10523075516d9eaff838f808e3c0ba785dcf857fa03a8a5308b002ffb323a74d4d04f5e3f4',\n 'Write a ballad. 
Pick a random theme.': '1d5e78e142e62ddeb914053bec41f9987a5b3d9cdf2fd39ac4835460c2b003fa3991799ed0fb9bd4ad068b6a2d63b19c80ebc2e99c29286205c8db71b361929b',\n 'Write an epic story about a dragon and a knight': 'b5901ec5d261c379acec9180c658e024b5665b3b9a1c52202647a68f7f125467e65a35b3e941e8c7a669689b73cfce49273eacd3e59fd2d3d5c8a0c0686dd9fb',\n 'Write an essay about being a Senior developer.': 'a6068b4300b724b84ee1ba949824a4647430b745162e21acb85cc4bb9704dc8316ad04d740e18c8c666a4dabf2eee98d3c443b7cb350e6f1441f4c42de5a2f25'}\n" stderr: '+ cd /root/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-27_14-44-48_1x_1x_rtx_a5000 \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-44-48_1x_1x_rtx_a5000\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ PS1=\'(2024-08-27_14-44-48_1x_1x_rtx_a5000) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_16g /root/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/output\n+ tee /root/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/output/stdout.txt\n/root/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_fwd")\n/root/experiments/vllm_16g/2024-08-27_14-44-48_1x_1x_rtx_a5000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:344: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. 
Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00 ~/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_14-56-46_1x_rtx_4090 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-56-46_1x_rtx_4090\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_14-56-46_1x_rtx_4090) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0
+2024-08-27 14:58:14,270 - __main__ - INFO - Running experiment code on remote
+2024-08-27 15:03:55,321 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_16g ~/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/output | tee ~/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/output/stdout.txt' stdout: "gpu_count=1\nStarting model loading\nINFO 08-27 12:58:26 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3-mini-4k-instruct', speculative_config=None, tokenizer='microsoft/Phi-3-mini-4k-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, rope_scaling=None, rope_theta=None, tokenizer_revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=4096, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3-mini-4k-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-27 12:58:29 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:58:29 selector.py:116] Using XFormers backend.\nINFO 08-27 
12:58:33 model_runner.py:879] Starting to load model microsoft/Phi-3-mini-4k-instruct...\nINFO 08-27 12:58:33 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:58:33 selector.py:116] Using XFormers backend.\nINFO 08-27 12:58:33 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-27 13:01:35 model_runner.py:890] Loading model weights took 7.1183 GB\nINFO 08-27 13:01:37 gpu_executor.py:121] # GPU blocks: 2170, # CPU blocks: 682\nmodel loading took 196.25 seconds\nStarting 8 responses generation\n8 responses generation took 130.16 seconds\n{'Count to 1000, skip unpopular numbers': '546198e7a8aab75a2e7e18ced14cfa23be3fc19362496163b14eacca7406e3527f04efd67be916fb87705c100c2e2a81e8ccdaae5d389f862020ef8f3e73a8c4',\n 'Describe justice system in UK vs USA in 2000-5000 words': 'd197beaf5d3a4d5b82f520a5845c76b5c6827d3bf1f5565c6e56f614b5f2cf588f5ab4790be2fd12f31f584923fbac4cd2b3a8b50f484221e9eb5c724cdca973',\n 'Describe schooling system in UK vs USA in 2000-5000 words': '050a7ef858d9be0c386ceefbf2a729f0938201026477137d1a2066c1f2b135f3d3bdf0d17846a9c80fb5ab64296923e86b4ae794c60747d6784749a66d4f7e6e',\n 'Explain me some random problem for me in 2000-5000 words': 'f546a57138eb952dbb8dace7d46d06e976da96ea6e489b532824e4b42b68bdabea4d97c08ec38c4766a1827c247a550a6e542c572dcd0f7b1ca224415fcb5661',\n 'Tell me entire history of USA': '9e1870ab7240877ab7adbc86eb3b62ddf68e5a270020b454bb4c3a77a7a35a214b3eda6b819c2b6a5019bec4f9d712522f94860df377a2c3edcdc685861cb837',\n 'Write a ballad. Pick a random theme.': '30ee7bd7c5393814debaa7008acf5188ffba68af09f539bb141414376cdf322c76f81bdeca1a15a575659569cd1ddd392ff467c7cb4baec16b8cbc9fd41b018c',\n 'Write an epic story about a dragon and a knight': '6447f18aabf3bac7dd79a451a1b66f632061e7a447b25a5be8829c1501518126c64cb42f791441544902be06ea63e0450807303520bb4d3a111fbfff19641e68',\n 'Write an essay about being a Senior developer.': '6a25eb3c90d572794f575470cd8b916892db8777f7830bb0b87afc0e7126e90c090878a19294bc73a5b7a42c56de5ce04f84d368099f9d59df7a2e8d38b0ff3a'}\n" stderr: '+ cd /root/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-27_14-56-46_1x_rtx_4090 \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-56-46_1x_rtx_4090\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ 
PS1=\'(2024-08-27_14-56-46_1x_rtx_4090) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_16g /root/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/output\n+ tee /root/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/output/stdout.txt\n/root/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_fwd")\n/root/experiments/vllm_16g/2024-08-27_14-56-46_1x_rtx_4090/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:344: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00 ~/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' 
nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_14-58-04_1x_rtx_4080s '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-58-04_1x_rtx_4080s\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_14-58-04_1x_rtx_4080s) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0
+2024-08-27 14:59:35,486 - __main__ - INFO - Running experiment code on remote
+2024-08-27 15:04:20,497 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_16g ~/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/output | tee ~/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/output/stdout.txt' stdout: "gpu_count=1\nStarting model loading\nINFO 08-27 12:59:46 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3-mini-4k-instruct', speculative_config=None, tokenizer='microsoft/Phi-3-mini-4k-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, rope_scaling=None, rope_theta=None, tokenizer_revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=4096, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3-mini-4k-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-27 12:59:48 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:59:48 selector.py:116] Using XFormers backend.\nINFO 08-27 12:59:50 model_runner.py:879] Starting to load model microsoft/Phi-3-mini-4k-instruct...\nINFO 08-27 12:59:50 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 12:59:50 selector.py:116] Using XFormers backend.\nINFO 08-27 12:59:50 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-27 13:01:03 model_runner.py:890] Loading model weights took 7.1183 GB\nINFO 08-27 13:01:04 gpu_executor.py:121] # GPU blocks: 1005, # CPU blocks: 682\nmodel loading took 80.54 seconds\nStarting 8 responses generation\nWARNING 08-27 13:02:06 scheduler.py:1242] Sequence group 7 is preempted by PreemptionMode.RECOMPUTE mode because there is not enough KV cache space. This can affect the end-to-end performance. Increase gpu_memory_utilization or tensor_parallel_size to provide more KV cache memory. 
total_num_cumulative_preemption=1\n8 responses generation took 191.26 seconds\n{'Count to 1000, skip unpopular numbers': '8826e45b35b12de22a71803cd67cfaf0e47f3d83adbc9c95d9026d864761d8a88850adb3bd115de8f28c73bccb09e7dec0c4f40f0c85972292a72bcc4c3a344e',\n 'Describe justice system in UK vs USA in 2000-5000 words': '4989a42c2e1fc4552d4f403d0e9b22b5e7144d813ea38a9c1490adc82eee1d1537408c1e0140a2726cafac0ebe8601661fd088f80bb539898a745f5ae41de5ca',\n 'Describe schooling system in UK vs USA in 2000-5000 words': '85393953c469ff11238c24e7a8c4c8891f0b2f7cf80dc42b15c98c20f9ccb870b7ad4842f9272dd902f2bd7e3c04270adeba92e1e68979e6decd788d63df7ffa',\n 'Explain me some random problem for me in 2000-5000 words': '5a07c589a60d0c597ec31800171d07c0e5394beab896ad186472e8b589bd3998d1500076af33885addc03a116fc2bf807ebcef4beef2595d49dabae61b811ed0',\n 'Tell me entire history of USA': '61285b07965a2d1e456aa5a64450c68c3ef01377d2f6f6b87cb146932aeb3bff0ffb0b892c8fcf2c0ba65e6a8e514e78ec1f9bb1c50dc033e8d129049701d989',\n 'Write a ballad. Pick a random theme.': 'e13a867f6e7a044f0d90bcf4cca2e07373abf93bf072b66a664e1dd71f72092779797dec166559eae130d85a02660d60003c4f230e443848802ec0534abc6e6d',\n 'Write an epic story about a dragon and a knight': '29549b2b8a3ef34db9fd949e789c27c5418942548414cbc9f8e84d391e6693c5a0ac85018898d590918f584557d1820f5c58062a87c92d380a9ce42ba328e971',\n 'Write an essay about being a Senior developer.': '53a19fca3c796a5d7c5f2fa3a24577d71bb6a543e2ed367fd36be3b20b84bd17525adb389db04bec804e4134f63f58132029d1e456f4dee119226a40df024b7c'}\n" stderr: '+ cd /root/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-27_14-58-04_1x_rtx_4080s \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_14-58-04_1x_rtx_4080s\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ PS1=\'(2024-08-27_14-58-04_1x_rtx_4080s) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_16g /root/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/output\n+ tee /root/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/output/stdout.txt\n/root/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. 
Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_fwd")\n/root/experiments/vllm_16g/2024-08-27_14-58-04_1x_rtx_4080s/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:344: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00 ~/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_15-26-43_1x_rtx_4090 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_15-26-43_1x_rtx_4090\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_15-26-43_1x_rtx_4090) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0 +2024-08-27 15:26:54,977 - __main__ - INFO - Running experiment code on remote +2024-08-27 15:29:31,245 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_16g ~/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/output | tee ~/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/output/stdout.txt' stdout: "gpu_count=1\nStarting model loading\nINFO 08-27 13:27:06 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3-mini-4k-instruct', speculative_config=None, tokenizer='microsoft/Phi-3-mini-4k-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, rope_scaling=None, rope_theta=None, tokenizer_revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=4096, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), 
observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3-mini-4k-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-27 13:27:06 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 13:27:06 selector.py:116] Using XFormers backend.\nINFO 08-27 13:27:08 model_runner.py:879] Starting to load model microsoft/Phi-3-mini-4k-instruct...\nINFO 08-27 13:27:08 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 13:27:08 selector.py:116] Using XFormers backend.\nINFO 08-27 13:27:08 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-27 13:27:16 model_runner.py:890] Loading model weights took 7.1183 GB\nINFO 08-27 13:27:17 gpu_executor.py:121] # GPU blocks: 2222, # CPU blocks: 682\nmodel loading took 14.50 seconds\nStarting 8 responses generation\n8 responses generation took 128.13 seconds\n{'Count to 1000, skip unpopular numbers': '546198e7a8aab75a2e7e18ced14cfa23be3fc19362496163b14eacca7406e3527f04efd67be916fb87705c100c2e2a81e8ccdaae5d389f862020ef8f3e73a8c4',\n 'Describe justice system in UK vs USA in 2000-5000 words': 'd197beaf5d3a4d5b82f520a5845c76b5c6827d3bf1f5565c6e56f614b5f2cf588f5ab4790be2fd12f31f584923fbac4cd2b3a8b50f484221e9eb5c724cdca973',\n 'Describe schooling system in UK vs USA in 2000-5000 words': '050a7ef858d9be0c386ceefbf2a729f0938201026477137d1a2066c1f2b135f3d3bdf0d17846a9c80fb5ab64296923e86b4ae794c60747d6784749a66d4f7e6e',\n 'Explain me some random problem for me in 2000-5000 words': 'f546a57138eb952dbb8dace7d46d06e976da96ea6e489b532824e4b42b68bdabea4d97c08ec38c4766a1827c247a550a6e542c572dcd0f7b1ca224415fcb5661',\n 'Tell me entire history of USA': '9e1870ab7240877ab7adbc86eb3b62ddf68e5a270020b454bb4c3a77a7a35a214b3eda6b819c2b6a5019bec4f9d712522f94860df377a2c3edcdc685861cb837',\n 'Write a ballad. 
Pick a random theme.': '30ee7bd7c5393814debaa7008acf5188ffba68af09f539bb141414376cdf322c76f81bdeca1a15a575659569cd1ddd392ff467c7cb4baec16b8cbc9fd41b018c',\n 'Write an epic story about a dragon and a knight': '6447f18aabf3bac7dd79a451a1b66f632061e7a447b25a5be8829c1501518126c64cb42f791441544902be06ea63e0450807303520bb4d3a111fbfff19641e68',\n 'Write an essay about being a Senior developer.': '6a25eb3c90d572794f575470cd8b916892db8777f7830bb0b87afc0e7126e90c090878a19294bc73a5b7a42c56de5ce04f84d368099f9d59df7a2e8d38b0ff3a'}\n" stderr: '+ cd /root/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-27_15-26-43_1x_rtx_4090 \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_15-26-43_1x_rtx_4090\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ PS1=\'(2024-08-27_15-26-43_1x_rtx_4090) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_16g /root/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/output\n+ tee /root/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/output/stdout.txt\n/root/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_fwd")\n/root/experiments/vllm_16g/2024-08-27_15-26-43_1x_rtx_4090/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:344: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. 
Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00 ~/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_15-27-49_1x_rtx_a6000 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_15-27-49_1x_rtx_a6000\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_15-27-49_1x_rtx_a6000) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0 +2024-08-27 15:28:01,180 - __main__ - INFO - Running experiment code on remote +2024-08-27 15:32:00,318 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_16g ~/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/output | tee ~/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/output/stdout.txt' stdout: "gpu_count=1\nStarting model loading\nINFO 08-27 13:28:12 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3-mini-4k-instruct', speculative_config=None, tokenizer='microsoft/Phi-3-mini-4k-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, rope_scaling=None, rope_theta=None, tokenizer_revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=4096, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3-mini-4k-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-27 13:28:14 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 13:28:14 selector.py:116] Using XFormers 
backend.\nINFO 08-27 13:28:15 model_runner.py:879] Starting to load model microsoft/Phi-3-mini-4k-instruct...\nINFO 08-27 13:28:16 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 13:28:16 selector.py:116] Using XFormers backend.\nINFO 08-27 13:28:16 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-27 13:29:47 model_runner.py:890] Loading model weights took 7.1183 GB\nINFO 08-27 13:29:48 gpu_executor.py:121] # GPU blocks: 5895, # CPU blocks: 682\nmodel loading took 105.03 seconds\nStarting 8 responses generation\n8 responses generation took 121.58 seconds\n{'Count to 1000, skip unpopular numbers': '203c6738867a8bac3a1a2598ead9c1c83833c9a53417cf938307df27b4891105cba31b0b851f5a837e18c9caf1fd1f7a4715dc8fb42e360b596c14afec9654f9',\n 'Describe justice system in UK vs USA in 2000-5000 words': 'c022baf3b0a1a8cfd1c25950bdb1a756b7777f7b9629eee2e8afb353e78496fabac73f45b2819e626c6e4a520e3ff5624edb1c241809da6aa0962db26342d34c',\n 'Describe schooling system in UK vs USA in 2000-5000 words': '9350420a44aa35c8893c8197b617c3c39e53b69db19a35b49fb45d8b18dcf8795fe243e6afaba10a63d3f63526740a56c1bf3094295ddb10c73bc869f8769592',\n 'Explain me some random problem for me in 2000-5000 words': 'b811a80b587b01aaba45fc044f9530155531790b5d581984b62f03c44884a6f422b37be9a8f14fa146abbafbaf1452d3cf66eea3a8df9162ed4fb07ffcad0d81',\n 'Tell me entire history of USA': '5bb973bbaadb2b72c0bb0200686a2bffc86b62be393b871bd772b59c5685048799a6d97a9f146789de01059752c21497b891027d3f1d02de17606af5b1defd6e',\n 'Write a ballad. Pick a random theme.': '7a78ae643d5ca4c9439b27c17a51cd4070870083f5b99bfc8159bd366b730c1e1c6619a8e21519d030b9cfb86fe7c278e72c6a20bad49f4ad9d72b4bd14f20d1',\n 'Write an epic story about a dragon and a knight': '2c7b3a7204d586ac2a682cfd67a40a39ba8e3dc810ff96148c77e78eadc67fa71c9ac4be8711fbbd26bdb5f83654aa6b8070fd8a81dd0fef6bc33ba662f1d40a',\n 'Write an essay about being a Senior developer.': '726c63d347a91b7d077263ff00bc445ba2d20e69a10ed2057a4e6f9c1606c68e6c49da61410f8907e407f44b0cd4aadc39e70f73436a9d1353e48aa64b366228'}\n" stderr: '+ cd /root/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-27_15-27-49_1x_rtx_a6000 \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_15-27-49_1x_rtx_a6000\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ 
PS1=\'(2024-08-27_15-27-49_1x_rtx_a6000) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_16g /root/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/output\n+ tee /root/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/output/stdout.txt\n/root/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_fwd")\n/root/experiments/vllm_16g/2024-08-27_15-27-49_1x_rtx_a6000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:344: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00 ~/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' 
nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_15-36-20_1x_a100_sxm4 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_15-36-20_1x_a100_sxm4\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_15-36-20_1x_a100_sxm4) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0 +2024-08-27 15:37:15,604 - __main__ - INFO - Running experiment code on remote +2024-08-27 15:41:20,756 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_16g ~/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/output | tee ~/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/output/stdout.txt' stdout: "gpu_count=1\nStarting model loading\nINFO 08-27 13:37:26 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3-mini-4k-instruct', speculative_config=None, tokenizer='microsoft/Phi-3-mini-4k-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, rope_scaling=None, rope_theta=None, tokenizer_revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=4096, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3-mini-4k-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-27 13:37:28 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 13:37:28 selector.py:116] Using XFormers backend.\nINFO 08-27 13:37:30 model_runner.py:879] Starting to load model microsoft/Phi-3-mini-4k-instruct...\nINFO 08-27 13:37:30 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 13:37:30 selector.py:116] Using XFormers backend.\nINFO 08-27 13:37:30 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-27 13:39:01 model_runner.py:890] Loading model weights took 7.1183 GB\nINFO 08-27 13:39:02 gpu_executor.py:121] # GPU blocks: 4639, # CPU blocks: 682\nmodel loading took 104.30 seconds\nStarting 8 responses generation\n8 responses generation took 128.40 seconds\n{'Count to 1000, skip unpopular numbers': '4c4ad56d950159f19bdd12edb2174b7251dcab0d84817b0468b9e20c7360674e4f5e4501f48e79dcc1d159b3c4c5f831c48f9a87662434786035c4356b776b73',\n 'Describe justice system in UK vs USA in 2000-5000 words': 
'8a2c1f06ea082d73245e084f474b0f98993f389e678850645c711c7f4f7b489b969bf4b0c0b9db0b3773190a1933121bdcd64a2f14df2153e50f6bb93cd12013',\n 'Describe schooling system in UK vs USA in 2000-5000 words': '1c2e330eaedb19b3b8a0fbce46fe7bd0410123be457d42ffdcb139d327a5a1bba025d1fd88b9f3405682a36f3459c2c562134f17c40e192a218526a860b6103c',\n 'Explain me some random problem for me in 2000-5000 words': '69f29410af4e74fb5b76a831fe61c74bcadc3cda83792388775e299aa85965c3a006b8744b33a853d2ebb9c6684e2290093b1a0dde46c00db8c451f3d6d4a10d',\n 'Tell me entire history of USA': 'b6104c38852a60aa9af5216131cb6de27435e14182caab650f7099daab41a6021472fcf29627454570cb1c85c7c5bd389bf67fa72d24187ba192b9b17cc089ee',\n 'Write a ballad. Pick a random theme.': '5c649e8eb9cbd2cc1fac4edd2482afae4fcaa03319d46be8d48d9780f8eb86428ad34a81865f6dd35f217fd7760bba8946b40163f6f35e78a6265e976fbd3164',\n 'Write an epic story about a dragon and a knight': '1844470f0e6e3d17730911fa3c2cbae252c04082653c91e3166f66dd859d49c22883c77c3106d6c7cf5734787876447b8f72ce2f5c3b0754555607c1711cda6c',\n 'Write an essay about being a Senior developer.': '6b58725db3040c3d384cdf2d9b297cd1037f65d2c6a647a7d028ee51e500a22fcdb9615331aa1b3b3b631a742e74a35f854677771f081a62ad80fdacccd69b5b'}\n" stderr: '+ cd /root/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-27_15-36-20_1x_a100_sxm4 \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_15-36-20_1x_a100_sxm4\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ PS1=\'(2024-08-27_15-36-20_1x_a100_sxm4) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_16g /root/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/output\n+ tee /root/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/output/stdout.txt\n/root/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_fwd")\n/root/experiments/vllm_16g/2024-08-27_15-36-20_1x_a100_sxm4/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:344: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. 
Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00 ~/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-27_15-54-05_1x_rtx_a4000 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_15-54-05_1x_rtx_a4000\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-27_15-54-05_1x_rtx_a4000) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0 +2024-08-27 15:55:01,441 - __main__ - INFO - Running experiment code on remote +2024-08-27 15:59:05,647 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_16g ~/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/output | tee ~/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/output/stdout.txt' stdout: "gpu_count=1\nStarting model loading\nINFO 08-27 13:55:13 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3-mini-4k-instruct', speculative_config=None, tokenizer='microsoft/Phi-3-mini-4k-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, rope_scaling=None, rope_theta=None, tokenizer_revision=5a516f86087853f9d560c95eb9209c1d4ed9ff69, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=4096, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3-mini-4k-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-27 13:55:15 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 13:55:15 selector.py:116] Using XFormers 
backend.\nINFO 08-27 13:55:19 model_runner.py:879] Starting to load model microsoft/Phi-3-mini-4k-instruct...\nINFO 08-27 13:55:19 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-27 13:55:19 selector.py:116] Using XFormers backend.\nINFO 08-27 13:55:20 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-27 13:56:07 model_runner.py:890] Loading model weights took 7.1183 GB\nINFO 08-27 13:56:10 gpu_executor.py:121] # GPU blocks: 958, # CPU blocks: 682\nmodel loading took 63.08 seconds\nStarting 8 responses generation\n8 responses generation took 166.26 seconds\n{'Count to 1000, skip unpopular numbers': '7abefbad87e638bbcab79bb3a5614d6efe9a8e4e76d950479051c952259fa5c50b4343c7b930afe3329af7cbaa49989e6c64b5840c9a767768fe1226e8233645',\n 'Describe justice system in UK vs USA in 2000-5000 words': 'b41fc6e907510d065d7d198a982dc7ff67c4c229453ba9a89ce5dc4eae9450f720b5ec373484d00933ede1181f88fe8c3e28ad70f7acccf1421b5e10a3c019f5',\n 'Describe schooling system in UK vs USA in 2000-5000 words': 'fd2f435afb1877967d3950c02df80f8bf1f362de6d961fbb5fa4e961312d35d9335e4b4022d76f1bd20ed14606f86366c38472638327b61529781b20f75e9348',\n 'Explain me some random problem for me in 2000-5000 words': '3a076c9a648c0502297a1a1008e1ffebecd57463ef1e3cf22d8e6afa71f8861b9434deba3f82e3b9e2200b9340b5f88c1bf7f05eef34dc876f479066235dae4b',\n 'Tell me entire history of USA': '98ee9ca87bdecfbeb8dc2a104c9bc6c4b902080eba64e4844f8308320d0be5cf5ab159e419ab636d150a7e51cc2434b4720f133d12da8eab793aa60c4549372b',\n 'Write a ballad. Pick a random theme.': '9da91bde53cbaa2f3a3ff27801a97fd52ab9e39dffa89c9c1d45074fef8fee5dd8542b49df2add9f9d64390ac902bcc99baa6256e29c12fc8f9dc971bc2cd154',\n 'Write an epic story about a dragon and a knight': '54722bd09195af7d447e635403a375f3131660d012732e3bebdd5485dce54169914c800cea87e68b50d5da713f69b01a224899cbc995607c8576765c20c5db37',\n 'Write an essay about being a Senior developer.': '44afb980ca4dea2c71b20e6ecdb925b7b9ddd28b195232b08219f9c64ecf468b7e0470ea088c3b2bd51957ea46e2d8a0526879f071de6500d69da115301644f4'}\n" stderr: '+ cd /root/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-27_15-54-05_1x_rtx_a4000 \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-27_15-54-05_1x_rtx_a4000\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ 
PS1=\'(2024-08-27_15-54-05_1x_rtx_a4000) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_16g /root/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/output\n+ tee /root/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/output/stdout.txt\n/root/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_fwd")\n/root/experiments/vllm_16g/2024-08-27_15-54-05_1x_rtx_a4000/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:344: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00 ~/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090/output/sysinfo.yaml' stdout: '' stderr: "+ cd /root/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ '[' -n x ']'\n++ SCRIPT_PATH=.venv/bin/activate\n++ '[' .venv/bin/activate = bash ']'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ hash -r\n++ '[' -z '' ']'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ '[' '!' 
nondestructive = nondestructive ']'\n++ VIRTUAL_ENV=/root/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090/.venv\n++ '[' linux-gnu = cygwin ']'\n++ '[' linux-gnu = msys ']'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ '[' x2024-08-28_10-03-04_1x_rtx_3090 '!=' x ']'\n++ VIRTUAL_ENV_PROMPT=2024-08-28_10-03-04_1x_rtx_3090\n++ export VIRTUAL_ENV_PROMPT\n++ '[' -z '' ']'\n++ '[' -z '' ']'\n++ _OLD_VIRTUAL_PS1=\n++ PS1='(2024-08-28_10-03-04_1x_rtx_3090) '\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m deterministic_ml._internal.sysinfo\n" status_code: 0 +2024-08-28 10:03:14,020 - __main__ - INFO - Running experiment code on remote +2024-08-28 10:05:32,402 - tools.ssh - INFO - Command: '\n set -exo pipefail\n \n cd ~/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090\n export PATH=$HOME/.cargo/bin:$PATH\n source .venv/bin/activate;\n python -m vllm_phi35 ~/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090/output | tee ~/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090/output/stdout.txt' stdout: "Starting model loading\nINFO 08-28 08:03:24 llm_engine.py:184] Initializing an LLM engine (v0.5.5) with config: model='microsoft/Phi-3.5-mini-instruct', speculative_config=None, tokenizer='microsoft/Phi-3.5-mini-instruct', skip_tokenizer_init=False, tokenizer_mode=auto, revision=cd6881a82d62252f5a84593c61acf290f15d89e3, rope_scaling=None, rope_theta=None, tokenizer_revision=cd6881a82d62252f5a84593c61acf290f15d89e3, trust_remote_code=False, dtype=torch.bfloat16, max_seq_len=6144, download_dir=None, load_format=LoadFormat.AUTO, tensor_parallel_size=1, pipeline_parallel_size=1, disable_custom_all_reduce=False, quantization=None, enforce_eager=True, kv_cache_dtype=auto, quantization_param_path=None, device_config=cuda, decoding_config=DecodingConfig(guided_decoding_backend='outlines'), observability_config=ObservabilityConfig(otlp_traces_endpoint=None, collect_model_forward_time=False, collect_model_execute_time=False), seed=0, served_model_name=microsoft/Phi-3.5-mini-instruct, use_v2_block_manager=False, enable_prefix_caching=False)\nINFO 08-28 08:03:24 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-28 08:03:24 selector.py:116] Using XFormers backend.\nINFO 08-28 08:03:25 model_runner.py:879] Starting to load model microsoft/Phi-3.5-mini-instruct...\nINFO 08-28 08:03:25 selector.py:236] Cannot use FlashAttention-2 backend due to sliding window.\nINFO 08-28 08:03:25 selector.py:116] Using XFormers backend.\nINFO 08-28 08:03:26 weight_utils.py:236] Using model weights format ['*.safetensors']\nINFO 08-28 08:03:32 model_runner.py:890] Loading model weights took 7.1659 GB\nINFO 08-28 08:03:33 gpu_executor.py:121] # GPU blocks: 2217, # CPU blocks: 682\nmodel loading took 10.75 seconds\nStarting 8 responses generation\n8 responses generation took 116.15 seconds\n{'Count to 1000, skip unpopular numbers': 'fe0119a32e5cb10c8ef7b32824e01f72ed7dacb9619e4e54df43b05a8ce6d978586fcc462b8ef7734ca6331cb5e383f1621f246647a16b6420e2d48f5f63c15c',\n 'Describe justice system in UK vs USA in 2000-5000 words': 
'f18f930c23ed062a36f753c4f45da2dee51c9e9c24f2314424e002a8b67cb5f6e9a2525ddcabe7e314c593ce6c86f96f05325f6d6bc98a859dfe5ca5ce8e9d98',\n 'Describe schooling system in UK vs USA in 2000-5000 words': '1902d972aedee49f8aca9d0dd03eff7997d143c84e274296db434c3d2e71b1171233d8b824f989861f51d120c8e70f792390136e311d72152bc52a3212cd29ad',\n 'Explain me some random problem for me in 2000-5000 words': '2953a6cc64465b5c62dcb8257d3292304ea3b9a43a2ce01c82bcd8a59f94b2cc01e1217d7769ceb248bd64c4f11e3f2a60ff79e986e3fb64443aae0f902ac58e',\n 'Tell me entire history of USA': '678c0e2d3fe6dab2eb6c3eba428f98c190b784fd35f16183025a341e4a08c98f39e6aa43d3ed2bf8dc96464d02ee20545f4db73bcb790c57d7e4db781499dfd5',\n 'Write a ballad. Pick a random theme.': 'a2ca9c83288ba84b99d33a391b7b83747a263486c23958d0c30eb35299cd33236371dc78ed4bd9d0e453185878fdc0317117d2b23507bc2bb341279ffdd5d9c4',\n 'Write an epic story about a dragon and a knight': 'b7e133385c527856f91c6d26e16fa5590074d349729aa45b0cc80f2e2df993cb4e7e4a30d2bae4265d310153a71e07086a0121083c895a8cad3406dd2922d945',\n 'Write an essay about being a Senior developer.': '9119725699bc047553df0eb90d3ba431d9e04c52b201cb4eaed599df120f66c08f06449454623447ec7f74b651bca652106bcba9950f881fae8ae27e0f29ffa4'}\n" stderr: '+ cd /root/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090\n+ export PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n+ source .venv/bin/activate\n++ \'[\' -n x \']\'\n++ SCRIPT_PATH=.venv/bin/activate\n++ \'[\' .venv/bin/activate = bash \']\'\n++ deactivate nondestructive\n++ unset -f pydoc\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ hash -r\n++ \'[\' -z \'\' \']\'\n++ unset VIRTUAL_ENV\n++ unset VIRTUAL_ENV_PROMPT\n++ \'[\' \'!\' nondestructive = nondestructive \']\'\n++ VIRTUAL_ENV=/root/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090/.venv\n++ \'[\' linux-gnu = cygwin \']\'\n++ \'[\' linux-gnu = msys \']\'\n++ export VIRTUAL_ENV\n++ _OLD_VIRTUAL_PATH=/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ PATH=/root/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090/.venv/bin:/root/.cargo/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin\n++ export PATH\n++ \'[\' x2024-08-28_10-03-04_1x_rtx_3090 \'!=\' x \']\'\n++ VIRTUAL_ENV_PROMPT=2024-08-28_10-03-04_1x_rtx_3090\n++ export VIRTUAL_ENV_PROMPT\n++ \'[\' -z \'\' \']\'\n++ \'[\' -z \'\' \']\'\n++ _OLD_VIRTUAL_PS1=\n++ PS1=\'(2024-08-28_10-03-04_1x_rtx_3090) \'\n++ export PS1\n++ alias pydoc\n++ true\n++ hash -r\n+ python -m vllm_phi35 /root/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090/output\n+ tee /root/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090/output/stdout.txt\n/root/experiments/vllm_phi35/2024-08-28_10-03-04_1x_rtx_3090/.venv/lib/python3.11/site-packages/xformers/ops/fmha/flash.py:211: FutureWarning: `torch.library.impl_abstract` was renamed to `torch.library.register_fake`. 
Please use that instead; we will remove `torch.library.impl_abstract` in a future version of PyTorch.\n @torch.library.impl_abstract("xformers_flash::flash_bwd")\n\rLoading safetensors checkpoint shards: 0% Completed | 0/2 [00:00<?, ?it/s]