# Set up a Python 3.12 environment named "vllm-env", install vLLM with the
# audio extra, and start serving mistralai/Voxtral-Small-24B-2507.

# Option 1: using venv.
python3.12 -m venv vllm-env
source vllm-env/bin/activate

# Option 2: or using conda. This is an alternative to the venv commands above;
# run it instead of them (not in addition), so it is left commented out here.
# conda create -n vllm-env python=3.12 -y
# conda activate vllm-env

# Install uv, then use it to install/upgrade vLLM (with the "audio" extra),
# additionally consulting the vLLM nightly wheel index.
pip install uv
uv pip install -U "vllm[audio]" --torch-backend=auto \
  --extra-index-url https://wheels.vllm.ai/nightly

# Start the vLLM server for the Voxtral model. Tokenizer, config and weight
# loading all use the "mistral" format; tool calls are parsed with the
# "mistral" parser and automatic tool choice is enabled.
vllm serve mistralai/Voxtral-Small-24B-2507 \
  --tokenizer_mode mistral \
  --config_format mistral \
  --load_format mistral \
  --tensor-parallel-size 1 \
  --tool-call-parser mistral \
  --enable-auto-tool-choice \
  --gpu-memory-utilization 0.75