# Set up a Python 3.12 virtual environment, install vLLM, serve
# meta-llama/Llama-3.1-70B-Instruct, benchmark the server, and launch the
# Streamlit front end (app.py).
#
# NOTE: `vllm serve` and `streamlit run` are long-running foreground
# processes. Run the steps after `vllm serve` from a second shell (with the
# same virtual environment activated) once the server is up.

# --- Environment -----------------------------------------------------------
# --seed also installs seed packages (such as pip) into the new environment.
uv venv --python 3.12 --seed
source .venv/bin/activate

# --- Dependencies ----------------------------------------------------------
# --torch-backend=auto lets uv choose the PyTorch build for this machine.
uv pip install vllm --torch-backend=auto
uv pip install hf_transfer

# --- Hugging Face authentication -------------------------------------------
# Interactive login; presumably required because the model weights are
# gated -- confirm access has been granted to the account being used.
hf auth login

# --- Serve the model (blocks until the server is stopped) ------------------
# Shards the model across 4 GPUs and caps the context length at 4096 tokens.
vllm serve meta-llama/Llama-3.1-70B-Instruct \
  --tensor-parallel-size 4 \
  --max-model-len 4096

# --- Benchmark the running server ------------------------------------------
# Expects ShareGPT_V3_unfiltered_cleaned_split.json in the current directory.
vllm bench serve \
  --backend vllm \
  --model meta-llama/Llama-3.1-70B-Instruct \
  --endpoint /v1/completions \
  --dataset-name sharegpt \
  --dataset-path ShareGPT_V3_unfiltered_cleaned_split.json \
  --num-prompts 64

# --- Front end -------------------------------------------------------------
# NOTE(review): CORS and XSRF protection are both disabled here. That is only
# appropriate for local development or behind a trusted proxy -- confirm
# before exposing this app on a shared or public network.
streamlit run app.py \
  --server.enableCORS false \
  --server.enableXsrfProtection false