# 使用 FastAPI + vLLM 部署 Qwen2.5
# Fetch the example project and switch into its directory; the python
# commands below refer to scripts by relative path.
git clone https://github.com/Xiaolong-RRL/qwen2_5_vllm_fastapi.git
cd qwen2_5_vllm_fastapi

# Install the Python dependencies. pip expects each requirement as its own
# space-separated argument; comma-separated names (e.g. "vllm,") are rejected
# as invalid requirements.
# NOTE(review): the web UI script name suggests it also needs `gradio` --
# confirm and add it to this list if it is not already installed.
pip install vllm transformers fastapi uvicorn

# Run the server, then the client, then the web UI script.
# NOTE(review): the server script presumably stays in the foreground; if so,
# run the client and web UI commands from separate terminals -- confirm.
python qwen2_5_vllm_fastapi_server.py
python qwen2_5_vllm_fastapi_client.py
python qwen2_5_vllm_fastapi_webui_gradio.py