#!/bin/bash
#
# start-vllm-qwen3-reranker-8b-15.sh
#
# Launches the vLLM OpenAI-compatible API server for the Qwen3-Reranker-8B
# model with the pooling runner, and mirrors the server's combined
# stdout/stderr to a log file under /var/log/vllm.
#
# Environment:
#   VLLM_API_KEY  Optional. API key handed to the server via --api-key.
#                 When unset or empty, the key that was previously hardcoded
#                 in this script is used.

# -e: abort on the first failing command; -u: treat unset variables as errors;
# pipefail: make the final pipeline report the server's exit status instead of
# tee's, so a crashed server is not reported as success.
set -euo pipefail

readonly LOG_DIR=/var/log/vllm
readonly LOG_FILE="${LOG_DIR}/qwen3-reranker-8b-server.log"

# NOTE(review): the fallback below is a secret committed to the script; it is
# kept only so existing deployments keep working. Prefer supplying
# VLLM_API_KEY from the environment and rotating this value.
api_key="${VLLM_API_KEY:-lq123456}"

# Create the log directory.
mkdir -p -- "${LOG_DIR}"

# Server arguments are kept in an array so no option can be dropped by a
# missing line-continuation backslash (the original lost --api-key and the
# log redirection that way).
server_args=(
  --model /model/Qwen3-Reranker-8B
  --runner pooling
  --trust-remote-code
  --tensor-parallel-size 1
  --gpu-memory-utilization 0.45
  --host 0.0.0.0
  --port 30000
  --chat-template /vllm/sglang-main/examples/chat_template/qwen3_reranker.jinja
  --api-key "${api_key}"
)

# Start the vLLM service.
# (The original comment also listed "--convert classify -task embed";
# presumably alternative flags the author tried -- they are not passed here.)
python3 -m vllm.entrypoints.openai.api_server "${server_args[@]}" 2>&1 \
  | tee "${LOG_FILE}"