测试, 生产
10.182.17.2:/data1/tlw/image_classification
10.182.17.2:/data1/tlw/timm
10.51.0.1:/data/image_classification

screen -r HunyuanOCR_1
CUDA_VISIBLE_DEVICES=0 vllm serve /data1/models/HunyuanOCR --host 0.0.0.0 --port 8001 --served-model-name HunyuanOCR --no-enable-prefix-caching --mm-processor-cache-gb 0 --gpu-memory-utilization 0.2
Ctrl+a d

screen -r HunyuanOCR_2
CUDA_VISIBLE_DEVICES=1 vllm serve /data1/models/HunyuanOCR --host 0.0.0.0 --port 8002 --served-model-name HunyuanOCR --no-enable-prefix-caching --mm-processor-cache-gb 0 --gpu-memory-utilization 0.2
Ctrl+a d

负载均衡端口: 8000
nohup uvicorn app:app --host 0.0.0.0 --port 8005 --workers 1 > logs/app.log 2>&1 &

screen -r HunyuanOCR_1
CUDA_VISIBLE_DEVICES=2 vllm serve /data/models/HunyuanOCR --host 0.0.0.0 --port 8001 --served-model-name HunyuanOCR --no-enable-prefix-caching --mm-processor-cache-gb 0 --gpu-memory-utilization 0.45 --enable-log-requests --enable-log-outputs
Ctrl+a d

screen -r HunyuanOCR_2
CUDA_VISIBLE_DEVICES=3 vllm serve /data/models/HunyuanOCR --host 0.0.0.0 --port 8002 --served-model-name HunyuanOCR --no-enable-prefix-caching --mm-processor-cache-gb 0 --gpu-memory-utilization 0.45 --enable-log-requests --enable-log-outputs
Ctrl+a d

nohup uvicorn app:app --host 0.0.0.0 --port 8005 --workers 1 > logs/app.log 2>&1 &
负载均衡端口: 8003

图片分类: POST /predict
OCR: POST /HunyuanOCR