Spaces:
Running
Running
Update start_gradio.sh
Browse files - start_gradio.sh +14 -1
start_gradio.sh
CHANGED
|
@@ -89,4 +89,17 @@ if [[ "$PRELOAD_MODEL" == "1" ]]; then
|
|
| 89 |
echo "✗ model.safetensors.index.json 缺失"
|
| 90 |
fi
|
| 91 |
echo "==================="
|
| 92 |
-
fi
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 89 |
echo "✗ model.safetensors.index.json 缺失"
|
| 90 |
fi
|
| 91 |
echo "==================="
|
| 92 |
+
fi
|
| 93 |
+
|
| 94 |
+
echo "模型路径: ${MODEL_PATH}"
|
| 95 |
+
echo "启动 Gradio..."
|
| 96 |
+
|
| 97 |
+
python app.py \
|
| 98 |
+
--host "$HOST" \
|
| 99 |
+
--port "$GRADIO_PORT" \
|
| 100 |
+
--model "$MODEL_PATH" \
|
| 101 |
+
--tensor-parallel-size "$TENSOR_PARALLEL_SIZE" \
|
| 102 |
+
--max-model-len "$MAX_MODEL_LEN" \
|
| 103 |
+
--gpu-memory-utilization "$GPU_MEMORY_UTILIZATION" \
|
| 104 |
+
--tokenizer-mode "$TOKENIZER_MODE" \
|
| 105 |
+
--served-model-name "$SERVED_MODEL_NAME"
|