forked from aphrodite-engine/aphrodite-engine
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathentrypoint.sh
executable file
·26 lines (21 loc) · 896 Bytes
/
entrypoint.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
#!/bin/bash
#
# Container entrypoint: assembles the command line for the Aphrodite Engine
# OpenAI-compatible API server from environment variables and exec's it.
#
# Required environment:
#   HF_HOME                  base directory; models are downloaded to $HF_HOME/hub
# Optional environment (the flag is passed only when the variable is non-empty):
#   MODEL_NAME               -> --model
#   REVISION                 -> --revision
#   DATATYPE                 -> --dtype
#   KVCACHE                  -> --kv-cache-dtype
#   CONTEXT_LENGTH           -> --max-model-len
#   NUM_GPUS                 -> --tensor-parallel-size
#   GPU_MEMORY_UTILIZATION   -> --gpu-memory-utilization
#   QUANTIZATION             -> --quantization
#   ENFORCE_EAGER            -> --enforce-eager      (any non-empty value)
#   KOBOLD_API               -> --launch-kobold-api  (any non-empty value)
#   CMD_ADDITIONAL_ARGUMENTS extra arguments, split on whitespace and appended

# Enable errexit here rather than on the shebang line so it also applies when
# the script is started as `bash entrypoint.sh`.
set -e

echo 'Starting Aphrodite Engine API server...'

# Build the command as an array so every value stays a single argument even if
# it contains whitespace or glob characters. In the `${VAR:+--flag "$VAR"}`
# form the flag and the quoted value expand to two separate words when VAR is
# non-empty, and to nothing at all otherwise.
cmd=(
  python3 -m aphrodite.endpoints.openai.api_server
  --host 0.0.0.0
  --port 7860
  # `:?` aborts the script with the given message when HF_HOME is unset/empty.
  --download-dir "${HF_HOME:?HF_HOME must be set}/hub"
  ${MODEL_NAME:+--model "$MODEL_NAME"}
  ${REVISION:+--revision "$REVISION"}
  ${DATATYPE:+--dtype "$DATATYPE"}
  ${KVCACHE:+--kv-cache-dtype "$KVCACHE"}
  ${CONTEXT_LENGTH:+--max-model-len "$CONTEXT_LENGTH"}
  ${NUM_GPUS:+--tensor-parallel-size "$NUM_GPUS"}
  ${GPU_MEMORY_UTILIZATION:+--gpu-memory-utilization "$GPU_MEMORY_UTILIZATION"}
  ${QUANTIZATION:+--quantization "$QUANTIZATION"}
  ${ENFORCE_EAGER:+--enforce-eager}
  ${KOBOLD_API:+--launch-kobold-api}
)

# CMD_ADDITIONAL_ARGUMENTS is a free-form list of extra arguments, so it is
# intentionally left unquoted to be split into individual words; globbing is
# switched off around the expansion so a literal `*` or `?` is passed through
# unchanged.
set -f
# shellcheck disable=SC2206
cmd+=(${CMD_ADDITIONAL_ARGUMENTS:-})
set +f

# set umask to ensure group read / write at runtime
umask 002

# Trace the final command, then replace this shell with the server process.
set -x
exec "${cmd[@]}"