Spaces:
Build error
Build error
Commit · 9c40bcd
1 Parent(s): 6d2193e
Update entrypoint.sh.template
Browse files
- entrypoint.sh.template +1 -3
entrypoint.sh.template
CHANGED
@@ -5,9 +5,7 @@ mongod &
 
 # Start the text-generation-inference process
 pip3 install -U transformers && pip install -U transformers
-
-# text-generation-server quantize ${MODEL_NAME} /data/model_gptq
-text-generation-launcher --model-id TheBloke/Llama-2-7B-GPTQ --quantize gptq --num-shard 1 --port 8080 &
+text-generation-launcher --model-id ${MODEL_NAME} --quantize bitsandbytes-nf4 --num-shard 1 --port 8080 --trust-remote-code &
 
 # Wait for text-generation-inference to start
 curl --retry 60 --retry-delay 10 --retry-connrefused http://127.0.0.1:8080/health