Spaces:
Runtime error
Runtime error
ztime
committed on
Commit
·
e8482a8
1
Parent(s):
f5f8f18
change port export
Browse files
- Dockerfile +2 -1
- start_server.sh +1 -1
Dockerfile
CHANGED
|
@@ -16,6 +16,7 @@ RUN apt-get update && \
|
|
| 16 |
|
| 17 |
RUN git clone https://github.com/ggerganov/llama.cpp.git llamacpp --depth 1 && \
|
| 18 |
cd llamacpp && \
|
|
|
|
| 19 |
cmake -B build -DLLAMA_BLAS=ON -DLLAMA_BLAS_VENDOR=OpenBLAS && \
|
| 20 |
cmake --build build --config Release --target main server && \
|
| 21 |
cp build/bin/* ../ && \
|
|
@@ -42,4 +43,4 @@ ENV PORT=7860
|
|
| 42 |
EXPOSE ${PORT}
|
| 43 |
|
| 44 |
# Run the server start script
|
| 45 |
-
CMD ["/bin/sh", "./start_server.sh"]
|
|
|
|
| 16 |
|
| 17 |
RUN git clone https://github.com/ggerganov/llama.cpp.git llamacpp --depth 1 && \
|
| 18 |
cd llamacpp && \
|
| 19 |
+
sed -i 's/v1\/chat/api\/v1\/chat/g' examples/server/server.cpp && \
|
| 20 |
cmake -B build -DLLAMA_BLAS=ON -DLLAMA_BLAS_VENDOR=OpenBLAS && \
|
| 21 |
cmake --build build --config Release --target main server && \
|
| 22 |
cp build/bin/* ../ && \
|
|
|
|
| 43 |
EXPOSE ${PORT}
|
| 44 |
|
| 45 |
# Run the server start script
|
| 46 |
+
CMD ["/bin/sh", "./start_server.sh"]
|
start_server.sh
CHANGED
|
@@ -3,7 +3,7 @@
|
|
| 3 |
# For mlock support
|
| 4 |
ulimit -l unlimited
|
| 5 |
|
| 6 |
-
/main -m model/gguf-model.bin --color -p '你好,你是谁' -n
|
| 7 |
|
| 8 |
/server --host 0.0.0.0 --port 7860 -m model/gguf-model.bin
|
| 9 |
/llamacpp/build/bin/server --host 0.0.0.0 --port 7860 -m model/gguf-model.bin
|
|
|
|
| 3 |
# For mlock support
|
| 4 |
ulimit -l unlimited
|
| 5 |
|
| 6 |
+
/main -m model/gguf-model.bin --color -p '你好,你是谁' -n 64 -c 64
|
| 7 |
|
| 8 |
/server --host 0.0.0.0 --port 7860 -m model/gguf-model.bin
|
| 9 |
/llamacpp/build/bin/server --host 0.0.0.0 --port 7860 -m model/gguf-model.bin
|