docker : include legacy llama-completion binary (#17964)
This commit is contained in:
parent
482211438d
commit
b7f5f46e03
|
|
@ -111,7 +111,7 @@ ENTRYPOINT ["/app/tools.sh"]
|
||||||
# ==============================================================================
|
# ==============================================================================
|
||||||
FROM base AS light
|
FROM base AS light
|
||||||
|
|
||||||
COPY --from=build /app/full/llama-cli /app
|
COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
|
||||||
|
|
||||||
ENTRYPOINT [ "/app/llama-cli" ]
|
ENTRYPOINT [ "/app/llama-cli" ]
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -68,7 +68,7 @@ ENTRYPOINT ["/app/tools.sh"]
|
||||||
### Light, CLI only
|
### Light, CLI only
|
||||||
FROM base AS light
|
FROM base AS light
|
||||||
|
|
||||||
COPY --from=build /app/full/llama-cli /app
|
COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
|
||||||
|
|
||||||
WORKDIR /app
|
WORKDIR /app
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -74,7 +74,7 @@ ENTRYPOINT ["/app/tools.sh"]
|
||||||
### Light, CLI only
|
### Light, CLI only
|
||||||
FROM base AS light
|
FROM base AS light
|
||||||
|
|
||||||
COPY --from=build /app/full/llama-cli /app
|
COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
|
||||||
|
|
||||||
WORKDIR /app
|
WORKDIR /app
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -73,7 +73,7 @@ ENTRYPOINT ["/app/tools.sh"]
|
||||||
FROM base AS light
|
FROM base AS light
|
||||||
|
|
||||||
COPY --from=build /app/lib/ /app
|
COPY --from=build /app/lib/ /app
|
||||||
COPY --from=build /app/full/llama-cli /app
|
COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
|
||||||
|
|
||||||
WORKDIR /app
|
WORKDIR /app
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -81,7 +81,7 @@ ENTRYPOINT ["/app/tools.sh"]
|
||||||
### Light, CLI only
|
### Light, CLI only
|
||||||
FROM base AS light
|
FROM base AS light
|
||||||
|
|
||||||
COPY --from=build /app/full/llama-cli /app
|
COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
|
||||||
|
|
||||||
WORKDIR /app
|
WORKDIR /app
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -94,7 +94,7 @@ ENTRYPOINT ["/app/tools.sh"]
|
||||||
### Light, CLI only
|
### Light, CLI only
|
||||||
FROM base AS light
|
FROM base AS light
|
||||||
|
|
||||||
COPY --from=build /app/full/llama-cli /app
|
COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
|
||||||
|
|
||||||
WORKDIR /app
|
WORKDIR /app
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -105,7 +105,7 @@ WORKDIR /llama.cpp/bin
|
||||||
|
|
||||||
# Copy llama.cpp binaries and libraries
|
# Copy llama.cpp binaries and libraries
|
||||||
COPY --from=collector /llama.cpp/bin/*.so /llama.cpp/bin
|
COPY --from=collector /llama.cpp/bin/*.so /llama.cpp/bin
|
||||||
COPY --from=collector /llama.cpp/bin/llama-cli /llama.cpp/bin
|
COPY --from=collector /llama.cpp/bin/llama-cli /llama.cpp/bin/llama-completion /llama.cpp/bin
|
||||||
|
|
||||||
ENTRYPOINT [ "/llama.cpp/bin/llama-cli" ]
|
ENTRYPOINT [ "/llama.cpp/bin/llama-cli" ]
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -13,6 +13,8 @@ elif [[ "$arg1" == '--quantize' || "$arg1" == '-q' ]]; then
|
||||||
exec ./llama-quantize "$@"
|
exec ./llama-quantize "$@"
|
||||||
elif [[ "$arg1" == '--run' || "$arg1" == '-r' ]]; then
|
elif [[ "$arg1" == '--run' || "$arg1" == '-r' ]]; then
|
||||||
exec ./llama-cli "$@"
|
exec ./llama-cli "$@"
|
||||||
|
elif [[ "$arg1" == '--run-legacy' || "$arg1" == '-l' ]]; then
|
||||||
|
exec ./llama-completion "$@"
|
||||||
elif [[ "$arg1" == '--bench' || "$arg1" == '-b' ]]; then
|
elif [[ "$arg1" == '--bench' || "$arg1" == '-b' ]]; then
|
||||||
exec ./llama-bench "$@"
|
exec ./llama-bench "$@"
|
||||||
elif [[ "$arg1" == '--perplexity' || "$arg1" == '-p' ]]; then
|
elif [[ "$arg1" == '--perplexity' || "$arg1" == '-p' ]]; then
|
||||||
|
|
@ -32,8 +34,10 @@ elif [[ "$arg1" == '--server' || "$arg1" == '-s' ]]; then
|
||||||
else
|
else
|
||||||
echo "Unknown command: $arg1"
|
echo "Unknown command: $arg1"
|
||||||
echo "Available commands: "
|
echo "Available commands: "
|
||||||
echo " --run (-r): Run a model previously converted into ggml"
|
echo " --run (-r): Run a model (chat) previously converted into ggml"
|
||||||
echo " ex: -m /models/7B/ggml-model-q4_0.bin -p \"Building a website can be done in 10 simple steps:\" -n 512"
|
echo " ex: -m /models/7B/ggml-model-q4_0.bin"
|
||||||
|
echo " --run-legacy (-l): Run a model (legacy completion) previously converted into ggml"
|
||||||
|
echo " ex: -m /models/7B/ggml-model-q4_0.bin -no-cnv -p \"Building a website can be done in 10 simple steps:\" -n 512"
|
||||||
echo " --bench (-b): Benchmark the performance of the inference for various parameters."
|
echo " --bench (-b): Benchmark the performance of the inference for various parameters."
|
||||||
echo " ex: -m model.gguf"
|
echo " ex: -m model.gguf"
|
||||||
echo " --perplexity (-p): Measure the perplexity of a model over a given text."
|
echo " --perplexity (-p): Measure the perplexity of a model over a given text."
|
||||||
|
|
|
||||||
|
|
@ -68,7 +68,7 @@ ENTRYPOINT ["/app/tools.sh"]
|
||||||
### Light, CLI only
|
### Light, CLI only
|
||||||
FROM base AS light
|
FROM base AS light
|
||||||
|
|
||||||
COPY --from=build /app/full/llama-cli /app
|
COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
|
||||||
|
|
||||||
WORKDIR /app
|
WORKDIR /app
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue