9 files changed: +14 -10 lines changed
Original file line number Diff line number Diff line change @@ -111,7 +111,7 @@ ENTRYPOINT ["/app/tools.sh"]
111111# ==============================================================================
112112FROM base AS light
113113
114- COPY --from=build /app/full/llama-cli /app
114+ COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
115115
116116ENTRYPOINT [ "/app/llama-cli" ]
117117
Original file line number Diff line number Diff line change @@ -68,7 +68,7 @@ ENTRYPOINT ["/app/tools.sh"]
6868# ## Light, CLI only
6969FROM base AS light
7070
71- COPY --from=build /app/full/llama-cli /app
71+ COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
7272
7373WORKDIR /app
7474
Original file line number Diff line number Diff line change @@ -74,7 +74,7 @@ ENTRYPOINT ["/app/tools.sh"]
7474# ## Light, CLI only
7575FROM base AS light
7676
77- COPY --from=build /app/full/llama-cli /app
77+ COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
7878
7979WORKDIR /app
8080
Original file line number Diff line number Diff line change @@ -73,7 +73,7 @@ ENTRYPOINT ["/app/tools.sh"]
7373FROM base AS light
7474
7575COPY --from=build /app/lib/ /app
76- COPY --from=build /app/full/llama-cli /app
76+ COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
7777
7878WORKDIR /app
7979
Original file line number Diff line number Diff line change @@ -81,7 +81,7 @@ ENTRYPOINT ["/app/tools.sh"]
8181# ## Light, CLI only
8282FROM base AS light
8383
84- COPY --from=build /app/full/llama-cli /app
84+ COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
8585
8686WORKDIR /app
8787
Original file line number Diff line number Diff line change @@ -94,7 +94,7 @@ ENTRYPOINT ["/app/tools.sh"]
9494# ## Light, CLI only
9595FROM base AS light
9696
97- COPY --from=build /app/full/llama-cli /app
97+ COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
9898
9999WORKDIR /app
100100
Original file line number Diff line number Diff line change @@ -105,7 +105,7 @@ WORKDIR /llama.cpp/bin
105105
106106# Copy llama.cpp binaries and libraries
107107COPY --from=collector /llama.cpp/bin/*.so /llama.cpp/bin
108- COPY --from=collector /llama.cpp/bin/llama-cli /llama.cpp/bin
108+ COPY --from=collector /llama.cpp/bin/llama-cli /llama.cpp/bin/llama-completion /llama.cpp/bin
109109
110110ENTRYPOINT [ "/llama.cpp/bin/llama-cli" ]
111111
Original file line number Diff line number Diff line change @@ -13,6 +13,8 @@ elif [[ "$arg1" == '--quantize' || "$arg1" == '-q' ]]; then
1313 exec ./llama-quantize "$@"
1414elif [[ "$arg1" == '--run' || "$arg1" == '-r' ]]; then
1515 exec ./llama-cli "$@"
16+ elif [[ "$arg1" == '--run-legacy' || "$arg1" == '-l' ]]; then
17+ exec ./llama-completion "$@"
1618elif [[ "$arg1" == '--bench' || "$arg1" == '-b' ]]; then
1719 exec ./llama-bench "$@"
1820elif [[ "$arg1" == '--perplexity' || "$arg1" == '-p' ]]; then
@@ -32,8 +34,10 @@ elif [[ "$arg1" == '--server' || "$arg1" == '-s' ]]; then
3234else
3335 echo " Unknown command: $arg1 "
3436 echo " Available commands: "
35- echo " --run (-r): Run a model previously converted into ggml"
36- echo " ex: -m /models/7B/ggml-model-q4_0.bin -p \" Building a website can be done in 10 simple steps:\" -n 512"
37+ echo " --run (-r): Run a model (chat) previously converted into ggml"
38+ echo " ex: -m /models/7B/ggml-model-q4_0.bin"
39+ echo " --run-legacy (-l): Run a model (legacy completion) previously converted into ggml"
40+ echo " ex: -m /models/7B/ggml-model-q4_0.bin -no-cnv -p \" Building a website can be done in 10 simple steps:\" -n 512"
3741 echo " --bench (-b): Benchmark the performance of the inference for various parameters."
3842 echo " ex: -m model.gguf"
3943 echo " --perplexity (-p): Measure the perplexity of a model over a given text."
Original file line number Diff line number Diff line change @@ -68,7 +68,7 @@ ENTRYPOINT ["/app/tools.sh"]
6868# ## Light, CLI only
6969FROM base AS light
7070
71- COPY --from=build /app/full/llama-cli /app
71+ COPY --from=build /app/full/llama-cli /app/full/llama-completion /app
7272
7373WORKDIR /app
7474
You can’t perform that action at this time.
0 commit comments