Spaces:
Running
on
T4
Running
on
T4
ggml -> gguf to get rid of a warning
Browse files - Dockerfile +5 -5
Dockerfile
CHANGED
|
@@ -11,8 +11,8 @@ WORKDIR /opt/koboldcpp
|
|
| 11 |
COPY *.json /opt/koboldcpp/
|
| 12 |
RUN curl -fLo koboldcpp https://koboldai.org/cpplinuxcu12
|
| 13 |
RUN chmod +x ./koboldcpp
|
| 14 |
-
RUN curl -fLo model.
|
| 15 |
-
RUN curl -fLo imgmodel.
|
| 16 |
-
RUN curl -fLo mmproj.
|
| 17 |
-
RUN curl -fLo whispermodel.
|
| 18 |
-
CMD ./koboldcpp --model model.
|
|
|
|
| 11 |
COPY *.json /opt/koboldcpp/
|
| 12 |
RUN curl -fLo koboldcpp https://koboldai.org/cpplinuxcu12
|
| 13 |
RUN chmod +x ./koboldcpp
|
| 14 |
+
RUN curl -fLo model.gguf $MODEL || true
|
| 15 |
+
RUN curl -fLo imgmodel.gguf $IMGMODEL || true
|
| 16 |
+
RUN curl -fLo mmproj.gguf $MMPROJ || true
|
| 17 |
+
RUN curl -fLo whispermodel.gguf $WHISPERMODEL || true
|
| 18 |
+
CMD ./koboldcpp --model model.gguf --whispermodel whispermodel.gguf --sdmodel imgmodel.gguf --sdthreads 4 --sdquant --sdclamped --mmproj mmproj.gguf $ADDITIONAL --port 7860 --hordemodelname $MODEL_NAME --hordemaxctx 1 --hordegenlen 1 --quiet --preloadstory default.json --chatcompletionsadapter adapter.json --ignoremissing $SECRET
|