adding more threads
This commit is contained in:
@@ -19,7 +19,7 @@ RUN <<eot
|
|||||||
apt -qy install --no-install-recommends \
|
apt -qy install --no-install-recommends \
|
||||||
-o APT::Install-Recommends=false \
|
-o APT::Install-Recommends=false \
|
||||||
-o APT::Install-Suggests=false \
|
-o APT::Install-Suggests=false \
|
||||||
console-setup tzdata dbus x11-utils x11-xserver-utils rocm-smi mesa-vulkan-drivers
|
console-setup tzdata dbus x11-utils x11-xserver-utils dbus-x11 rocm-smi mesa-vulkan-drivers
|
||||||
apt -qy update
|
apt -qy update
|
||||||
DEBIAN_FRONTEND=noninteractive apt -qy install --no-install-recommends \
|
DEBIAN_FRONTEND=noninteractive apt -qy install --no-install-recommends \
|
||||||
-o APT::Install-Recommends=false \
|
-o APT::Install-Recommends=false \
|
||||||
@@ -37,6 +37,8 @@ RUN <<eot
|
|||||||
eot
|
eot
|
||||||
|
|
||||||
ENV DISPLAY=:99
|
ENV DISPLAY=:99
|
||||||
|
# NOTE: unverified - not sure that setting LLAMA_THREADS has any effect
|
||||||
|
ENV LLAMA_THREADS=12
|
||||||
|
|
||||||
#########################
|
#########################
|
||||||
|
|
||||||
|
|||||||
@@ -1,18 +1,24 @@
|
|||||||
#!/bin/bash
|
#!/bin/bash
|
||||||
|
|
||||||
rm /tmp/.X99-lock
|
#set GPU Power profile to COMPUTE
|
||||||
Xvfb :99 -screen 0 1920x1080x16 &
|
/usr/bin/rocm-smi --setprofile 4
|
||||||
|
|
||||||
|
rm -f /tmp/.X99-lock
|
||||||
|
# Create /run/dbus before the system dbus-daemon is started below.
# -p keeps this step from failing when the directory already exists.
mkdir -p /run/dbus
|
||||||
|
|
||||||
|
/usr/bin/dbus-daemon --fork --system
|
||||||
|
Xvfb :99 -screen 0 1920x1600x16 &
|
||||||
sleep 2
|
sleep 2
|
||||||
# -----------------------------------
|
# -----------------------------------
|
||||||
|
|
||||||
/squashfs-root/lm-studio --no-sandbox &
|
/squashfs-root/lm-studio --no-sandbox --threads 12 &
|
||||||
sleep 30
|
sleep 30
|
||||||
~/.lmstudio/bin/lms server start --cors &
|
~/.lmstudio/bin/lms server start --cors &
|
||||||
|
|
||||||
|
|
||||||
sleep 5
|
sleep 5
|
||||||
# ~/.cache/lm-studio/bin/lms get ${MODEL_PATH}
|
# ~/.cache/lm-studio/bin/lms get ${MODEL_PATH}
|
||||||
~/.lmstudio/bin/lms load --ttl 3600 --context-length ${CONTEXT_LENGTH:-16384} ${MODEL_IDENTIFIER} &
|
# Load the model in the background. MODEL_IDENTIFIER falls back to
# openai/gpt-oss-20b when unset or empty; note the ':-' operator — a bare ':'
# is substring expansion and would never apply the default.
~/.lmstudio/bin/lms load --ttl 3600 --context-length "${CONTEXT_LENGTH:-16384}" "${MODEL_IDENTIFIER:-openai/gpt-oss-20b}" &
|
||||||
|
|
||||||
sleep 20
|
sleep 20
|
||||||
cp -f /http-server-config.json /root/.lmstudio/.internal/http-server-config.json
|
cp -f /http-server-config.json /root/.lmstudio/.internal/http-server-config.json
|
||||||
|
|||||||
Reference in New Issue
Block a user