adding more threads

This commit is contained in:
2025-11-10 12:12:20 +01:00
parent c017384ad1
commit 254f71bf47
2 changed files with 13 additions and 5 deletions

View File

@@ -19,7 +19,7 @@ RUN <<eot
apt -qy install --no-install-recommends \
-o APT::Install-Recommends=false \
-o APT::Install-Suggests=false \
console-setup tzdata dbus x11-utils x11-xserver-utils rocm-smi mesa-vulkan-drivers
console-setup tzdata dbus x11-utils x11-xserver-utils dbus-x11 rocm-smi mesa-vulkan-drivers
apt -qy update
DEBIAN_FRONTEND=noninteractive apt -qy install --no-install-recommends \
-o APT::Install-Recommends=false \
@@ -37,6 +37,8 @@ RUN <<eot
eot
ENV DISPLAY=:99
# Not sure that this works: unverified whether the LLAMA_THREADS variable set below is honored at runtime
ENV LLAMA_THREADS=12
#########################

View File

@@ -1,18 +1,24 @@
#!/bin/bash
rm /tmp/.X99-lock
Xvfb :99 -screen 0 1920x1080x16 &
#set GPU Power profile to COMPUTE
/usr/bin/rocm-smi --setprofile 4
rm -f /tmp/.X99-lock
# Create the directory used by the system D-Bus daemon started on the next line.
# -p keeps this from failing when /run/dbus already exists (e.g. the script is re-run).
mkdir -p /run/dbus
/usr/bin/dbus-daemon --fork --system
Xvfb :99 -screen 0 1920x1600x16 &
sleep 2
# -----------------------------------
/squashfs-root/lm-studio --no-sandbox &
# Launch LM Studio in the background. The thread count is taken from
# LLAMA_THREADS when it is set and non-empty, otherwise it stays at the
# previously hard-coded value of 12.
/squashfs-root/lm-studio --no-sandbox --threads "${LLAMA_THREADS:-12}" &
sleep 30
~/.lmstudio/bin/lms server start --cors &
sleep 5
# ~/.cache/lm-studio/bin/lms get ${MODEL_PATH}
~/.lmstudio/bin/lms load --ttl 3600 --context-length ${CONTEXT_LENGTH:-16384} ${MODEL_IDENTIFIER} &
# Load the model in the background. CONTEXT_LENGTH defaults to 16384 and
# MODEL_IDENTIFIER defaults to openai/gpt-oss-20b when unset or empty.
# The default must be written with ":-"; a bare ":" makes bash treat the text
# as a substring offset, so the fallback model would never be used.
~/.lmstudio/bin/lms load --ttl 3600 --context-length "${CONTEXT_LENGTH:-16384}" "${MODEL_IDENTIFIER:-openai/gpt-oss-20b}" &
sleep 20
cp -f /http-server-config.json /root/.lmstudio/.internal/http-server-config.json