summary refs log tree commit diff
path: root/llama.cpp/scripts/snapdragon/adb
diff options
context:
space:
mode:
Diffstat (limited to 'llama.cpp/scripts/snapdragon/adb')
-rw-r--r-- llama.cpp/scripts/snapdragon/adb/llama-cli.farf 1
-rwxr-xr-x llama.cpp/scripts/snapdragon/adb/run-bench.sh 52
-rwxr-xr-x llama.cpp/scripts/snapdragon/adb/run-cli.sh 59
-rwxr-xr-x llama.cpp/scripts/snapdragon/adb/run-completion.sh 59
-rwxr-xr-x llama.cpp/scripts/snapdragon/adb/run-mtmd.sh 68
-rwxr-xr-x llama.cpp/scripts/snapdragon/adb/run-tool.sh 54
6 files changed, 293 insertions, 0 deletions
diff --git a/llama.cpp/scripts/snapdragon/adb/llama-cli.farf b/llama.cpp/scripts/snapdragon/adb/llama-cli.farf
new file mode 100644
index 0000000..de84fe8
--- /dev/null
+++ b/llama.cpp/scripts/snapdragon/adb/llama-cli.farf
@@ -0,0 +1 @@
+0xffff
diff --git a/llama.cpp/scripts/snapdragon/adb/run-bench.sh b/llama.cpp/scripts/snapdragon/adb/run-bench.sh
new file mode 100755
index 0000000..2750860
--- /dev/null
+++ b/llama.cpp/scripts/snapdragon/adb/run-bench.sh
@@ -0,0 +1,74 @@
+#!/bin/sh
+#
+# Run llama-bench on an Android device over adb.
+#
+# Configuration is read from environment variables:
+#   B       build/branch subdirectory under $basedir (default: .)
+#   S       adb device serial, passed as "adb -s"
+#   H       adb server host, passed as "adb -H"
+#   M       model file name under $basedir/../gguf
+#   D       value for --device (default: HTP0)
+#   V       sets GGML_HEXAGON_VERBOSE and adds -v
+#   E       sets GGML_HEXAGON_EXPERIMENTAL
+#   PROF    sets GGML_HEXAGON_PROFILE (plus GGML_HEXAGON_OPSYNC=1) and adds -v
+#   OPMASK  sets GGML_HEXAGON_OPMASK
+#   NHVX    sets GGML_HEXAGON_NHVX
+#   NDEV    sets GGML_HEXAGON_NDEV
+#   HB      sets GGML_HEXAGON_HOSTBUF
+# Any command-line arguments are appended to the llama-bench invocation.
+
+# Basedir on device
+basedir=/data/local/tmp/llama.cpp
+
+# Start from an empty option list so a cli_opts value inherited from the
+# caller's environment cannot leak into the command line.
+cli_opts=
+
+branch=.
+[ "$B" != "" ] && branch=$B
+
+adbserial=
+[ "$S" != "" ] && adbserial="-s $S"
+
+adbhost=
+[ "$H" != "" ] && adbhost="-H $H"
+
+model="Llama-3.2-3B-Instruct-Q4_0.gguf"
+[ "$M" != "" ] && model="$M"
+
+device="HTP0"
+[ "$D" != "" ] && device="$D"
+
+verbose=
+[ "$V" != "" ] && verbose="GGML_HEXAGON_VERBOSE=$V" cli_opts="$cli_opts -v"
+
+experimental=
+[ "$E" != "" ] && experimental="GGML_HEXAGON_EXPERIMENTAL=$E"
+
+profile=
+[ "$PROF" != "" ] && profile="GGML_HEXAGON_PROFILE=$PROF GGML_HEXAGON_OPSYNC=1" cli_opts="$cli_opts -v"
+
+opmask=
+[ "$OPMASK" != "" ] && opmask="GGML_HEXAGON_OPMASK=$OPMASK"
+
+nhvx=
+[ "$NHVX" != "" ] && nhvx="GGML_HEXAGON_NHVX=$NHVX"
+
+ndev=
+[ "$NDEV" != "" ] && ndev="GGML_HEXAGON_NDEV=$NDEV"
+
+hb=
+[ "$HB" != "" ] && hb="GGML_HEXAGON_HOSTBUF=$HB"
+
+set -x
+
+# The remote command is one quoted string; $* (rather than $@) keeps it a
+# single adb argument. Arguments are interpolated as-is, not re-quoted.
+adb $adbserial $adbhost shell " \
+    cd $basedir; \
+    LD_LIBRARY_PATH=$basedir/$branch/lib \
+    ADSP_LIBRARY_PATH=$basedir/$branch/lib \
+    $ndev $nhvx $opmask $verbose $experimental $profile $hb ./$branch/bin/llama-bench --device $device --mmap 0 -m $basedir/../gguf/$model \
+    --poll 1000 -t 6 --cpu-mask 0xfc --cpu-strict 1 \
+    --batch-size 128 -ngl 99 $cli_opts $* \
+"
diff --git a/llama.cpp/scripts/snapdragon/adb/run-cli.sh b/llama.cpp/scripts/snapdragon/adb/run-cli.sh
new file mode 100755
index 0000000..d19d4e9
--- /dev/null
+++ b/llama.cpp/scripts/snapdragon/adb/run-cli.sh
@@ -0,0 +1,78 @@
+#!/bin/sh
+#
+# Run llama-cli on an Android device over adb.
+#
+# Configuration is read from environment variables:
+#   B       build/branch subdirectory under $basedir (default: .)
+#   S       adb device serial, passed as "adb -s"
+#   H       adb server host, passed as "adb -H"
+#   M       model file name under $basedir/../gguf
+#   D       value for --device (default: HTP0)
+#   E       sets GGML_HEXAGON_EXPERIMENTAL
+#   V       sets GGML_HEXAGON_VERBOSE and adds -v
+#   SCHED   when non-empty, sets GGML_SCHED_DEBUG=2 and adds -v
+#   PROF    sets GGML_HEXAGON_PROFILE (plus GGML_HEXAGON_OPSYNC=1) and adds -v
+#   OPMASK  sets GGML_HEXAGON_OPMASK
+#   NHVX    sets GGML_HEXAGON_NHVX
+#   NDEV    sets GGML_HEXAGON_NDEV
+#   HB      sets GGML_HEXAGON_HOSTBUF
+# Any command-line arguments are appended to the llama-cli invocation.
+
+# Basedir on device
+basedir=/data/local/tmp/llama.cpp
+
+cli_opts=
+
+branch=.
+[ "$B" != "" ] && branch=$B
+
+adbserial=
+[ "$S" != "" ] && adbserial="-s $S"
+
+adbhost=
+[ "$H" != "" ] && adbhost="-H $H"
+
+model="Llama-3.2-3B-Instruct-Q4_0.gguf"
+[ "$M" != "" ] && model="$M"
+
+device="HTP0"
+[ "$D" != "" ] && device="$D"
+
+experimental=
+[ "$E" != "" ] && experimental="GGML_HEXAGON_EXPERIMENTAL=$E"
+
+verbose=
+[ "$V" != "" ] && verbose="GGML_HEXAGON_VERBOSE=$V" cli_opts="$cli_opts -v"
+
+sched=
+[ "$SCHED" != "" ] && sched="GGML_SCHED_DEBUG=2" cli_opts="$cli_opts -v"
+
+profile=
+[ "$PROF" != "" ] && profile="GGML_HEXAGON_PROFILE=$PROF GGML_HEXAGON_OPSYNC=1" cli_opts="$cli_opts -v"
+
+opmask=
+[ "$OPMASK" != "" ] && opmask="GGML_HEXAGON_OPMASK=$OPMASK"
+
+nhvx=
+[ "$NHVX" != "" ] && nhvx="GGML_HEXAGON_NHVX=$NHVX"
+
+ndev=
+[ "$NDEV" != "" ] && ndev="GGML_HEXAGON_NDEV=$NDEV"
+
+hb=
+[ "$HB" != "" ] && hb="GGML_HEXAGON_HOSTBUF=$HB"
+
+set -x
+
+# The remote command is one quoted string; $* (rather than $@) keeps it a
+# single adb argument. Arguments are interpolated as-is, not re-quoted.
+adb $adbserial $adbhost shell " \
+    cd $basedir; ulimit -c unlimited; \
+    LD_LIBRARY_PATH=$basedir/$branch/lib \
+    ADSP_LIBRARY_PATH=$basedir/$branch/lib \
+    $verbose $experimental $sched $opmask $profile $nhvx $ndev $hb \
+    ./$branch/bin/llama-cli --no-mmap -m $basedir/../gguf/$model \
+    --poll 1000 -t 6 --cpu-mask 0xfc --cpu-strict 1 \
+    --ctx-size 8192 --batch-size 128 -fa on \
+    -ngl 99 --device $device $cli_opts $* \
+"
diff --git a/llama.cpp/scripts/snapdragon/adb/run-completion.sh b/llama.cpp/scripts/snapdragon/adb/run-completion.sh
new file mode 100755
index 0000000..da9df11
--- /dev/null
+++ b/llama.cpp/scripts/snapdragon/adb/run-completion.sh
@@ -0,0 +1,78 @@
+#!/bin/sh
+#
+# Run llama-completion (with -no-cnv) on an Android device over adb.
+#
+# Configuration is read from environment variables:
+#   B       build/branch subdirectory under $basedir (default: .)
+#   S       adb device serial, passed as "adb -s"
+#   H       adb server host, passed as "adb -H"
+#   M       model file name under $basedir/../gguf
+#   D       value for --device (default: HTP0)
+#   E       sets GGML_HEXAGON_EXPERIMENTAL
+#   V       sets GGML_HEXAGON_VERBOSE and adds -v
+#   SCHED   when non-empty, sets GGML_SCHED_DEBUG=2 and adds -v
+#   PROF    sets GGML_HEXAGON_PROFILE (plus GGML_HEXAGON_OPSYNC=1) and adds -v
+#   OPMASK  sets GGML_HEXAGON_OPMASK
+#   NHVX    sets GGML_HEXAGON_NHVX
+#   NDEV    sets GGML_HEXAGON_NDEV
+#   HB      sets GGML_HEXAGON_HOSTBUF
+# Any command-line arguments are appended to the llama-completion invocation.
+
+# Basedir on device
+basedir=/data/local/tmp/llama.cpp
+
+cli_opts=
+
+branch=.
+[ "$B" != "" ] && branch=$B
+
+adbserial=
+[ "$S" != "" ] && adbserial="-s $S"
+
+adbhost=
+[ "$H" != "" ] && adbhost="-H $H"
+
+model="Llama-3.2-3B-Instruct-Q4_0.gguf"
+[ "$M" != "" ] && model="$M"
+
+device="HTP0"
+[ "$D" != "" ] && device="$D"
+
+experimental=
+[ "$E" != "" ] && experimental="GGML_HEXAGON_EXPERIMENTAL=$E"
+
+verbose=
+[ "$V" != "" ] && verbose="GGML_HEXAGON_VERBOSE=$V" cli_opts="$cli_opts -v"
+
+sched=
+[ "$SCHED" != "" ] && sched="GGML_SCHED_DEBUG=2" cli_opts="$cli_opts -v"
+
+profile=
+[ "$PROF" != "" ] && profile="GGML_HEXAGON_PROFILE=$PROF GGML_HEXAGON_OPSYNC=1" cli_opts="$cli_opts -v"
+
+opmask=
+[ "$OPMASK" != "" ] && opmask="GGML_HEXAGON_OPMASK=$OPMASK"
+
+nhvx=
+[ "$NHVX" != "" ] && nhvx="GGML_HEXAGON_NHVX=$NHVX"
+
+ndev=
+[ "$NDEV" != "" ] && ndev="GGML_HEXAGON_NDEV=$NDEV"
+
+hb=
+[ "$HB" != "" ] && hb="GGML_HEXAGON_HOSTBUF=$HB"
+
+set -x
+
+# The remote command is one quoted string; $* (rather than $@) keeps it a
+# single adb argument. Arguments are interpolated as-is, not re-quoted.
+adb $adbserial $adbhost shell " \
+    cd $basedir; ulimit -c unlimited; \
+    LD_LIBRARY_PATH=$basedir/$branch/lib \
+    ADSP_LIBRARY_PATH=$basedir/$branch/lib \
+    $verbose $experimental $sched $opmask $profile $nhvx $ndev $hb \
+    ./$branch/bin/llama-completion --no-mmap -m $basedir/../gguf/$model \
+    --poll 1000 -t 6 --cpu-mask 0xfc --cpu-strict 1 \
+    --ctx-size 8192 --batch-size 128 -fa on \
+    -ngl 99 -no-cnv --device $device $cli_opts $* \
+"
diff --git a/llama.cpp/scripts/snapdragon/adb/run-mtmd.sh b/llama.cpp/scripts/snapdragon/adb/run-mtmd.sh
new file mode 100755
index 0000000..fc018e7
--- /dev/null
+++ b/llama.cpp/scripts/snapdragon/adb/run-mtmd.sh
@@ -0,0 +1,91 @@
+#!/bin/sh
+#
+# Run llama-mtmd-cli on an Android device over adb.
+#
+# Configuration is read from environment variables:
+#   B            build/branch subdirectory under $basedir (default: .)
+#   S            adb device serial, passed as "adb -s"
+#   H            adb server host, passed as "adb -H"
+#   M            model file name under $basedir/../gguf
+#   MMPROJ       projector file name under $basedir/../gguf
+#   IMG          image file name under $basedir/../gguf (optional)
+#   D            value for --device (default: HTP0)
+#   V            sets GGML_HEXAGON_VERBOSE (-v is always passed)
+#   E            sets GGML_HEXAGON_EXPERIMENTAL (default: 1)
+#   SCHED        when non-empty, sets GGML_SCHED_DEBUG=2 and adds -v
+#   PROF         sets GGML_HEXAGON_PROFILE (plus GGML_HEXAGON_OPSYNC=1)
+#   OPMASK       sets GGML_HEXAGON_OPMASK
+#   NHVX         sets GGML_HEXAGON_NHVX
+#   NDEV         sets GGML_HEXAGON_NDEV
+#   MTMD_DEVICE  sets MTMD_BACKEND_DEVICE
+# Any command-line arguments are appended to the llama-mtmd-cli invocation.
+
+# Basedir on device
+basedir=/data/local/tmp/llama.cpp
+
+cli_opts=
+
+branch=.
+[ "$B" != "" ] && branch=$B
+
+adbserial=
+[ "$S" != "" ] && adbserial="-s $S"
+
+adbhost=
+[ "$H" != "" ] && adbhost="-H $H"
+
+model="gemma-3-4b-it-Q4_0.gguf"
+[ "$M" != "" ] && model="$M"
+
+mmproj="mmproj-F16.gguf"
+[ "$MMPROJ" != "" ] && mmproj="$MMPROJ"
+
+# Only pass --image when IMG is set; otherwise the option would point at the
+# gguf directory itself.
+image=
+[ "$IMG" != "" ] && image="--image $basedir/../gguf/$IMG"
+
+device="HTP0"
+[ "$D" != "" ] && device="$D"
+
+verbose=
+[ "$V" != "" ] && verbose="GGML_HEXAGON_VERBOSE=$V"
+
+experimental="GGML_HEXAGON_EXPERIMENTAL=1"
+[ "$E" != "" ] && experimental="GGML_HEXAGON_EXPERIMENTAL=$E"
+
+sched=
+[ "$SCHED" != "" ] && sched="GGML_SCHED_DEBUG=2" cli_opts="$cli_opts -v"
+
+profile=
+[ "$PROF" != "" ] && profile="GGML_HEXAGON_PROFILE=$PROF GGML_HEXAGON_OPSYNC=1"
+
+opmask=
+[ "$OPMASK" != "" ] && opmask="GGML_HEXAGON_OPMASK=$OPMASK"
+
+nhvx=
+[ "$NHVX" != "" ] && nhvx="GGML_HEXAGON_NHVX=$NHVX"
+
+ndev=
+[ "$NDEV" != "" ] && ndev="GGML_HEXAGON_NDEV=$NDEV"
+
+# MTMD backend device for vision model (defaults to CPU if not set)
+mtmd_backend=
+[ "$MTMD_DEVICE" != "" ] && mtmd_backend="MTMD_BACKEND_DEVICE=$MTMD_DEVICE"
+
+set -x
+
+# The remote command is one quoted string; $* (rather than $@) keeps it a
+# single adb argument. Arguments are interpolated as-is, not re-quoted.
+adb $adbserial $adbhost shell " \
+    cd $basedir; ulimit -c unlimited; \
+    LD_LIBRARY_PATH=$basedir/$branch/lib \
+    ADSP_LIBRARY_PATH=$basedir/$branch/lib \
+    $verbose $experimental $sched $opmask $profile $nhvx $ndev $mtmd_backend \
+    ./$branch/bin/llama-mtmd-cli --no-mmap -m $basedir/../gguf/$model \
+    --mmproj $basedir/../gguf/$mmproj \
+    $image \
+    --poll 1000 -t 6 --cpu-mask 0xfc --cpu-strict 1 \
+    --ctx-size 8192 --batch-size 128 -ctk q8_0 -ctv q8_0 -fa on \
+    -ngl 99 --device $device -v $cli_opts $* \
+"
diff --git a/llama.cpp/scripts/snapdragon/adb/run-tool.sh b/llama.cpp/scripts/snapdragon/adb/run-tool.sh
new file mode 100755
index 0000000..4647ede
--- /dev/null
+++ b/llama.cpp/scripts/snapdragon/adb/run-tool.sh
@@ -0,0 +1,77 @@
+#!/bin/sh
+#
+# Run a tool from the build's bin directory on an Android device over adb.
+#
+# Usage: run-tool.sh <tool> [tool args...]
+#
+# Configuration is read from environment variables:
+#   B       build/branch subdirectory under $basedir (default: .)
+#   S       adb device serial, passed as "adb -s"
+#   H       adb server host, passed as "adb -H"
+#   D       stored in $device; currently not passed to the tool
+#   V       sets GGML_HEXAGON_VERBOSE
+#   E       sets GGML_HEXAGON_EXPERIMENTAL
+#   SCHED   when non-empty, sets GGML_SCHED_DEBUG=2 (the -v it adds to cli_opts is not passed on)
+#   PROF    sets GGML_HEXAGON_PROFILE (plus GGML_HEXAGON_OPSYNC=1)
+#   OPMASK  sets GGML_HEXAGON_OPMASK
+#   NHVX    sets GGML_HEXAGON_NHVX
+#   NDEV    sets GGML_HEXAGON_NDEV
+#   HB      sets GGML_HEXAGON_HOSTBUF
+
+# Basedir on device
+basedir=/data/local/tmp/llama.cpp
+
+cli_opts=
+
+branch=.
+[ "$B" != "" ] && branch=$B
+
+adbserial=
+[ "$S" != "" ] && adbserial="-s $S"
+
+adbhost=
+[ "$H" != "" ] && adbhost="-H $H"
+
+device="HTP0"
+[ "$D" != "" ] && device="$D"
+
+verbose=
+[ "$V" != "" ] && verbose="GGML_HEXAGON_VERBOSE=$V"
+
+experimental=
+[ "$E" != "" ] && experimental="GGML_HEXAGON_EXPERIMENTAL=$E"
+
+sched=
+[ "$SCHED" != "" ] && sched="GGML_SCHED_DEBUG=2" cli_opts="$cli_opts -v"
+
+profile=
+[ "$PROF" != "" ] && profile="GGML_HEXAGON_PROFILE=$PROF GGML_HEXAGON_OPSYNC=1"
+
+opmask=
+[ "$OPMASK" != "" ] && opmask="GGML_HEXAGON_OPMASK=$OPMASK"
+
+nhvx=
+[ "$NHVX" != "" ] && nhvx="GGML_HEXAGON_NHVX=$NHVX"
+
+ndev=
+[ "$NDEV" != "" ] && ndev="GGML_HEXAGON_NDEV=$NDEV"
+
+hb=
+[ "$HB" != "" ] && hb="GGML_HEXAGON_HOSTBUF=$HB"
+
+# The first argument names the binary; without it the remote command would
+# try to execute the bin directory itself.
+[ "$#" -ge 1 ] || { echo "usage: $0 <tool> [tool args...]" >&2; exit 1; }
+
+set -x
+
+tool=$1; shift
+
+# The remote command is one quoted string; $* (rather than $@) keeps it a
+# single adb argument. Arguments are interpolated as-is, not re-quoted.
+adb $adbserial $adbhost shell " \
+    cd $basedir; ulimit -c unlimited; \
+    LD_LIBRARY_PATH=$basedir/$branch/lib \
+    ADSP_LIBRARY_PATH=$basedir/$branch/lib \
+    $verbose $experimental $sched $opmask $profile $nhvx $ndev $hb ./$branch/bin/$tool $* \
+"