summaryrefslogtreecommitdiff
path: root/llama.cpp/scripts/snapdragon/qdc
diff options
context:
space:
mode:
Diffstat (limited to 'llama.cpp/scripts/snapdragon/qdc')
-rw-r--r--llama.cpp/scripts/snapdragon/qdc/readme.md1
-rw-r--r--llama.cpp/scripts/snapdragon/qdc/requirements.txt25
-rw-r--r--llama.cpp/scripts/snapdragon/qdc/tests/test_bench.py63
3 files changed, 89 insertions, 0 deletions
diff --git a/llama.cpp/scripts/snapdragon/qdc/readme.md b/llama.cpp/scripts/snapdragon/qdc/readme.md
new file mode 100644
index 0000000..b92cf24
--- /dev/null
+++ b/llama.cpp/scripts/snapdragon/qdc/readme.md
@@ -0,0 +1 @@
+This directory includes pytest based scripts for running CI jobs on Qualcomm Device Cloud (QDC).
diff --git a/llama.cpp/scripts/snapdragon/qdc/requirements.txt b/llama.cpp/scripts/snapdragon/qdc/requirements.txt
new file mode 100644
index 0000000..f04bd68
--- /dev/null
+++ b/llama.cpp/scripts/snapdragon/qdc/requirements.txt
@@ -0,0 +1,25 @@
+Appium-Python-Client==5.2.4
+attrs==25.4.0
+certifi==2025.10.5
+exceptiongroup==1.3.0
+h11==0.16.0
+idna==3.11
+iniconfig==2.1.0
+outcome==1.3.0.post0
+packaging==25.0
+pluggy==1.6.0
+Pygments==2.19.2
+PySocks==1.7.1
+pytest==8.4.2
+pytest-dependency==0.6.0
+selenium==4.36.0
+setuptools==80.9.0
+sniffio==1.3.1
+sortedcontainers==2.4.0
+tomli==2.3.0
+trio==0.31.0
+trio-websocket==0.12.2
+typing_extensions==4.15.0
+urllib3==2.5.0
+websocket-client==1.9.0
+wsproto==1.2.0
diff --git a/llama.cpp/scripts/snapdragon/qdc/tests/test_bench.py b/llama.cpp/scripts/snapdragon/qdc/tests/test_bench.py
new file mode 100644
index 0000000..651ab5b
--- /dev/null
+++ b/llama.cpp/scripts/snapdragon/qdc/tests/test_bench.py
@@ -0,0 +1,63 @@
+import pytest
+import subprocess
+import sys
+
+tmp_path='/data/local/tmp'
+pkg_path=f'{tmp_path}/llama.cpp'
+lib_path=f'{pkg_path}/lib'
+bin_path=f'{pkg_path}/bin'
+
+model='../gguf/Llama-3.2-1B-Instruct-Q4_0.gguf'
+cli_pref=f'cd {pkg_path} && LD_LIBRARY_PATH={lib_path} ADSP_LIBRARY_PATH={lib_path} {bin_path}'
+
+
+def run_cmd(cmd):
+ p = subprocess.run(cmd, text = True, stdout = subprocess.PIPE, stderr = subprocess.STDOUT)
+ sys.stdout.write(p.stdout)
+ assert(p.returncode == 0)
+
+
+@pytest.mark.dependency()
+def test_install():
+ run_cmd(['adb', 'push', 'llama.cpp', f'{tmp_path}'])
+ run_cmd(['adb', 'shell', f'chmod 755 {bin_path}/*'])
+
+
+## Basic cli tests
+def run_llama_cli(dev, opts):
+ prompt='what is the most popular cookie in the world?\nPlease provide a very brief bullet point summary.\nBegin your answer with **BEGIN**.'
+ opts = '--batch-size 128 -n 128 -no-cnv --seed 42 ' + opts
+ run_cmd(['adb', 'shell', f'{cli_pref}/llama-cli -m {model} --device {dev} -ngl 99 -t 4 {opts} -p "{prompt}"'])
+
+
+@pytest.mark.dependency(depends=['test_install'])
+def test_llama_cli_cpu():
+ run_llama_cli('none', '-ctk q8_0 -ctv q8_0 -fa on')
+
+
+@pytest.mark.dependency(depends=['test_install'])
+def test_llama_cli_gpu():
+ run_llama_cli('GPUOpenCL', '-fa on')
+
+
+@pytest.mark.dependency(depends=['test_install'])
+def test_llama_cli_npu():
+ run_llama_cli('HTP0', '-ctk q8_0 -ctv q8_0 -fa on')
+
+
+## Basic bench tests
+def run_llama_bench(dev):
+ run_cmd(['adb', 'shell', f'{cli_pref}/llama-bench -m {model} --device {dev} -ngl 99 --batch-size 128 -t 4 -p 128 -n 32'])
+
+
+@pytest.mark.dependency(depends=['test_install'])
+def test_llama_bench_cpu():
+ run_llama_bench('none')
+
+
+def test_llama_bench_gpu():
+ run_llama_bench('GPUOpenCL')
+
+
+def test_llama_bench_npu():
+ run_llama_bench('HTP0')