Skip to content

Commit 477c0a3

Browse files
committed
1 parent 775fda0 commit 477c0a3

File tree

3 files changed

+18
-14
lines changed

3 files changed

+18
-14
lines changed

CMakeLists.txt

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -8,15 +8,16 @@ set(CMAKE_WARN_UNUSED_CLI YES)
88
set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
99

1010
if(CMAKE_SYSTEM_NAME STREQUAL "Android")
11+
set(CMAKE_VERBOSE_MAKEFILE ON)
1112
if(DEFINED HTP_ARCH_VERSION)
1213
if (${HTP_ARCH_VERSION} STREQUAL "v75" OR ${HTP_ARCH_VERSION} STREQUAL "v79")
1314
#works fine on Snapdragon 8 Gen3 & 8 Elite, with 1.5x - 3x performance gains with the default ggml backend
1415
set(OPT_FLAG " -O3 -march=armv8.7-a -mcpu=cortex-x1 -mtune=cortex-x1 -ffp-model=fast -fno-finite-math-only")
1516
message("OPT_FLAG:${OPT_FLAG}")
16-
set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -DGGML_USE_HEXAGON ${DEBUG_FLAG} ${OPT_FLAG}")
17-
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DGGML_USE_HEXAGON ${DEBUG_FLAG} ${OPT_FLAG}")
18-
set(CMAKE_C_FLAGS_RELEASE "${CMAKE_C_FLAGS_RELEASE} -DGGML_USE_HEXAGON ${DEBUG_FLAG} ${OPT_FLAG}")
19-
set(CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS_RELEASE} -DGGML_USE_HEXAGON ${DEBUG_FLAG} ${OPT_FLAG}")
17+
set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -DGGML_USE_HEXAGON -DGGML_USE_LLAMAFILE ${DEBUG_FLAG} ${OPT_FLAG}")
18+
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DGGML_USE_HEXAGON -DGGML_USE_LLAMAFILE ${DEBUG_FLAG} ${OPT_FLAG}")
19+
set(CMAKE_C_FLAGS_RELEASE "${CMAKE_C_FLAGS_RELEASE} -DGGML_USE_HEXAGON -DGGML_USE_LLAMAFILE ${DEBUG_FLAG} ${OPT_FLAG}")
20+
set(CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS_RELEASE} -DGGML_USE_HEXAGON -DGGML_USE_LLAMAFILE ${DEBUG_FLAG} ${OPT_FLAG}")
2021
endif()
2122
endif()
2223
endif()

ggml/src/ggml-hexagon/CMakeLists.txt

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,9 @@ endif()
3939

4040
#check whether user's specified htp arch is valid
4141
set(CHECK_HTP_ARCH "WRONG")
42-
foreach (feat v68 v69 v73 v75 v79)
42+
#ref: https://github.com/quic/ai-hub-apps/tree/main/tutorials/llm_on_genie
43+
#foreach (feat v68 v69 v73 v75 v79)
44+
foreach (feat v73 v75 v79)
4345
if (${feat} STREQUAL ${HTP_ARCH_VERSION})
4446
set(CHECK_HTP_ARCH "GOOD")
4547
endif()

scripts/build-run-android.sh

Lines changed: 10 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -61,23 +61,24 @@ PROMPT_STRING="every day of your life, it is important to take the time to smell
6161
PROMPT_STRING="introduce the movie Once Upon a Time in America briefly.\n"
6262

6363
#for llama-cli, 20.4 MiB in models/t5-very-small-random-F32.gguf
64-
TEST_MODEL_NAME=/sdcard/t5-very-small-random-F32.gguf
64+
#TEST_MODEL_NAME=/sdcard/t5-very-small-random-F32.gguf
6565
#for llama-cli, 1.1 GiB, will be downloaded automatically via this script
6666
#TEST_MODEL_NAME=/sdcard/t5-277M-F32.gguf
67+
TEST_MODEL_NAME=/sdcard/qwen1_5-1_8b-chat-q4_0.gguf
68+
#self-defined LLM models
69+
#TEST_MODEL_NAME=/sdcard/Qwen3-8B-Q8_0.gguf
70+
#TEST_MODEL_NAME=/sdcard/Qwen3-4B-Q8_0.gguf
71+
#TEST_MODEL_NAME=/sdcard/gemma-3-4b-it-Q8_0.gguf
72+
6773

6874
#for llama-bench, 1.12 GiB, will be downloaded automatically via this script
6975
GGUF_MODEL_NAME=/sdcard/qwen1_5-1_8b-chat-q4_0.gguf
7076

71-
#available htp arch version:
72-
#v68 --- Snapdragon 888
73-
#v69 --- Snapdragon 8 Gen1
77+
#ref: https://github.com/quic/ai-hub-apps/tree/main/tutorials/llm_on_genie
78+
#supported HTP arch versions:
7479
#v73 --- Snapdragon 8 Gen2
7580
#v75 --- Snapdragon 8 Gen3
76-
#v79 --- Snapdragon 8 Elite(aka Gen4)
77-
78-
#8Gen1
79-
#HTP_ARCH_VERSION=v69
80-
#HTP_ARCH_VERSION_a=V69
81+
#v79 --- Snapdragon 8 Elite
8182

8283
#8Gen2
8384
#HTP_ARCH_VERSION=v73

0 commit comments

Comments
 (0)