From 2081ed5bd218a1fc228c1d0750cd3661a5516678 Mon Sep 17 00:00:00 2001 From: Jhen-Jie Hong Date: Wed, 18 Oct 2023 23:48:01 -0500 Subject: [PATCH] feat(android): enable armv8.2-a+fp16+dotprod (#27) * feat(android): enable armv8.2-a+fp16+dotprod * feat(android): split library --- android/src/main/CMakeLists.txt | 59 +++++++++++-------- .../main/java/com/rnllama/LlamaContext.java | 42 ++++++++++++- 2 files changed, 77 insertions(+), 24 deletions(-) diff --git a/android/src/main/CMakeLists.txt b/android/src/main/CMakeLists.txt index e38f9116..4db8a7aa 100644 --- a/android/src/main/CMakeLists.txt +++ b/android/src/main/CMakeLists.txt @@ -5,6 +5,8 @@ project(llama.rn) set(CMAKE_CXX_STANDARD 11) set(RNLLAMA_LIB_DIR ${CMAKE_SOURCE_DIR}/../../../cpp) +include_directories(${RNLLAMA_LIB_DIR}) + set( SOURCE_FILES ${RNLLAMA_LIB_DIR}/ggml-alloc.c @@ -19,36 +21,47 @@ set( ${CMAKE_SOURCE_DIR}/jni.cpp ) -set(RNLLAMA_LIBRARY_NAME rnllama) +find_library(LOG_LIB log) -add_library( - ${RNLLAMA_LIBRARY_NAME} - SHARED - ${SOURCE_FILES} -) +function(build_library target_name) + add_library( + ${target_name} + SHARED + ${SOURCE_FILES} + ) -find_library(LOG_LIB log) + target_link_libraries(${target_name} ${LOG_LIB} android) -target_link_libraries(${RNLLAMA_LIBRARY_NAME} ${LOG_LIB} android) -include_directories(${RNLLAMA_LIB_DIR}) + if (${target_name} STREQUAL "rnllama_v8fp16_va") + target_compile_options(${target_name} PRIVATE -march=armv8.2-a+fp16+dotprod) + endif () -target_compile_options(${RNLLAMA_LIBRARY_NAME} PRIVATE -DLM_GGML_USE_K_QUANTS -pthread) + target_compile_options(${target_name} PRIVATE -DLM_GGML_USE_K_QUANTS -pthread) -if (${CMAKE_BUILD_TYPE} STREQUAL "Debug") - target_compile_options(${RNLLAMA_LIBRARY_NAME} PRIVATE -DRNLLAMA_ANDROID_ENABLE_LOGGING) -endif () + if (${target_name} STREQUAL "rnllama_v8fp16_va") + target_compile_options(${target_name} PRIVATE -march=armv8.2-a+fp16+dotprod) + endif () + + if (${CMAKE_BUILD_TYPE} STREQUAL "Debug") + target_compile_options(${target_name} PRIVATE -DRNLLAMA_ANDROID_ENABLE_LOGGING) + endif () -# NOTE: If you want to debug the native code, you can uncomment if and endif -# if (NOT ${CMAKE_BUILD_TYPE} STREQUAL "Debug") + # NOTE: If you want to debug the native code, you can uncomment if and endif + # if (NOT ${CMAKE_BUILD_TYPE} STREQUAL "Debug") -target_compile_options(${RNLLAMA_LIBRARY_NAME} PRIVATE -Ofast -DNDEBUG) -target_compile_options(${RNLLAMA_LIBRARY_NAME} PRIVATE -fvisibility=hidden -fvisibility-inlines-hidden) -target_compile_options(${RNLLAMA_LIBRARY_NAME} PRIVATE -ffunction-sections -fdata-sections) + target_compile_options(${target_name} PRIVATE -Ofast -DNDEBUG) + target_compile_options(${target_name} PRIVATE -fvisibility=hidden -fvisibility-inlines-hidden) + target_compile_options(${target_name} PRIVATE -ffunction-sections -fdata-sections) -target_link_options(${RNLLAMA_LIBRARY_NAME} PRIVATE -Wl,--gc-sections) -target_link_options(${RNLLAMA_LIBRARY_NAME} PRIVATE -Wl,--exclude-libs,ALL) -target_link_options(${RNLLAMA_LIBRARY_NAME} PRIVATE -flto) + target_link_options(${target_name} PRIVATE -Wl,--gc-sections) + target_link_options(${target_name} PRIVATE -Wl,--exclude-libs,ALL) + target_link_options(${target_name} PRIVATE -flto) -# endif () + # endif () +endfunction() -# target_compile_features(${RNLLAMA_LIBRARY_NAME} PRIVATE exceptions) +build_library("rnllama") # Default target + +if (${ANDROID_ABI} STREQUAL "arm64-v8a") + build_library("rnllama_v8fp16_va") +endif () diff --git a/android/src/main/java/com/rnllama/LlamaContext.java b/android/src/main/java/com/rnllama/LlamaContext.java index 19c4848b..ba9b6938 100644 --- a/android/src/main/java/com/rnllama/LlamaContext.java +++ b/android/src/main/java/com/rnllama/LlamaContext.java @@ -211,7 +211,30 @@ public void release() { } static { - if (LlamaContext.isArm64V8a() == true || LlamaContext.isX86_64() == true) { + Log.d(NAME, "Primary ABI: " + Build.SUPPORTED_ABIS[0]); + if (LlamaContext.isArm64V8a()) { + boolean loadV8fp16 = false; + if (LlamaContext.isArm64V8a()) { + // ARMv8.2a needs runtime detection support + String cpuInfo = LlamaContext.cpuInfo(); + if (cpuInfo != null) { + Log.d(NAME, "CPU info: " + cpuInfo); + if (cpuInfo.contains("fphp")) { + Log.d(NAME, "CPU supports fp16 arithmetic"); + loadV8fp16 = true; + } + } + } + + if (loadV8fp16) { + Log.d(NAME, "Loading librnllama_v8fp16_va.so"); + System.loadLibrary("rnllama_v8fp16_va"); + } else { + Log.d(NAME, "Loading librnllama.so"); + System.loadLibrary("rnllama"); + } + } else if (LlamaContext.isX86_64()) { + Log.d(NAME, "Loading librnllama.so"); System.loadLibrary("rnllama"); } } @@ -224,6 +247,23 @@ private static boolean isX86_64() { return Build.SUPPORTED_ABIS[0].equals("x86_64"); } + private static String cpuInfo() { + File file = new File("/proc/cpuinfo"); + StringBuilder stringBuilder = new StringBuilder(); + try { + BufferedReader bufferedReader = new BufferedReader(new FileReader(file)); + String line; + while ((line = bufferedReader.readLine()) != null) { + stringBuilder.append(line); + } + bufferedReader.close(); + return stringBuilder.toString(); + } catch (IOException e) { + Log.w(NAME, "Couldn't read /proc/cpuinfo", e); + return null; + } + } + protected static native long initContext( String model, boolean embedding,