diff --git a/.github/workflows/build-aar.yml b/.github/workflows/build-aar.yml new file mode 100644 index 00000000..1fcd3453 --- /dev/null +++ b/.github/workflows/build-aar.yml @@ -0,0 +1,104 @@ +name: Build Android AAR + +on: + push: + branches: + - main + - android-sdk + pull_request: + +jobs: + build: + name: Build AAR + runs-on: ubuntu-latest + if: github.event_name == 'push' + + steps: + - name: Checkout code + uses: actions/checkout@v3 + + - name: Set up JDK 17 + uses: actions/setup-java@v3 + with: + distribution: 'temurin' + java-version: '17' + + - name: Cache Gradle packages + uses: actions/cache@v3 + with: + path: ~/.gradle/caches + key: ${{ runner.os }}-gradle-${{ hashFiles('**/*.gradle*', '**/gradle-wrapper.properties') }} + restore-keys: | + ${{ runner.os }}-gradle- + + - name: Navigate to android Directory and Build AAR + run: | + echo "Navigating to the example directory..." + cd android/llama.android + echo "Starting Gradle build process in $(pwd)..." + ./gradlew assembleRelease --stacktrace --info + shell: bash + + - name: Rename and upload AAR + run: | + echo "Navigating to the android directory to find AAR output..." + cd android/llama.android + mkdir -p ../artifacts + ls -ld ../artifacts || echo "Artifacts directory does not exist." + AAR_PATH=$(find ./llama/build/outputs/aar -type f -name "*.aar" | head -n 1) + if [ -z "$AAR_PATH" ]; then + echo "No AAR file found. Build might have failed." + exit 1 + fi + BRANCH_NAME=${{ github.ref_name }} + CUSTOM_NAME="com-nexa-${BRANCH_NAME}-${{ github.run_number }}.aar" + echo "Found AAR at $AAR_PATH, renaming to $CUSTOM_NAME..." + mv "$AAR_PATH" "../artifacts/$CUSTOM_NAME" + shell: bash + + - name: Upload AAR as an artifact + uses: actions/upload-artifact@v3 + with: + name: custom-aar-${{ github.ref_name }}-${{ github.run_number }} + path: android/artifacts/ + + release: + name: Create GitHub Release + needs: build + runs-on: ubuntu-latest + if: github.event_name == 'push' && contains(github.ref, 'main') + + steps: + - name: Checkout code + uses: actions/checkout@v3 + + - name: Download Artifacts + uses: actions/download-artifact@v3 + with: + name: custom-aar-${{ github.ref_name }}-${{ github.run_number }} + path: release-artifacts + + - name: Create Release + id: create_release + uses: actions/create-release@v1 + env: + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} + with: + tag_name: v${{ github.run_number }} + release_name: "Release v${{ github.run_number }}" + body: | + This is an automated release containing the latest AAR build. 
+ - **Branch:** ${{ github.ref_name }} + - **Build Number:** ${{ github.run_number }} + draft: false + prerelease: false + + - name: Upload AAR to Release + uses: actions/upload-release-asset@v1 + env: + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} + with: + upload_url: ${{ steps.create_release.outputs.upload_url }} + asset_path: release-artifacts/com-nexa-${{ github.ref_name }}-${{ github.run_number }}.aar + asset_name: com-nexa-${{ github.ref_name }}-${{ github.run_number }}.aar + asset_content_type: application/java-archive \ No newline at end of file diff --git a/.github/workflows/build-wheels-vulkan-win.yaml b/.github/workflows/build-wheels-vulkan-win.yaml index ac362195..ca68208d 100644 --- a/.github/workflows/build-wheels-vulkan-win.yaml +++ b/.github/workflows/build-wheels-vulkan-win.yaml @@ -1,11 +1,8 @@ name: Build Wheels (Vulkan) (Windows) - on: workflow_dispatch: - permissions: contents: write - jobs: define_matrix: name: Define Build Matrix @@ -15,7 +12,6 @@ jobs: defaults: run: shell: pwsh - steps: - name: Define Job Output id: set-matrix @@ -26,10 +22,8 @@ jobs: 'vulkan_version' = @("1.3.261.1") 'releasetag' = @("basic") } - $matrixOut = ConvertTo-Json $matrix -Compress Write-Output ('matrix=' + $matrixOut) >> $env:GITHUB_OUTPUT - build_wheels: name: Build Wheel ${{ matrix.os }} Python ${{ matrix.pyver }} needs: define_matrix @@ -42,64 +36,58 @@ jobs: env: VULKAN_VERSION: ${{ matrix.vulkan_version }} RELEASE_TAG: ${{ matrix.releasetag }} - steps: - name: Add MSBuild to PATH if: runner.os == 'Windows' uses: microsoft/setup-msbuild@v2 with: vs-version: "[16.11,16.12)" - + msbuild-architecture: x64 - name: Checkout Repository uses: actions/checkout@v4 with: submodules: "recursive" - - name: Install Vulkan SDK run: | curl.exe -o $env:RUNNER_TEMP\VulkanSDK-Installer.exe -L "https://sdk.lunarg.com/sdk/download/${{ env.VULKAN_VERSION }}/windows/VulkanSDK-${{ env.VULKAN_VERSION }}-Installer.exe" & "$env:RUNNER_TEMP\VulkanSDK-Installer.exe" --accept-licenses --default-answer --confirm-command install Add-Content -Path $env:GITHUB_ENV -Value "VULKAN_SDK=C:\VulkanSDK\${{ env.VULKAN_VERSION }}" Add-Content -Path $env:GITHUB_PATH -Value "C:\VulkanSDK\${{ env.VULKAN_VERSION }}\Bin" - - name: Setup Python uses: actions/setup-python@v5 with: python-version: ${{ matrix.pyver }} architecture: 'x64' cache: "pip" - - name: Install Ninja Build System run: choco install ninja -y - - name: Install Build Dependencies run: | python -m pip install --upgrade pip python -m pip install build wheel setuptools cmake ninja - # Install additional dependencies if needed python -m pip install scikit-build - - name: Build Wheel run: | # Set environment variables for CMake and Vulkan - $env:CMAKE_ARGS="-DGGML_VULKAN=ON" + $env:CMAKE_ARGS="-DGGML_VULKAN=ON -DCMAKE_C_COMPILER=cl -DCMAKE_CXX_COMPILER=cl" $env:VULKAN_SDK="C:\VulkanSDK\${{ env.VULKAN_VERSION }}" $env:PATH="$env:VULKAN_SDK\Bin;$env:PATH" - + + # Set MSVC compiler flags to fix Windows SDK header issues + $env:CFLAGS="/D_CRT_SECURE_NO_WARNINGS /DWIN32_LEAN_AND_MEAN /DNOMINMAX /D_WIN32_WINNT=0x0601" + $env:CXXFLAGS="/D_CRT_SECURE_NO_WARNINGS /DWIN32_LEAN_AND_MEAN /DNOMINMAX /D_WIN32_WINNT=0x0601" + # Build the wheel python -m build --wheel - - name: Upload Wheel Artifact uses: actions/upload-artifact@v4 with: path: dist/*.whl name: llama-vulkan-wheel-python${{ matrix.pyver }}.whl - - name: Create GitHub Release uses: softprops/action-gh-release@v2 with: files: dist/* - # Set tag name to -vulkan - tag_name: ${{ github.ref_name }}-vulkan${{ 
env.VULKAN_VERSION }} + tag_name: ${{ github.ref_name }}-vulkan env: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} \ No newline at end of file diff --git a/.github/workflows/ci.yaml b/.github/workflows/ci.yaml index 8ce64f0f..c63c3e1f 100644 --- a/.github/workflows/ci.yaml +++ b/.github/workflows/ci.yaml @@ -29,6 +29,14 @@ jobs: with: python-version: ${{ matrix.python-version }} + - name: Cache pip packages + uses: actions/cache@v3 + with: + path: ~/.cache/pip + key: ${{ runner.os }}-pip-${{ hashFiles('**/requirements.txt') }} + restore-keys: | + ${{ runner.os }}-pip- + - name: Install dependencies run: | python -m pip install --upgrade pip @@ -61,4 +69,4 @@ jobs: - name: Run tests run: | python -m pytest tests - shell: bash + shell: bash \ No newline at end of file diff --git a/.github/workflows/generate-index-from-release.yaml b/.github/workflows/generate-index-from-release.yaml index 11741cab..b993847a 100644 --- a/.github/workflows/generate-index-from-release.yaml +++ b/.github/workflows/generate-index-from-release.yaml @@ -3,7 +3,7 @@ name: Wheels Index on: # Trigger on new release workflow_run: - workflows: ["Release", "Build Wheels (CUDA)", "Build Wheels (Metal)", "Build Wheels (ROCm)", "Build Wheels (Vulkan)"] + workflows: ["Build Wheels (CPU)", "Build Wheels (CUDA)", "Build Wheels (Metal)", "Build Wheels (ROCm)", "Build Wheels (Vulkan)"] types: - completed diff --git a/.gitignore b/.gitignore index 9063bffa..a22e3c43 100644 --- a/.gitignore +++ b/.gitignore @@ -90,4 +90,13 @@ build_*/ .cache/ # tests -quantization_test.py \ No newline at end of file +quantization_test.py + +# Swift +.swiftpm/ +UserInterfaceState.xcuserstate +xcuserdata/ +*.xcworkspace/xcuserdata/ +*.playground/playground.xcworkspace/xcuserdata/ +*.generated.plist +.build/ \ No newline at end of file diff --git a/CLI.md b/CLI.md index 5c4f4ab4..5f219047 100644 --- a/CLI.md +++ b/CLI.md @@ -31,7 +31,7 @@ options: ### List Local Models -List all models on your local computer. +List all models on your local computer. You can use `nexa run ` to run any model shown in the list. ``` nexa list @@ -46,11 +46,12 @@ nexa pull MODEL_PATH usage: nexa pull [-h] model_path positional arguments: - model_path Path or identifier for the model in Nexa Model Hub, or Hugging Face repo ID when using -hf flag + model_path Path or identifier for the model in Nexa Model Hub, Hugging Face repo ID when using -hf flag, or ModelScope model ID when using -ms flag options: -h, --help show this help message and exit -hf, --huggingface Pull model from Hugging Face Hub + -ms, --modelscope Pull model from ModelScope Hub -o, --output_path OUTPUT_PATH Custom output path for the pulled model ``` @@ -96,11 +97,13 @@ Run a model on your local computer. If the model file is not yet downloaded, it By default, `nexa` will run gguf models. To run onnx models, use `nexa onnx MODEL_PATH` +You can run any model shown in `nexa list` command. 
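To make the pull, list, and run flow concrete, here is a minimal sketch; the model identifiers are simply ones already used as examples elsewhere in these docs, so substitute your own:

```bash
# Pull a model by its Nexa Model Hub identifier
nexa pull llama3.2

# Or pull a GGUF repo from ModelScope with the -ms flag
nexa pull -ms Qwen/Qwen2.5-Coder-7B-Instruct-GGUF

# See what is available locally, then run any entry from that list
nexa list
nexa run llama3.2
```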
+ #### Run Text-Generation Model ``` nexa run MODEL_PATH -usage: nexa run [-h] [-t TEMPERATURE] [-m MAX_NEW_TOKENS] [-k TOP_K] [-p TOP_P] [-sw [STOP_WORDS ...]] [-pf] [-st] [-lp] [-mt {NLP, COMPUTER_VISION, MULTIMODAL, AUDIO}] [-hf] model_path +usage: nexa run [-h] [-t TEMPERATURE] [-m MAX_NEW_TOKENS] [-k TOP_K] [-p TOP_P] [-sw [STOP_WORDS ...]] [-pf] [-st] [-lp] [-mt {NLP, COMPUTER_VISION, MULTIMODAL, AUDIO}] [-hf] [-ms] model_path positional arguments: model_path Path or identifier for the model in Nexa Model Hub @@ -109,9 +112,10 @@ options: -h, --help show this help message and exit -pf, --profiling Enable profiling logs for the inference process -st, --streamlit Run the inference in Streamlit UI, can be used with -lp or -hf - -lp, --local_path Indicate that the model path provided is the local path, must be used with -mt - -mt, --model_type Indicate the model running type, must be used with -lp or -hf, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO] - -hf, --huggingface Load model from Hugging Face Hub, must be used with -mt + -lp, --local_path Indicate that the model path provided is the local path + -mt, --model_type Indicate the model running type, must be used with -lp or -hf or -ms, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO] + -hf, --huggingface Load model from Hugging Face Hub + -ms, --modelscope Load model from ModelScope Hub Text generation options: -t, --temperature TEMPERATURE @@ -135,7 +139,7 @@ nexa run llama2 ``` nexa run MODEL_PATH -usage: nexa run [-h] [-i2i] [-ns NUM_INFERENCE_STEPS] [-np NUM_IMAGES_PER_PROMPT] [-H HEIGHT] [-W WIDTH] [-g GUIDANCE_SCALE] [-o OUTPUT] [-s RANDOM_SEED] [-st] [-lp] [-mt {NLP, COMPUTER_VISION, MULTIMODAL, AUDIO}] [-hf] model_path +usage: nexa run [-h] [-i2i] [-ns NUM_INFERENCE_STEPS] [-np NUM_IMAGES_PER_PROMPT] [-H HEIGHT] [-W WIDTH] [-g GUIDANCE_SCALE] [-o OUTPUT] [-s RANDOM_SEED] [-st] [-lp] [-mt {NLP, COMPUTER_VISION, MULTIMODAL, AUDIO}] [-hf] [-ms] model_path positional arguments: model_path Path or identifier for the model in Nexa Model Hub @@ -143,9 +147,10 @@ positional arguments: options: -h, --help show this help message and exit -st, --streamlit Run the inference in Streamlit UI, can be used with -lp or -hf - -lp, --local_path Indicate that the model path provided is the local path, must be used with -mt - -mt, --model_type Indicate the model running type, must be used with -lp or -hf, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO] - -hf, --huggingface Load model from Hugging Face Hub, must be used with -mt + -lp, --local_path Indicate that the model path provided is the local path + -mt, --model_type Indicate the model running type, must be used with -lp or -hf or -ms, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO] + -hf, --huggingface Load model from Hugging Face Hub + -ms, --modelscope Load model from ModelScope Hub Image generation options: -i2i, --img2img Whether to run image-to-image generation @@ -180,7 +185,7 @@ nexa run sd1-4 ``` nexa run MODEL_PATH -usage: nexa run [-h] [-t TEMPERATURE] [-m MAX_NEW_TOKENS] [-k TOP_K] [-p TOP_P] [-sw [STOP_WORDS ...]] [-pf] [-st] [-lp] [-mt {NLP, COMPUTER_VISION, MULTIMODAL, AUDIO}] [-hf] model_path +usage: nexa run [-h] [-t TEMPERATURE] [-m MAX_NEW_TOKENS] [-k TOP_K] [-p TOP_P] [-sw [STOP_WORDS ...]] [-pf] [-st] [-lp] [-mt {NLP, COMPUTER_VISION, MULTIMODAL, AUDIO}] [-hf] [-ms] model_path positional arguments: model_path Path or identifier for the model in Nexa Model Hub @@ -189,9 +194,10 @@ options: -h, --help show this help message and exit -pf, --profiling 
Enable profiling logs for the inference process -st, --streamlit Run the inference in Streamlit UI, can be used with -lp or -hf - -lp, --local_path Indicate that the model path provided is the local path, must be used with -mt - -mt, --model_type Indicate the model running type, must be used with -lp or -hf, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO] - -hf, --huggingface Load model from Hugging Face Hub, must be used with -mt + -lp, --local_path Indicate that the model path provided is the local path + -mt, --model_type Indicate the model running type, must be used with -lp or -hf or -ms, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO] + -hf, --huggingface Load model from Hugging Face Hub + -ms, --modelscope Load model from ModelScope Hub VLM generation options: -t, --temperature TEMPERATURE @@ -215,7 +221,7 @@ nexa run nanollava ``` nexa run MODEL_PATH -usage: nexa run [-h] [-o OUTPUT_DIR] [-b BEAM_SIZE] [-l LANGUAGE] [--task TASK] [-t TEMPERATURE] [-c COMPUTE_TYPE] [-st] [-lp] [-mt {NLP, COMPUTER_VISION, MULTIMODAL, AUDIO}] [-hf] model_path +usage: nexa run [-h] [-o OUTPUT_DIR] [-b BEAM_SIZE] [-l LANGUAGE] [--task TASK] [-t TEMPERATURE] [-c COMPUTE_TYPE] [-st] [-lp] [-mt {NLP, COMPUTER_VISION, MULTIMODAL, AUDIO}] [-hf] [-ms] model_path positional arguments: model_path Path or identifier for the model in Nexa Model Hub @@ -223,9 +229,10 @@ positional arguments: options: -h, --help show this help message and exit -st, --streamlit Run the inference in Streamlit UI, can be used with -lp or -hf - -lp, --local_path Indicate that the model path provided is the local path, must be used with -mt - -mt, --model_type Indicate the model running type, must be used with -lp or -hf, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO] - -hf, --huggingface Load model from Hugging Face Hub, must be used with -mt + -lp, --local_path Indicate that the model path provided is the local path + -mt, --model_type Indicate the model running type, must be used with -lp or -hf or -ms, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO] + -hf, --huggingface Load model from Hugging Face Hub + -ms, --modelscope Load model from ModelScope Hub Automatic Speech Recognition options: -b, --beam_size BEAM_SIZE @@ -249,7 +256,7 @@ nexa run faster-whisper-tiny ``` nexa embed MODEL_PATH -usage: nexa embed [-h] [-lp] [-hf] [-n] [-nt] model_path prompt +usage: nexa embed [-h] [-lp] [-hf] [-ms] [-n] [-nt] model_path prompt positional arguments: model_path Path or identifier for the model in Nexa Model Hub @@ -257,8 +264,9 @@ positional arguments: options: -h, --help show this help message and exit - -lp, --local_path Indicate that the model path provided is the local path, must be used with -mt - -hf, --huggingface Load model from Hugging Face Hub, must be used with -mt + -lp, --local_path Indicate that the model path provided is the local path + -hf, --huggingface Load model from Hugging Face Hub + -ms, --modelscope Load model from ModelScope Hub -n, --normalize Normalize the embeddings -nt, --no_truncate Not truncate the embeddings ``` @@ -274,6 +282,10 @@ nexa embed sentence-transformers/all-MiniLM-L6-v2:gguf-fp16 "I love Nexa AI." >> ### Convert and quantize a Hugging Face Model to GGUF +Additional package `nexa-gguf` is required to run this command. + +You can install it by `pip install "nexaai[convert]"` or `pip install nexa-gguf`. 
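As a minimal sketch of that setup (the model ID is simply the one used in the README's convert example), installing the extra and running a first conversion might look like this; the full usage and options follow below:

```bash
# Install the optional GGUF conversion dependencies (either form works)
pip install "nexaai[convert]"

# Convert a Hugging Face model to GGUF
nexa convert HuggingFaceTB/SmolLM2-135M-Instruct
```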
+ ``` nexa convert HF_MODEL_PATH [ftype] [output_file] usage: nexa convert [-h] [-t NTHREAD] [--convert_type CONVERT_TYPE] [--bigendian] [--use_temp_file] [--no_lazy] @@ -312,6 +324,7 @@ options: --only_copy Only copy tensors (ignores ftype, allow_requantize, and quantize_output_tensor) --pure Quantize all tensors to the default type --keep_split Quantize to the same number of shards + -ms --modelscope Load model from ModelScope Hub ``` #### Example @@ -335,16 +348,17 @@ Start a local server using models on your local computer. ``` nexa server MODEL_PATH -usage: nexa server [-h] [--host HOST] [--port PORT] [--reload] [-lp] [-mt {NLP, COMPUTER_VISION, MULTIMODAL, AUDIO}] [-hf] model_path +usage: nexa server [-h] [--host HOST] [--port PORT] [--reload] [-lp] [-mt {NLP, COMPUTER_VISION, MULTIMODAL, AUDIO}] [-hf] [-ms] model_path positional arguments: model_path Path or identifier for the model in S3 options: -h, --help show this help message and exit - -lp, --local_path Indicate that the model path provided is the local path, must be used with -mt - -mt, --model_type Indicate the model running type, must be used with -lp or -hf, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO] - -hf, --huggingface Load model from Hugging Face Hub, must be used with -mt + -lp, --local_path Indicate that the model path provided is the local path + -mt, --model_type Indicate the model running type, must be used with -lp or -hf or -ms, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO] + -hf, --huggingface Load model from Hugging Face Hub + -ms, --modelscope Load model from ModelScope Hub --host HOST Host to bind the server to --port PORT Port to bind the server to --reload Enable automatic reloading on code changes diff --git a/CMakeLists.txt b/CMakeLists.txt index 4670bff2..41738eb8 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -3,9 +3,43 @@ project(nexa_gguf) include(ExternalProject) +# Platform-specific settings +if(WIN32) + # Windows-specific settings + add_definitions(-D_CRT_SECURE_NO_WARNINGS) + # OpenMP is optional on Windows + find_package(OpenMP QUIET) + if(NOT OpenMP_FOUND) + message(STATUS "OpenMP not found - OpenMP support will be disabled") + set(OpenMP_C_FLAGS "") + set(OpenMP_CXX_FLAGS "") + set(OpenMP_EXE_LINKER_FLAGS "") + endif() +elseif(APPLE) + # macOS-specific settings + find_package(OpenMP QUIET) + if(NOT OpenMP_FOUND) + message(STATUS "OpenMP not found - OpenMP support will be disabled") + set(OpenMP_C_FLAGS "") + set(OpenMP_CXX_FLAGS "") + set(OpenMP_EXE_LINKER_FLAGS "") + endif() +else() + # Linux and other Unix systems + find_package(OpenMP REQUIRED) +endif() + set(CMAKE_POSITION_INDEPENDENT_CODE ON) set(CMAKE_CXX_STANDARD 17) +# Windows-specific configurations +if(WIN32) + add_definitions(-D_CRT_SECURE_NO_WARNINGS) + add_definitions(-DNOMINMAX) + add_definitions(-D_WIN32_WINNT=0x0A00) # Target Windows 10 or later + set(CMAKE_WINDOWS_EXPORT_ALL_SYMBOLS ON) +endif() + # Function to collect all user-defined options function(get_all_options output_var) get_cmake_property(variables VARIABLES) @@ -101,10 +135,11 @@ if(STABLE_DIFFUSION_BUILD) -DBUILD_SHARED_LIBS=ON -DSD_METAL=${GGML_METAL} -DSD_CUBLAS=${GGML_CUDA} + -DSD_HIPBLAS=${GGML_HIPBLAS} + -DSD_VULKAN=${GGML_VULKAN} BUILD_ALWAYS 1 BUILD_COMMAND ${CMAKE_COMMAND} --build . --config Release -- ${MSBUILD_ARGS} INSTALL_COMMAND ${CMAKE_COMMAND} --build . 
--config Release --target install - LOG_INSTALL 1 ) endif() @@ -114,6 +149,18 @@ if(LLAMA_BUILD) set(LLAMA_CUDA ${GGML_CUDA}) set(LLAMA_METAL ${GGML_METAL}) + if(WIN32) + # Add Windows-specific definitions and flags for llama.cpp + list(APPEND COMMON_CMAKE_OPTIONS + -DCMAKE_WINDOWS_EXPORT_ALL_SYMBOLS=ON + -DLLAMA_NATIVE=OFF # Disable native CPU optimizations on Windows + -DLLAMA_DISABLE_CXXABI=ON # Disable cxxabi.h dependency + ) + + # Add compile definition for all targets + add_compile_definitions(LLAMA_DISABLE_CXXABI) + endif() + ExternalProject_Add(llama_project SOURCE_DIR ${CMAKE_CURRENT_SOURCE_DIR}/dependency/llama.cpp BINARY_DIR ${CMAKE_CURRENT_BINARY_DIR}/llama_build @@ -123,8 +170,12 @@ if(LLAMA_BUILD) -DCMAKE_INSTALL_PREFIX=${CMAKE_CURRENT_BINARY_DIR}/llama_install -DCMAKE_POSITION_INDEPENDENT_CODE=ON -DCMAKE_CXX_STANDARD=17 + -DBUILD_SHARED_LIBS=ON -DLLAMA_CUDA=${LLAMA_CUDA} -DLLAMA_METAL=${LLAMA_METAL} + -DCMAKE_C_FLAGS=${OpenMP_C_FLAGS} + -DCMAKE_CXX_FLAGS=${OpenMP_CXX_FLAGS} + -DCMAKE_EXE_LINKER_FLAGS=${OpenMP_EXE_LINKER_FLAGS} -DGGML_AVX=$,$>>,OFF,ON> -DGGML_AVX2=$,$>>,OFF,ON> -DGGML_FMA=$,$>>,OFF,ON> @@ -137,8 +188,13 @@ if(LLAMA_BUILD) endif() # bark_cpp project -option(BARK_BUILD "Build bark.cpp" ON) +# Temporarily disabled since version v0.0.9.3 +option(BARK_BUILD "Build bark.cpp" OFF) if(BARK_BUILD) + # Filter out HIPBLAS and Vulkan options for bark.cpp since it doesn't support them + set(BARK_CMAKE_OPTIONS ${USER_DEFINED_OPTIONS}) + list(FILTER BARK_CMAKE_OPTIONS EXCLUDE REGEX "GGML_HIPBLAS|GGML_VULKAN") + ExternalProject_Add(bark_project SOURCE_DIR ${CMAKE_CURRENT_SOURCE_DIR}/dependency/bark.cpp BINARY_DIR ${CMAKE_CURRENT_BINARY_DIR}/bark_build @@ -149,7 +205,7 @@ if(BARK_BUILD) -DCMAKE_POSITION_INDEPENDENT_CODE=ON -DCMAKE_CXX_STANDARD=17 -DGGML_CUDA=${GGML_CUDA} - -DGGML_METAL=${GGML_METAL} + -DGGML_METAL=OFF -DBUILD_SHARED_LIBS=ON -DBARK_BUILD_EXAMPLES=OFF BUILD_ALWAYS 1 diff --git a/Package.swift b/Package.swift new file mode 100644 index 00000000..a5ffa87f --- /dev/null +++ b/Package.swift @@ -0,0 +1,32 @@ +// swift-tools-version: 6.0 + +import PackageDescription + +let package = Package( + name: "NexaSwift", + platforms: [ + .macOS(.v15), + .iOS(.v18), + .watchOS(.v11), + .tvOS(.v18), + .visionOS(.v2) + ], + products: [ + .library(name: "NexaSwift", targets: ["NexaSwift"]), + ], + dependencies: [ + .package(url: "https://github.com/ggerganov/llama.cpp.git", branch: "master") + ], + targets: [ + .target( + name: "NexaSwift", + dependencies: [ + .product(name: "llama", package: "llama.cpp") + ], + path: "swift/Sources/NexaSwift"), + .testTarget( + name: "NexaSwiftTests", + dependencies: ["NexaSwift"], + path: "swift/Tests/NexaSwiftTests"), + ] +) diff --git a/README.md b/README.md index d685f756..17887873 100644 --- a/README.md +++ b/README.md @@ -1,59 +1,50 @@ -
- -

Nexa SDK

- -[![MacOS][MacOS-image]][release-url] [![Linux][Linux-image]][release-url] [![Windows][Windows-image]][release-url] - -[![GitHub Release](https://img.shields.io/github/v/release/NexaAI/nexa-sdk)](https://github.com/NexaAI/nexa-sdk/releases/latest) [![Build workflow](https://img.shields.io/github/actions/workflow/status/NexaAI/nexa-sdk/ci.yaml?label=CI&logo=github)](https://github.com/NexaAI/nexa-sdk/actions/workflows/ci.yaml?query=branch%3Amain) ![GitHub License](https://img.shields.io/github/license/NexaAI/nexa-sdk) - - - -[![Discord](https://dcbadge.limes.pink/api/server/thRu2HaK4D?style=flat&compact=true)](https://discord.gg/thRu2HaK4D) + -[On-device Model Hub](https://model-hub.nexa4ai.com/) / [Nexa SDK Documentation](https://docs.nexaai.com/) +

Nexa SDK - Local On-Device Inference Framework

[release-url]: https://github.com/NexaAI/nexa-sdk/releases [Windows-image]: https://img.shields.io/badge/windows-0078D4?logo=windows [MacOS-image]: https://img.shields.io/badge/-MacOS-black?logo=apple [Linux-image]: https://img.shields.io/badge/-Linux-333?logo=ubuntu -
+[![MacOS][MacOS-image]][release-url] [![Linux][Linux-image]][release-url] [![Windows][Windows-image]][release-url] [![](https://img.shields.io/endpoint?url=https%3A%2F%2Fswiftpackageindex.com%2Fapi%2Fpackages%2FNexaAI%2Fnexa-sdk%2Fbadge%3Ftype%3Dplatforms)](https://swiftpackageindex.com/NexaAI/nexa-sdk) [![Build workflow](https://img.shields.io/github/actions/workflow/status/NexaAI/nexa-sdk/ci.yaml?label=CI&logo=github)](https://github.com/NexaAI/nexa-sdk/actions/workflows/ci.yaml?query=branch%3Amain) ![GitHub License](https://img.shields.io/github/license/NexaAI/nexa-sdk) [![GitHub Release](https://img.shields.io/github/v/release/NexaAI/nexa-sdk)](https://github.com/NexaAI/nexa-sdk/releases/latest) -Nexa SDK is a comprehensive toolkit for supporting **ONNX** and **GGML** models. It supports text generation, image generation, vision-language models (VLM), and speech-to-text (ASR), and text-to-speech (TTS) capabilities. Additionally, it offers an OpenAI-compatible API server with JSON schema mode for function calling and streaming support, and a user-friendly Streamlit UI. Users can run Nexa SDK in any device with Python environment, and GPU acceleration is supported, including CUDA, Metal, and ROCm. An executable version is also available. +[**On-Device Model Hub**](https://nexa.ai/models) | [**Documentation**](https://docs.nexa.ai/) | [**Discord**](https://discord.gg/thRu2HaK4D) | [**Blogs**](https://nexa.ai/blogs) | [**X (Twitter)**](https://x.com/nexa_ai) - +**Nexa SDK** is a local on-device inference framework for ONNX and GGML models, supporting text generation, image generation, vision-language models (VLM), audio-language models, speech-to-text (ASR), and text-to-speech (TTS) capabilities. Installable via Python Package or Executable Installer. + +### Features + +- **Device Support:** CPU, GPU (CUDA, Metal, ROCm), iOS +- **Server:** OpenAI-compatible API, JSON schema for function calling and streaming support +- **Local UI:** Streamlit for interactive model deployment and testing ## Latest News 🔥 -- [2024/10] Support embedding model: `nexa embed ` -- [2024/10] Support pull and run supported Computer Vision models in GGUF format from HuggingFace: `nexa run -hf -mt COMPUTER_VISION` -- [2024/10] Support VLM in local server. -- [2024/10] Added option to customize maximum context window for NLP and VLM models. -- [2024/10] Support running model from user's local path -- [2024/10] Added LoRA support for NLP models. 
-- [2024/10] Added support for whisper-large-v3-turbo: `nexa run faster-whisper-large-turbo` -- [2024/10] Added support for AMD-Llama-135m: `nexa run AMD-Llama-135m:fp16` -- [2024/09] Nexa now has executables for easy installation: [Install Nexa SDK](https://nexaai.com/download-sdk) ✨ -- [2024/09] Added support for Llama 3.2 models: `nexa run llama3.2` -- [2024/09] Added support for Qwen2.5, Qwen2.5-coder and Qwen2.5-Math models: `nexa run qwen2.5` -- [2024/09] Support pull and run NLP models in GGUF format from HuggingFace: `nexa run -hf -mt NLP` -- [2024/09] Added support for ROCm -- [2024/09] Added support for Phi-3.5 models: `nexa run phi3.5` -- [2024/09] Added support for OpenELM models: `nexa run openelm` -- [2024/09] Introduced logits API support for more advanced model interactions -- [2024/09] Added support for Flux models: `nexa run flux` -- [2024/09] Added support for Stable Diffusion 3 model: `nexa run sd3` -- [2024/09] Added support for Stable Diffusion 2.1 model: `nexa run sd2-1` +- Support Nexa AI's own vision language model (0.9B parameters): `nexa run omniVLM` and audio language model (2.9B parameters): `nexa run omniaudio` +- Support audio language model: `nexa run qwen2audio`, **we are the first open-source toolkit to support audio language model with GGML tensor library.** +- Support iOS Swift binding for local inference on **iOS mobile** devices. +- Support embedding model: `nexa embed ` +- Support pull and run supported Computer Vision models in GGUF format from HuggingFace or ModelScope: `nexa run -hf -mt COMPUTER_VISION` or `nexa run -ms -mt COMPUTER_VISION` +- Support pull and run NLP models in GGUF format from HuggingFace or ModelScope: `nexa run -hf -mt NLP` or `nexa run -ms -mt NLP` Welcome to submit your requests through [issues](https://github.com/NexaAI/nexa-sdk/issues/new/choose), we ship weekly. -## Installation - Executable +## Install Option 1: Executable Installer -### macOS +

+ + macOS Installer + +

-[Download](https://public-storage.nexa4ai.com/nexa-sdk-executable-installer/nexa-macos-installer.pkg) +

+ + Windows Installer + +

-### Linux + Linux Installer ```bash curl -fsSL https://public-storage.nexa4ai.com/install.sh | sh @@ -70,32 +61,24 @@ nexa-exe -### Windows - -Coming soon. Install with Python package below 👇 - -## Installation - Python Package - -We have released pre-built wheels for various Python versions, platforms, and backends for convenient installation on our [index page](https://nexaai.github.io/nexa-sdk/whl/). +## Install Option 2: Python Package -> [!NOTE] -> -> 1. If you want to use ONNX model, just replace `pip install nexaai` with `pip install "nexaai[onnx]"` in provided commands. -> 2. If you want to convert and quantize huggingface models to GGUF models, just replace `pip install nexaai` with `pip install "nexaai[nexa-gguf]"`. -> 3. For Chinese developers, we recommend you to use Tsinghua Open Source Mirror as extra index url, just replace `--extra-index-url https://pypi.org/simple` with `--extra-index-url https://pypi.tuna.tsinghua.edu.cn/simple` in provided commands. +We have released pre-built wheels for various Python versions, platforms, and backends for convenient installation on our [index page](https://github.nexa.ai/whl/). -#### CPU +
CPU ```bash -pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/cpu --extra-index-url https://pypi.org/simple --no-cache-dir +pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/cpu --extra-index-url https://pypi.org/simple --no-cache-dir ``` -#### GPU (Metal) +
+ +
Apple GPU (Metal) For the GPU version supporting **Metal (macOS)**: ```bash -CMAKE_ARGS="-DGGML_METAL=ON -DSD_METAL=ON" pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/metal --extra-index-url https://pypi.org/simple --no-cache-dir +CMAKE_ARGS="-DGGML_METAL=ON -DSD_METAL=ON" pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/metal --extra-index-url https://pypi.org/simple --no-cache-dir ```
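As an optional sanity check (nothing here is required), running any small model from the Model Hub will confirm the Metal build works end to end, for example:

```bash
# Text generation goes through the llama.cpp Metal backend (GGML_METAL=ON)
nexa run llama3.2

# Image generation goes through the stable-diffusion.cpp Metal backend (SD_METAL=ON)
nexa run sd1-4
```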
@@ -108,37 +91,38 @@ wget https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge bash Miniforge3-MacOSX-arm64.sh conda create -n nexasdk python=3.10 conda activate nexasdk -CMAKE_ARGS="-DGGML_METAL=ON -DSD_METAL=ON" pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/metal --extra-index-url https://pypi.org/simple --no-cache-dir +CMAKE_ARGS="-DGGML_METAL=ON -DSD_METAL=ON" pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/metal --extra-index-url https://pypi.org/simple --no-cache-dir ``` +
-#### GPU (CUDA) +
Nvidia GPU (CUDA) To install with CUDA support, make sure you have [CUDA Toolkit 12.0 or later](https://developer.nvidia.com/cuda-12-0-0-download-archive) installed. For **Linux**: ```bash -CMAKE_ARGS="-DGGML_CUDA=ON -DSD_CUBLAS=ON" pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/cu124 --extra-index-url https://pypi.org/simple --no-cache-dir +CMAKE_ARGS="-DGGML_CUDA=ON -DSD_CUBLAS=ON" pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/cu124 --extra-index-url https://pypi.org/simple --no-cache-dir ``` For **Windows PowerShell**: ```bash -$env:CMAKE_ARGS="-DGGML_CUDA=ON -DSD_CUBLAS=ON"; pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/cu124 --extra-index-url https://pypi.org/simple --no-cache-dir +$env:CMAKE_ARGS="-DGGML_CUDA=ON -DSD_CUBLAS=ON"; pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/cu124 --extra-index-url https://pypi.org/simple --no-cache-dir ``` For **Windows Command Prompt**: ```bash -set CMAKE_ARGS="-DGGML_CUDA=ON -DSD_CUBLAS=ON" & pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/cu124 --extra-index-url https://pypi.org/simple --no-cache-dir +set CMAKE_ARGS="-DGGML_CUDA=ON -DSD_CUBLAS=ON" & pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/cu124 --extra-index-url https://pypi.org/simple --no-cache-dir ``` For **Windows Git Bash**: ```bash -CMAKE_ARGS="-DGGML_CUDA=ON -DSD_CUBLAS=ON" pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/cu124 --extra-index-url https://pypi.org/simple --no-cache-dir +CMAKE_ARGS="-DGGML_CUDA=ON -DSD_CUBLAS=ON" pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/cu124 --extra-index-url https://pypi.org/simple --no-cache-dir ```
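Before installing, it can help to confirm that the toolkit requirement above is actually met; `nvidia-smi` and `nvcc` are standard NVIDIA tools, not part of Nexa SDK:

```bash
# Check that the driver sees your GPU
nvidia-smi

# Check the CUDA Toolkit version on PATH (should be 12.0 or later)
nvcc --version
```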
@@ -156,39 +140,45 @@ CMAKE_ARGS="-DCMAKE_CXX_FLAGS=-fopenmp" pip install nexaai
-#### GPU (ROCm) +
+ +
AMD GPU (ROCm) To install with ROCm support, make sure you have [ROCm 6.2.1 or later](https://rocm.docs.amd.com/projects/install-on-linux/en/docs-6.2.1/install/quick-start.html) installed. For **Linux**: ```bash -CMAKE_ARGS="-DGGML_HIPBLAS=on" pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/rocm621 --extra-index-url https://pypi.org/simple --no-cache-dir +CMAKE_ARGS="-DGGML_HIPBLAS=on" pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/rocm621 --extra-index-url https://pypi.org/simple --no-cache-dir ``` -#### GPU (Vulkan) +
+ +
GPU (Vulkan) To install with Vulkan support, make sure you have [Vulkan SDK 1.3.261.1 or later](https://vulkan.lunarg.com/sdk/home) installed. For **Windows PowerShell**: ```bash -$env:CMAKE_ARGS="-DGGML_VULKAN=on"; pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/vulkan --extra-index-url https://pypi.org/simple --no-cache-dir +$env:CMAKE_ARGS="-DGGML_VULKAN=on"; pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/vulkan --extra-index-url https://pypi.org/simple --no-cache-dir ``` For **Windows Command Prompt**: ```bash -set CMAKE_ARGS="-DGGML_VULKAN=on" & pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/vulkan --extra-index-url https://pypi.org/simple --no-cache-dir +set CMAKE_ARGS="-DGGML_VULKAN=on" & pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/vulkan --extra-index-url https://pypi.org/simple --no-cache-dir ``` For **Windows Git Bash**: ```bash -CMAKE_ARGS="-DGGML_VULKAN=on" pip install nexaai --prefer-binary --index-url https://nexaai.github.io/nexa-sdk/whl/vulkan --extra-index-url https://pypi.org/simple --no-cache-dir +CMAKE_ARGS="-DGGML_VULKAN=on" pip install nexaai --prefer-binary --index-url https://github.nexa.ai/whl/vulkan --extra-index-url https://pypi.org/simple --no-cache-dir ``` -### Local Build +
+ +
Local Build How to clone this repo @@ -208,105 +198,109 @@ Then you can build and install the package pip install -e . ``` -## Features - -- **Model Support:** - - - **ONNX & GGML models** - - **Conversion Engine** - - **Inference Engine**: - - **Text Generation** - - **Image Generation** - - **Vision-Language Models (VLM)** - - **Speech-to-Text (ASR)** - -Detailed API documentation is available [here](https://docs.nexaai.com/). +
-- **Server:** - - OpenAI-compatible API - - JSON schema mode for function calling - - Streaming support -- **Streamlit UI** for interactive model deployment and testing +## Differentiation Below is our differentiation from other similar tools: -| **Feature** | **[Nexa SDK](https://github.com/NexaAI/nexa-sdk)** | **[ollama](https://github.com/ollama/ollama)** | **[Optimum](https://github.com/huggingface/optimum)** | **[LM Studio](https://github.com/lmstudio-ai)** | -| -------------------------- | :------------------------------------------------: | :--------------------------------------------: | :---------------------------------------------------: | :---------------------------------------------: | -| **GGML Support** | ✅ | ✅ | ❌ | ✅ | -| **ONNX Support** | ✅ | ❌ | ✅ | ❌ | -| **Text Generation** | ✅ | ✅ | ✅ | ✅ | -| **Image Generation** | ✅ | ❌ | ❌ | ❌ | -| **Vision-Language Models** | ✅ | ✅ | ✅ | ✅ | -| **Text-to-Speech** | ✅ | ❌ | ✅ | ❌ | -| **Server Capability** | ✅ | ✅ | ✅ | ✅ | -| **User Interface** | ✅ | ❌ | ❌ | ✅ | +| **Feature** | **[Nexa SDK](https://github.com/NexaAI/nexa-sdk)** | **[ollama](https://github.com/ollama/ollama)** | **[Optimum](https://github.com/huggingface/optimum)** | **[LM Studio](https://github.com/lmstudio-ai)** | +| --------------------------- | :------------------------------------------------: | :--------------------------------------------: | :---------------------------------------------------: | :---------------------------------------------: | +| **GGML Support** | ✅ | ✅ | ❌ | ✅ | +| **ONNX Support** | ✅ | ❌ | ✅ | ❌ | +| **Text Generation** | ✅ | ✅ | ✅ | ✅ | +| **Image Generation** | ✅ | ❌ | ❌ | ❌ | +| **Vision-Language Models** | ✅ | ✅ | ✅ | ✅ | +| **Audio-Language Models** | ✅ | ❌ | ❌ | ❌ | +| **Text-to-Speech** | ✅ | ❌ | ✅ | ❌ | +| **Server Capability** | ✅ | ✅ | ✅ | ✅ | +| **User Interface** | ✅ | ❌ | ❌ | ✅ | +| **Executable Installation** | ✅ | ✅ | ❌ | ✅ | ## Supported Models & Model Hub Our on-device model hub offers all types of quantized models (text, image, audio, multimodal) with filters for RAM, file size, Tasks, etc. to help you easily explore models with UI. 
Explore on-device models at [On-device Model Hub](https://model-hub.nexa4ai.com/) -Supported models (full list at [Model Hub](https://nexa.ai/models)): +Supported model examples (full list at [Model Hub](https://nexa.ai/models)): | Model | Type | Format | Command | | ------------------------------------------------------------------------------------------------------- | --------------- | --------- | -------------------------------------- | -| [octopus-v2](https://www.nexaai.com/NexaAI/Octopus-v2/gguf-q4_0/readme) | NLP | GGUF | `nexa run octopus-v2` | -| [octopus-v4](https://www.nexaai.com/NexaAI/Octopus-v4/gguf-q4_0/readme) | NLP | GGUF | `nexa run octopus-v4` | -| [gpt2](https://nexaai.com/openai/gpt2/gguf-q4_0/readme) | NLP | GGUF | `nexa run gpt2` | -| [tinyllama](https://www.nexaai.com/TinyLlama/TinyLlama-1.1B-Chat-v1.0/gguf-fp16/readme) | NLP | GGUF | `nexa run tinyllama` | -| [llama2](https://www.nexaai.com/meta/Llama2-7b-chat/gguf-q4_0/readme) | NLP | GGUF/ONNX | `nexa run llama2` | -| [llama2-uncensored](https://www.nexaai.com/georgesung/Llama2-7b-chat-uncensored/gguf-q4_0/readme) | NLP | GGUF | `nexa run llama2-uncensored` | -| [llama2-function-calling](https://www.nexaai.com/Trelis/Llama2-7b-function-calling/gguf-q4_K_M/readme) | NLP | GGUF | `nexa run llama2-function-calling` | -| [llama3](https://www.nexaai.com/meta/Llama3-8B-Instruct/gguf-q4_0/readme) | NLP | GGUF/ONNX | `nexa run llama3` | -| [llama3.1](https://www.nexaai.com/meta/Llama3.1-8B-Instruct/gguf-q4_0/readme) | NLP | GGUF/ONNX | `nexa run llama3.1` | -| [llama3.2](https://nexaai.com/meta/Llama3.2-3B-Instruct/gguf-q4_0/readme) | NLP | GGUF | `nexa run llama3.2` | -| [llama3-uncensored](https://www.nexaai.com/Orenguteng/Llama3-8B-Lexi-Uncensored/gguf-q4_K_M/readme) | NLP | GGUF | `nexa run llama3-uncensored` | -| [gemma](https://www.nexaai.com/google/gemma-1.1-2b-instruct/gguf-q4_0/readme) | NLP | GGUF/ONNX | `nexa run gemma` | -| [gemma2](https://www.nexaai.com/google/gemma-2-2b-instruct/gguf-q4_0/readme) | NLP | GGUF | `nexa run gemma2` | -| [qwen1.5](https://www.nexaai.com/Qwen/Qwen1.5-7B-Instruct/gguf-q4_0/readme) | NLP | GGUF | `nexa run qwen1.5` | -| [qwen2](https://www.nexaai.com/Qwen/Qwen2-1.5B-Instruct/gguf-q4_0/readme) | NLP | GGUF/ONNX | `nexa run qwen2` | -| [qwen2.5](https://www.nexaai.com/Qwen/Qwen2.5-1.5B-Instruct/gguf-q4_0/readme) | NLP | GGUF | `nexa run qwen2.5` | -| [mathqwen](https://nexaai.com/Qwen/Qwen2.5-Math-1.5B-Instruct/gguf-q4_0/readme) | NLP | GGUF | `nexa run mathqwen` | -| [codeqwen](https://www.nexaai.com/Qwen/CodeQwen1.5-7B-Instruct/gguf-q4_0/readme) | NLP | GGUF | `nexa run codeqwen` | -| [mistral](https://www.nexaai.com/mistralai/Mistral-7B-Instruct-v0.3/gguf-q4_0/readme) | NLP | GGUF/ONNX | `nexa run mistral` | -| [dolphin-mistral](https://www.nexaai.com/CognitiveComputations/dolphin-2.8-mistral-7b/gguf-q4_0/readme) | NLP | GGUF | `nexa run dolphin-mistral` | -| [codegemma](https://www.nexaai.com/google/codegemma-2b/gguf-q4_0/readme) | NLP | GGUF | `nexa run codegemma` | -| [codellama](https://www.nexaai.com/meta/CodeLlama-7b-Instruct/gguf-q2_K/readme) | NLP | GGUF | `nexa run codellama` | -| [deepseek-coder](https://www.nexaai.com/DeepSeek/deepseek-coder-1.3b-instruct/gguf-q4_0/readme) | NLP | GGUF | `nexa run deepseek-coder` | -| [phi2](https://www.nexaai.com/microsoft/Phi-2/gguf-q4_0/readme) | NLP | GGUF | `nexa run phi2` | -| [phi3](https://www.nexaai.com/microsoft/Phi-3-mini-128k-instruct/gguf-q4_0/readme) | NLP | GGUF/ONNX | `nexa run phi3` | -| 
[phi3.5](https://nexaai.com/microsoft/Phi-3.5-mini-instruct/gguf-q4_0/readme) | NLP | GGUF | `nexa run phi3.5` | -| [openelm](https://nexaai.com/apple/OpenELM-3B/gguf-q4_K_M/readme) | NLP | GGUF | `nexa run openelm` | -| [AMD-Llama-135m](https://nexaai.com/amd/AMD-Llama-135m/gguf-fp16/readme) | NLP | GGUF | `nexa run AMD-Llama-135m:fp16` | +| [omniaudio](https://nexa.ai/NexaAI/omniaudio/gguf-q4_0/readme) | AudioLM | GGUF | `nexa run omniaudio` | +| [qwen2audio](https://nexa.ai/Qwen/Qwen2-Audio-7.8B-Instruct/gguf-q4_K_M/readme) | AudioLM | GGUF | `nexa run qwen2audio` | +| [octopus-v2](https://www.nexaai.com/NexaAI/Octopus-v2/gguf-q4_0/readme) | Function Call | GGUF | `nexa run octopus-v2` | +| [octo-net](https://www.nexaai.com/NexaAI/Octo-net/gguf-q4_0/readme) | Text | GGUF | `nexa run octo-net` | +| [omniVLM](https://nexa.ai/NexaAI/omniVLM/gguf-fp16/readme) | Multimodal | GGUF | `nexa run omniVLM` | | [nanollava](https://www.nexaai.com/qnguyen3/nanoLLaVA/gguf-fp16/readme) | Multimodal | GGUF | `nexa run nanollava` | | [llava-phi3](https://www.nexaai.com/xtuner/llava-phi-3-mini/gguf-q4_0/readme) | Multimodal | GGUF | `nexa run llava-phi3` | | [llava-llama3](https://www.nexaai.com/xtuner/llava-llama-3-8b-v1.1/gguf-q4_0/readme) | Multimodal | GGUF | `nexa run llava-llama3` | | [llava1.6-mistral](https://www.nexaai.com/liuhaotian/llava-v1.6-mistral-7b/gguf-q4_0/readme) | Multimodal | GGUF | `nexa run llava1.6-mistral` | | [llava1.6-vicuna](https://www.nexaai.com/liuhaotian/llava-v1.6-vicuna-7b/gguf-q4_0/readme) | Multimodal | GGUF | `nexa run llava1.6-vicuna` | -| [stable-diffusion-v1-4](https://www.nexaai.com/runwayml/stable-diffusion-v1-4/gguf-q4_0/readme) | Computer Vision | GGUF | `nexa run sd1-4` | -| [stable-diffusion-v1-5](https://www.nexaai.com/runwayml/stable-diffusion-v1-5/gguf-q4_0/readme) | Computer Vision | GGUF/ONNX | `nexa run sd1-5` | -| [stable-diffusion-v2-1](https://nexaai.com/StabilityAI/stable-diffusion-v2-1/gguf-q4_0/readme) | Computer Vision | GGUF | `nexa run sd2-1` | -| [stable-diffusion-3-medium](https://nexaai.com/StabilityAI/stable-diffusion-3-medium/gguf-q4_0/readme) | Computer Vision | GGUF | `nexa run sd3` | -| [FLUX.1-schnell](https://nexaai.com/BlackForestLabs/FLUX.1-schnell/gguf-q4_0/readme) | Computer Vision | GGUF | `nexa run flux` | -| [lcm-dreamshaper](https://www.nexaai.com/SimianLuo/lcm-dreamshaper-v7/gguf-fp16/readme) | Computer Vision | GGUF/ONNX | `nexa run lcm-dreamshaper` | -| [hassaku-lcm](https://nexaai.com/stablediffusionapi/hassaku-hentai-model-v13-LCM/gguf-fp16/readme) | Computer Vision | GGUF | `nexa run hassaku-lcm` | -| [anything-lcm](https://www.nexaai.com/Linaqruf/anything-v30-LCM/gguf-fp16/readme) | Computer Vision | GGUF | `nexa run anything-lcm` | -| [faster-whisper-tiny](https://www.nexaai.com/Systran/faster-whisper-tiny/bin-cpu-fp16/readme) | Audio | BIN | `nexa run faster-whisper-tiny` | -| [faster-whisper-small](https://www.nexaai.com/Systran/faster-whisper-small/bin-cpu-fp16/readme) | Audio | BIN | `nexa run faster-whisper-small` | -| [faster-whisper-medium](https://www.nexaai.com/Systran/faster-whisper-medium/bin-cpu-fp16/readme) | Audio | BIN | `nexa run faster-whisper-medium` | -| [faster-whisper-base](https://www.nexaai.com/Systran/faster-whisper-base/bin-cpu-fp16/readme) | Audio | BIN | `nexa run faster-whisper-base` | -| [faster-whisper-large](https://www.nexaai.com/Systran/faster-whisper-large-v3/bin-cpu-fp16/readme) | Audio | BIN | `nexa run faster-whisper-large` | -| 
[whisper-large-v3-turbo](https://nexaai.com/Systran/faster-whisper-large-v3-turbo/bin-cpu-fp16/readme) | Audio | BIN | `nexa run faster-whisper-large-turbo` | -| [whisper-tiny.en](https://nexaai.com/openai/whisper-tiny.en/onnx-cpu-fp32/readme) | Audio | ONNX | `nexa run whisper-tiny.en` | -| [whisper-tiny](https://nexaai.com/openai/whisper-tiny/onnx-cpu-fp32/readme) | Audio | ONNX | `nexa run whisper-tiny` | -| [whisper-small.en](https://nexaai.com/openai/whisper-small.en/onnx-cpu-fp32/readme) | Audio | ONNX | `nexa run whisper-small.en` | -| [whisper-small](https://nexaai.com/openai/whisper-small/onnx-cpu-fp32/readme) | Audio | ONNX | `nexa run whisper-small` | -| [whisper-base.en](https://nexaai.com/openai/whisper-base.en/onnx-cpu-fp32/readme) | Audio | ONNX | `nexa run whisper-base.en` | -| [whisper-base](https://nexaai.com/openai/whisper-base/onnx-cpu-fp32/readme) | Audio | ONNX | `nexa run whisper-base` | +| [llama3.2](https://nexaai.com/meta/Llama3.2-3B-Instruct/gguf-q4_0/readme) | Text | GGUF | `nexa run llama3.2` | +| [llama3-uncensored](https://www.nexaai.com/Orenguteng/Llama3-8B-Lexi-Uncensored/gguf-q4_K_M/readme) | Text | GGUF | `nexa run llama3-uncensored` | +| [gemma2](https://www.nexaai.com/google/gemma-2-2b-instruct/gguf-q4_0/readme) | Text | GGUF | `nexa run gemma2` | +| [qwen2.5](https://www.nexaai.com/Qwen/Qwen2.5-1.5B-Instruct/gguf-q4_0/readme) | Text | GGUF | `nexa run qwen2.5` | +| [mathqwen](https://nexaai.com/Qwen/Qwen2.5-Math-1.5B-Instruct/gguf-q4_0/readme) | Text | GGUF | `nexa run mathqwen` | +| [codeqwen](https://www.nexaai.com/Qwen/CodeQwen1.5-7B-Instruct/gguf-q4_0/readme) | Text | GGUF | `nexa run codeqwen` | +| [mistral](https://www.nexaai.com/mistralai/Mistral-7B-Instruct-v0.3/gguf-q4_0/readme) | Text | GGUF/ONNX | `nexa run mistral` | +| [deepseek-coder](https://www.nexaai.com/DeepSeek/deepseek-coder-1.3b-instruct/gguf-q4_0/readme) | Text | GGUF | `nexa run deepseek-coder` | +| [phi3.5](https://nexaai.com/microsoft/Phi-3.5-mini-instruct/gguf-q4_0/readme) | Text | GGUF | `nexa run phi3.5` | +| [openelm](https://nexaai.com/apple/OpenELM-3B/gguf-q4_K_M/readme) | Text | GGUF | `nexa run openelm` | +| [stable-diffusion-v2-1](https://nexaai.com/StabilityAI/stable-diffusion-v2-1/gguf-q4_0/readme) | Image Generation | GGUF | `nexa run sd2-1` | +| [stable-diffusion-3-medium](https://nexaai.com/StabilityAI/stable-diffusion-3-medium/gguf-q4_0/readme) | Image Generation | GGUF | `nexa run sd3` | +| [FLUX.1-schnell](https://nexaai.com/BlackForestLabs/FLUX.1-schnell/gguf-q4_0/readme) | Image Generation | GGUF | `nexa run flux` | +| [lcm-dreamshaper](https://www.nexaai.com/SimianLuo/lcm-dreamshaper-v7/gguf-fp16/readme) | Image Generation | GGUF/ONNX | `nexa run lcm-dreamshaper` | +| [whisper-large-v3-turbo](https://nexaai.com/Systran/faster-whisper-large-v3-turbo/bin-cpu-fp16/readme) | Speech-to-Text | BIN | `nexa run faster-whisper-large-turbo` | +| [whisper-tiny.en](https://nexaai.com/openai/whisper-tiny.en/onnx-cpu-fp32/readme) | Speech-to-Text | ONNX | `nexa run whisper-tiny.en` | | [mxbai-embed-large-v1](https://nexa.ai/mixedbread-ai/mxbai-embed-large-v1/gguf-fp16/readme) | Embedding | GGUF | `nexa embed mxbai` | | [nomic-embed-text-v1.5](https://nexa.ai/nomic-ai/nomic-embed-text-v1.5/gguf-fp16/readme) | Embedding | GGUF | `nexa embed nomic` | -| [all-MiniLM-L6-v2](https://nexa.ai/sentence-transformers/all-MiniLM-L6-v2/gguf-fp16/readme) | Embedding | GGUF | `nexa embed all-MiniLM-L6-v2:fp16` | | 
[all-MiniLM-L12-v2](https://nexa.ai/sentence-transformers/all-MiniLM-L12-v2/gguf-fp16/readme) | Embedding | GGUF | `nexa embed all-MiniLM-L12-v2:fp16` | +| [bark-small](https://nexa.ai/suno/bark-small/gguf-fp16/readme) | Text-to-Speech | GGUF | `nexa run bark-small:fp16` | + +## Run Models from 🤗 HuggingFace or 🤖 ModelScope -## CLI Reference +You can pull, convert (to .gguf), quantize and run [llama.cpp supported](https://github.com/ggerganov/llama.cpp#description) text generation models from HF or MS with Nexa SDK. + +### Run .gguf File + +Use `nexa run -hf ` or `nexa run -ms ` to run models with provided .gguf files: + +```bash +nexa run -hf Qwen/Qwen2.5-Coder-7B-Instruct-GGUF +``` + +```bash +nexa run -ms Qwen/Qwen2.5-Coder-7B-Instruct-GGUF +``` + +> **Note:** You will be prompted to select a single .gguf file. If your desired quantization version has multiple split files (like fp16-00001-of-00004), please use Nexa's conversion tool (see below) to convert and quantize the model locally. + +### Convert .safetensors Files + +Install [Nexa Python package](https://github.com/NexaAI/nexa-sdk?tab=readme-ov-file#install-option-2-python-package), and install Nexa conversion tool with `pip install "nexaai[convert]"`, then convert models from huggingface with `nexa convert `: + +```bash +nexa convert HuggingFaceTB/SmolLM2-135M-Instruct +``` + +Or you can convert models from ModelScope with `nexa convert -ms `: + +```bash +nexa convert -ms Qwen/Qwen2.5-7B-Instruct +``` + +> **Note:** Check our [leaderboard](https://nexa.ai/leaderboard) for performance benchmarks of different quantized versions of mainstream language models and [HuggingFace docs](https://huggingface.co/docs/optimum/en/concept_guides/quantization) to learn about quantization options. + +📋 You can view downloaded and converted models with `nexa list` + +## Documentation + +> [!NOTE] +> +> 1. If you want to use ONNX model, just replace `pip install nexaai` with `pip install "nexaai[onnx]"` in provided commands. +> 2. If you want to run benchmark evaluation, just replace `pip install nexaai` with `pip install "nexaai[eval]"` in provided commands. +> 3. If you want to convert and quantize huggingface models to GGUF models, just replace `pip install nexaai` with `pip install "nexaai[convert]"` in provided commands. +> 4. For Chinese developers, we recommend you to use Tsinghua Open Source Mirror as extra index url, just replace `--extra-index-url https://pypi.org/simple` with `--extra-index-url https://pypi.tuna.tsinghua.edu.cn/simple` in provided commands. + +### CLI Reference Here's a brief overview of the main CLI commands: @@ -325,15 +319,22 @@ Here's a brief overview of the main CLI commands: For detailed information on CLI commands and usage, please refer to the [CLI Reference](CLI.md) document. -## Start Local Server +### Start Local Server To start a local server using models on your local computer, you can use the `nexa server` command. For detailed information on server setup, API endpoints, and usage examples, please refer to the [Server Reference](SERVER.md) document. +### Swift Package + +**[Swift SDK](https://github.com/NexaAI/nexa-sdk/tree/main/swift):** Provides a Swifty API, allowing Swift developers to easily integrate and use llama.cpp models in their projects. 
+
+[**More Docs**](https://docs.nexa.ai/)
+
## Acknowledgements

We would like to thank the following projects:

- [llama.cpp](https://github.com/ggerganov/llama.cpp)
- [stable-diffusion.cpp](https://github.com/leejet/stable-diffusion.cpp)
+- [bark.cpp](https://github.com/PABannier/bark.cpp)
- [optimum](https://github.com/huggingface/optimum)
diff --git a/SERVER.md b/SERVER.md
index 10462e8c..b75efa45 100644
--- a/SERVER.md
+++ b/SERVER.md
@@ -8,9 +8,10 @@ usage: nexa server [-h] [--host HOST] [--port PORT] [--reload] model_path
### Options:
-- `-lp, --local_path`: Indicate that the model path provided is the local path, must be used with -mt
-- `-mt, --model_type`: Indicate the model running type, must be used with -lp or -hf, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO]
-- `-hf, --huggingface`: Load model from Hugging Face Hub, must be used with -mt
+- `-lp, --local_path`: Indicate that the model path provided is the local path
+- `-mt, --model_type`: Indicate the model running type, must be used with -lp or -hf or -ms, choose from [NLP, COMPUTER_VISION, MULTIMODAL, AUDIO]
+- `-hf, --huggingface`: Load model from Hugging Face Hub
+- `-ms, --modelscope`: Load model from ModelScope Hub
- `--host`: Host to bind the server to
- `--port`: Port to bind the server to
- `--reload`: Enable automatic reloading on code changes
diff --git a/android/llama.android/.gitignore b/android/llama.android/.gitignore
new file mode 100644
index 00000000..347e252e
--- /dev/null
+++ b/android/llama.android/.gitignore
@@ -0,0 +1,33 @@
+# Gradle files
+.gradle/
+build/
+
+# Local configuration file (sdk path, etc)
+local.properties
+
+# Log/OS Files
+*.log
+
+# Android Studio generated files and folders
+captures/
+.externalNativeBuild/
+.cxx/
+*.apk
+output.json
+
+# IntelliJ
+*.iml
+.idea/
+misc.xml
+deploymentTargetDropDown.xml
+render.experimental.xml
+
+# Keystore files
+*.jks
+*.keystore
+
+# Google Services (e.g. APIs or Firebase)
+google-services.json
+
+# Android Profiling
+*.hprof
diff --git a/android/llama.android/README.md b/android/llama.android/README.md
new file mode 100644
index 00000000..aa91234c
--- /dev/null
+++ b/android/llama.android/README.md
@@ -0,0 +1,54 @@
+# Nexa
+
+**Nexa** is a Kotlin wrapper for the [llama.cpp](https://github.com/ggerganov/llama.cpp.git) library, offering a convenient Kotlin API for Android developers. It allows seamless integration of llama.cpp models into Android applications.
+**NOTE:** Currently, Nexa supports Vision-Language Model (VLM) inference capabilities.
+
+## Installation
+
+To add Nexa to your Android project, follow these steps:
+
+- Create a libs folder in your project’s root directory.
+- Copy the .aar file into the libs folder.
+- Add the dependency to your build.gradle file:
+
+```
+implementation files("libs/com.nexa.aar")
+```
+
+## Usage
+### 1. Initialize NexaVlmInference with model path and projector path
+
+Create a configuration and initialize NexaVlmInference with the paths to your model and projector files:
+
+```kotlin
+nexaVlmInference = NexaVlmInference(pathToModel,
+ mmprojectorPath, imagePath,
+ maxNewTokens = 128,
+ stopWords = listOf(""))
+nexaVlmInference.loadModel()
+```
+
+### 2. Completion API
+
+#### Streaming Mode
+
+```kotlin
+nexaVlmInference.createCompletionStream(prompt, imagePath)
+ ?.catch {
+ print(it.message)
+ }
+ ?.collect { print(it) }
+```
+
+### 3. Release all resources
+```kotlin
+nexaVlmInference.dispose()
+```
+
+## Quick Start
+
+Open the [android test project](./app-java) folder in Android Studio and run the project.
+ +## Download Models + +You can download models from the [Nexa AI ModelHub](https://nexa.ai/models). \ No newline at end of file diff --git a/android/llama.android/app-java/.gitignore b/android/llama.android/app-java/.gitignore new file mode 100644 index 00000000..42df58a2 --- /dev/null +++ b/android/llama.android/app-java/.gitignore @@ -0,0 +1,2 @@ +/build +!*.png \ No newline at end of file diff --git a/android/llama.android/app-java/build.gradle b/android/llama.android/app-java/build.gradle new file mode 100644 index 00000000..2729f317 --- /dev/null +++ b/android/llama.android/app-java/build.gradle @@ -0,0 +1,52 @@ +plugins { + id 'com.android.application' + id 'kotlin-android' +} + +android { + namespace 'ai.nexa.app_java' + compileSdk 34 + + defaultConfig { + applicationId "ai.nexa.app_java" + minSdk 33 + targetSdk 34 + versionCode 1 + versionName "1.0" + + testInstrumentationRunner "androidx.test.runner.AndroidJUnitRunner" + } + + buildTypes { + release { + minifyEnabled false + proguardFiles getDefaultProguardFile('proguard-android-optimize.txt'), 'proguard-rules.pro' + } + } + compileOptions { + sourceCompatibility JavaVersion.VERSION_17 // or VERSION_1_8 + targetCompatibility JavaVersion.VERSION_17 // or VERSION_1_8 + } + + kotlinOptions { + jvmTarget = "17" // or "1.8" + } +} + +dependencies { + + implementation 'androidx.appcompat:appcompat:1.7.0' + implementation 'com.google.android.material:material:1.12.0' + testImplementation 'junit:junit:4.13.2' + androidTestImplementation 'androidx.test.ext:junit:1.2.1' + androidTestImplementation 'androidx.test.espresso:espresso-core:3.6.1' + + implementation "org.jetbrains.kotlin:kotlin-stdlib:1.9.20" + implementation "org.jetbrains.kotlinx:kotlinx-coroutines-android:1.7.3" + + implementation 'com.github.bumptech.glide:glide:4.16.0' + annotationProcessor 'com.github.bumptech.glide:compiler:4.16.0' + + implementation project(":llama") + // implementation files("libs/com.nexa.aar") +} \ No newline at end of file diff --git a/android/llama.android/app-java/proguard-rules.pro b/android/llama.android/app-java/proguard-rules.pro new file mode 100644 index 00000000..481bb434 --- /dev/null +++ b/android/llama.android/app-java/proguard-rules.pro @@ -0,0 +1,21 @@ +# Add project specific ProGuard rules here. +# You can control the set of applied configuration files using the +# proguardFiles setting in build.gradle. +# +# For more details, see +# http://developer.android.com/guide/developing/tools/proguard.html + +# If your project uses WebView with JS, uncomment the following +# and specify the fully qualified class name to the JavaScript interface +# class: +#-keepclassmembers class fqcn.of.javascript.interface.for.webview { +# public *; +#} + +# Uncomment this to preserve the line number information for +# debugging stack traces. +#-keepattributes SourceFile,LineNumberTable + +# If you keep the line number information, uncomment this to +# hide the original source file name. 
+#-renamesourcefileattribute SourceFile \ No newline at end of file diff --git a/android/llama.android/app-java/src/androidTest/java/ai/nexa/app_java/ExampleInstrumentedTest.java b/android/llama.android/app-java/src/androidTest/java/ai/nexa/app_java/ExampleInstrumentedTest.java new file mode 100644 index 00000000..7f3c2198 --- /dev/null +++ b/android/llama.android/app-java/src/androidTest/java/ai/nexa/app_java/ExampleInstrumentedTest.java @@ -0,0 +1,26 @@ +package ai.nexa.app_java; + +import android.content.Context; + +import androidx.test.platform.app.InstrumentationRegistry; +import androidx.test.ext.junit.runners.AndroidJUnit4; + +import org.junit.Test; +import org.junit.runner.RunWith; + +import static org.junit.Assert.*; + +/** + * Instrumented test, which will execute on an Android device. + * + * @see Testing documentation + */ +@RunWith(AndroidJUnit4.class) +public class ExampleInstrumentedTest { + @Test + public void useAppContext() { + // Context of the app under test. + Context appContext = InstrumentationRegistry.getInstrumentation().getTargetContext(); + assertEquals("ai.nexa.app_java", appContext.getPackageName()); + } +} \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/AndroidManifest.xml b/android/llama.android/app-java/src/main/AndroidManifest.xml new file mode 100644 index 00000000..8aaea0a2 --- /dev/null +++ b/android/llama.android/app-java/src/main/AndroidManifest.xml @@ -0,0 +1,49 @@ + + + + + + + + + + + + + + + > + + + + + + + + + + + + + + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/java/ai/nexa/app_java/ImagePathHelper.java b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/ImagePathHelper.java new file mode 100644 index 00000000..a8b0ef00 --- /dev/null +++ b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/ImagePathHelper.java @@ -0,0 +1,112 @@ +package ai.nexa.app_java; + +import android.content.Context; +import android.database.Cursor; +import android.net.Uri; +import android.provider.DocumentsContract; +import android.provider.MediaStore; +import android.util.Log; + +import java.io.File; +import java.io.FileOutputStream; +import java.io.IOException; +import java.io.InputStream; +import java.io.OutputStream; + +public class ImagePathHelper { + private static final String TAG = "MessageProcessor"; + private final Context context; + + public ImagePathHelper(Context context) { + this.context = context; + } + + public String getPathFromUri(String uriString) { + try { + Uri uri = Uri.parse(uriString); + + // Handle "content://" scheme + if ("content".equals(uri.getScheme())) { + // Handle Google Photos and other document providers + if (DocumentsContract.isDocumentUri(context, uri)) { + final String docId = DocumentsContract.getDocumentId(uri); + + // MediaStore documents + if ("com.android.providers.media.documents".equals(uri.getAuthority())) { + final String[] split = docId.split(":"); + final String type = split[0]; + Uri contentUri = null; + + if ("image".equals(type)) { + contentUri = MediaStore.Images.Media.EXTERNAL_CONTENT_URI; + } + + final String selection = "_id=?"; + final String[] selectionArgs = new String[]{split[1]}; + return getDataColumn(context, contentUri, selection, selectionArgs); + } + } + // MediaStore (general case) + return getDataColumn(context, uri, null, null); + } + // Handle "file://" scheme + else if ("file".equals(uri.getScheme())) { + return uri.getPath(); + } + // Handle absolute path + else if (new File(uriString).exists()) { + return 
uriString;
+            }
+
+            return null;
+        } catch (Exception e) {
+            Log.e(TAG, "Error getting path from URI: " + uriString, e);
+            return null;
+        }
+    }
+
+    public String copyUriToPrivateFile(Context context, String uriString) throws IOException {
+        // Convert the string back into a Uri
+        Uri uri = Uri.parse(uriString);
+
+        // App-private directory
+        File privateDir = context.getExternalFilesDir("images");
+        if (privateDir == null) {
+            throw new IOException("Private directory not available");
+        }
+
+        // Create the destination file
+        File destFile = new File(privateDir, "temp_image_" + System.currentTimeMillis() + ".jpg");
+
+        try (InputStream inputStream = context.getContentResolver().openInputStream(uri);
+             OutputStream outputStream = new FileOutputStream(destFile)) {
+
+            if (inputStream == null) {
+                throw new IOException("Failed to open URI input stream");
+            }
+
+            // Read the data and write it to the destination file
+            byte[] buffer = new byte[4096];
+            int bytesRead;
+            while ((bytesRead = inputStream.read(buffer)) != -1) {
+                outputStream.write(buffer, 0, bytesRead);
+            }
+        }
+
+        // Return the file path
+        return destFile.getAbsolutePath();
+    }
+
+    private String getDataColumn(Context context, Uri uri, String selection, String[] selectionArgs) {
+        final String[] projection = {MediaStore.Images.Media.DATA};
+        try (Cursor cursor = context.getContentResolver().query(uri, projection, selection, selectionArgs, null)) {
+            if (cursor != null && cursor.moveToFirst()) {
+                final int columnIndex = cursor.getColumnIndexOrThrow(MediaStore.Images.Media.DATA);
+                return cursor.getString(columnIndex);
+            }
+        } catch (Exception e) {
+            Log.e(TAG, "Error getting data column", e);
+        }
+        return null;
+    }
+}
diff --git a/android/llama.android/app-java/src/main/java/ai/nexa/app_java/KotlinFlowHelper.kt b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/KotlinFlowHelper.kt
new file mode 100644
index 00000000..0183ff14
--- /dev/null
+++ b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/KotlinFlowHelper.kt
@@ -0,0 +1,44 @@
+package ai.nexa.app_java
+
+import kotlinx.coroutines.CoroutineScope
+import kotlinx.coroutines.Dispatchers
+import kotlinx.coroutines.cancelChildren
+import kotlinx.coroutines.flow.Flow
+import kotlinx.coroutines.launch
+import kotlinx.coroutines.withContext
+
+class KotlinFlowHelper {
+    private val scope = CoroutineScope(Dispatchers.IO)
+
+    fun collectFlow(
+        flow: Flow<String>, // Added missing flow parameter
+        onToken: (String) -> Unit,
+        onComplete: (String) -> Unit,
+        onError: (String) -> Unit
+    ) {
+        scope.launch {
+            try {
+                val fullResponse = StringBuilder()
+                withContext(Dispatchers.IO) {
+                    flow.collect { value ->
+                        fullResponse.append(value)
+                        withContext(Dispatchers.Main) {
+                            onToken(value)
+                        }
+                    }
+                }
+                withContext(Dispatchers.Main) {
+                    onComplete(fullResponse.toString())
+                }
+            } catch (e: Exception) {
+                withContext(Dispatchers.Main) {
+                    onError(e.message ?: "Unknown error")
+                }
+            }
+        }
+    }
+
+    fun cancel() {
+        scope.coroutineContext.cancelChildren()
+    }
+}
\ No newline at end of file
diff --git a/android/llama.android/app-java/src/main/java/ai/nexa/app_java/KotlinJavaUtils.kt b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/KotlinJavaUtils.kt
new file mode 100644
index 00000000..1fc8437c
--- /dev/null
+++ b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/KotlinJavaUtils.kt
@@ -0,0 +1,11 @@
+package ai.nexa.app_java
+
+import java.util.function.Consumer
+
+object KotlinJavaUtils {
+    @JvmStatic
+    fun toKotlinCallback(callback: Consumer<String>): (String) -> Unit = { value ->
+        callback.accept(value)
+        Unit
+    }
+}
\ No newline at end of file
diff --git
a/android/llama.android/app-java/src/main/java/ai/nexa/app_java/LlamaBridge.java b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/LlamaBridge.java new file mode 100644 index 00000000..e48ec8d5 --- /dev/null +++ b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/LlamaBridge.java @@ -0,0 +1,283 @@ +package ai.nexa.app_java; + +import android.content.Context; +import com.nexa.NexaVlmInference; +import android.util.Log; + +import java.io.IOException; +import java.util.ArrayList; +import java.util.Arrays; +import java.util.concurrent.CancellationException; +import java.util.concurrent.ExecutorService; +import java.util.concurrent.Executors; + +import kotlin.Unit; +import kotlin.coroutines.Continuation; +import kotlin.jvm.functions.Function1; +import kotlinx.coroutines.BuildersKt; +import kotlinx.coroutines.CoroutineStart; +import kotlinx.coroutines.Dispatchers; +import kotlinx.coroutines.GlobalScope; +import kotlinx.coroutines.Job; +import kotlinx.coroutines.flow.Flow; +import kotlinx.coroutines.flow.FlowCollector; + +public class LlamaBridge { + private static final String TAG = "LlamaBridge"; + private final Context context; + private final ExecutorService executor; + private final MessageHandler messageHandler; + private final VlmModelManager modelManager; + private final ImagePathHelper imagePathHelper; + private NexaVlmInference nexaVlmInference; + private boolean isModelLoaded = false; + + private final KotlinFlowHelper flowHelper = new KotlinFlowHelper(); + + // Default inference parameters + private static final float DEFAULT_TEMPERATURE = 1.0f; + private static final int DEFAULT_MAX_TOKENS = 64; + private static final int DEFAULT_TOP_K = 50; + private static final float DEFAULT_TOP_P = 0.9f; + + public interface InferenceCallback { + void onStart(); + void onToken(String token); + void onComplete(String fullResponse); + void onError(String error); + } + + public LlamaBridge(Context context, MessageHandler messageHandler) { + this.context = context; + this.messageHandler = messageHandler; + this.executor = Executors.newSingleThreadExecutor(); + this.modelManager = new VlmModelManager(context); + this.imagePathHelper = new ImagePathHelper(context); + } + + public boolean areModelsAvailable() { + return modelManager.areModelsAvailable(); + } + + public void loadModel() { + executor.execute(() -> { + try { + if (!modelManager.areModelsAvailable()) { + throw new IOException("Required model files are not available"); + } + + String modelPath = modelManager.getTextModelPath(); + String projectorPath = modelManager.getMmProjModelPath(); + + Log.d(TAG, "Loading model from: " + modelPath); + Log.d(TAG, "Loading projector from: " + projectorPath); + + // Create with default values for optional parameters + nexaVlmInference = new NexaVlmInference( + modelPath, // modelPath + projectorPath, // projectorPath + "", // imagePath (empty string as default) + new ArrayList<>(Arrays.asList("")), // stopWords (empty list) + DEFAULT_TEMPERATURE, // temperature + DEFAULT_MAX_TOKENS, // maxNewTokens + DEFAULT_TOP_K, // topK + DEFAULT_TOP_P // topP + ); + nexaVlmInference.loadModel(); + isModelLoaded = true; + + Log.d(TAG, "Model loaded successfully."); +// messageHandler.addMessage(new MessageModal("Model loaded successfully", "assistant", null)); + } catch (Exception e) { + Log.e(TAG, "Failed to load model", e); + messageHandler.addMessage(new MessageModal("Error loading model: " + e.getMessage(), "assistant", null)); + } + }); + } + +// public void processMessage(String message, 
String imageUri, InferenceCallback callback) { +// if (!isModelLoaded) { +// callback.onError("Model not loaded yet"); +// return; +// } +// +// try { +// // Add user message first +// MessageModal userMessage = new MessageModal(message, "user", imageUri); +// messageHandler.addMessage(userMessage); +// +// // Create an initial empty assistant message +// MessageModal assistantMessage = new MessageModal("", "assistant", null); +// messageHandler.addMessage(assistantMessage); +// +// // Convert image URI to absolute path +// String imageAbsolutePath = imagePathHelper.getPathFromUri(imageUri); +// +// Flow flow = nexaVlmInference.createCompletionStream( +// message, +// imageAbsolutePath, +// new ArrayList<>(), +// DEFAULT_TEMPERATURE, +// DEFAULT_MAX_TOKENS, +// DEFAULT_TOP_K, +// DEFAULT_TOP_P +// ); +// +// if (flow != null) { +// CoroutineScope scope = CoroutineScopeKt.CoroutineScope(Dispatchers.getMain()); +// +// Job job = FlowKt.launchIn( +// FlowKt.onEach(flow, new Function2, Object>() { +// @Override +// public Object invoke(String token, Continuation continuation) { +// messageHandler.updateLastAssistantMessage(token); +// callback.onToken(token); +// return Unit.INSTANCE; +// } +// }), +// scope +// ); +// } else { +// messageHandler.finalizeLastAssistantMessage("Error: Failed to create completion stream"); +// callback.onError("Failed to create completion stream"); +// } +// } catch (Exception e) { +// Log.e(TAG, "Error processing message", e); +// messageHandler.finalizeLastAssistantMessage("Error: " + e.getMessage()); +// callback.onError(e.getMessage()); +// } +// } + + public void processMessage(String message, String imageUri, InferenceCallback callback) { + if (!isModelLoaded) { + callback.onError("Model not loaded yet"); + return; + } + + String imageAbsolutePath = null; + try { + imageAbsolutePath = imagePathHelper.copyUriToPrivateFile(context, imageUri); + } catch (IOException e) { + callback.onError("Failed to process image: " + e.getMessage()); + return; + } + + final String imagePath = imageAbsolutePath; + MessageModal assistantMessage = new MessageModal("", "bot", null); + messageHandler.addMessage(assistantMessage); + + try { + Flow flow = nexaVlmInference.createCompletionStream( + message, + imagePath, + new ArrayList<>(Arrays.asList("")), + DEFAULT_TEMPERATURE, + DEFAULT_MAX_TOKENS, + DEFAULT_TOP_K, + DEFAULT_TOP_P + ); + + callback.onStart(); + StringBuilder fullResponse = new StringBuilder(); + + Job collectJob = BuildersKt.launch( + GlobalScope.INSTANCE, + Dispatchers.getIO(), + CoroutineStart.DEFAULT, + (coroutineScope, continuation) -> { + flow.collect(new FlowCollector() { + @Override + public Object emit(String token, Continuation continuation) { + fullResponse.append(token); + callback.onToken(token); + return Unit.INSTANCE; + } + }, continuation); + callback.onComplete(fullResponse.toString()); + return Unit.INSTANCE; + } + ); + + collectJob.invokeOnCompletion(new Function1() { + @Override + public Unit invoke(Throwable throwable) { + if (throwable != null && !(throwable instanceof CancellationException)) { + callback.onError("Stream collection failed: " + throwable.getMessage()); + } + return Unit.INSTANCE; + } + }); + + } catch (Exception e) { + Log.e(TAG, "Inference failed", e); + callback.onError(e.getMessage()); + } + } + + public void cleanup() { + flowHelper.cancel(); + } + +// public void processMessageWithParams( +// String message, +// String imageUri, +// float temperature, +// int maxTokens, +// int topK, +// float topP, +// InferenceCallback 
callback) { +// +// if (!isModelLoaded) { +// callback.onError("Model not loaded yet"); +// return; +// } +// +// executor.execute(() -> { +// StringBuilder fullResponse = new StringBuilder(); +// try { +// callback.onStart(); +// +// Flow completionStream = nexaVlmInference.createCompletionStream( +// message, +// imageUri, +// new ArrayList<>(), +// temperature, +// maxTokens, +// topK, +// topP +// ); +// +// completionStream.collect(new FlowCollector() { +// @Override +// public Object emit(String value, Continuation continuation) { +// fullResponse.append(value); +// callback.onToken(value); +// return Unit.INSTANCE; +// } +// }); +// +// callback.onComplete(fullResponse.toString()); +// +// } catch (Exception e) { +// Log.e(TAG, "Inference failed", e); +// callback.onError(e.getMessage()); +// } +// }); +// } + + + public void shutdown() { + if (nexaVlmInference != null) { + executor.execute(() -> { + try { + nexaVlmInference.dispose(); + } catch (Exception e) { + Log.e(TAG, "Error closing inference", e); + } + nexaVlmInference = null; + isModelLoaded = false; + }); + } + executor.shutdown(); + } +} \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MainActivity.java b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MainActivity.java new file mode 100644 index 00000000..29be7214 --- /dev/null +++ b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MainActivity.java @@ -0,0 +1,345 @@ +package ai.nexa.app_java; + +import android.Manifest; +import android.content.Context; +import android.content.Intent; +import android.content.pm.PackageManager; +import android.net.Uri; +import android.os.Bundle; +import android.os.Message; +import android.provider.MediaStore; +import android.speech.RecognizerIntent; +import android.speech.SpeechRecognizer; +import android.util.Log; +import android.view.MotionEvent; +import android.view.View; +import android.view.inputmethod.InputMethodManager; +import android.widget.EditText; +import android.widget.ImageButton; +import android.widget.LinearLayout; +import android.widget.TextView; +import android.widget.Toast; + +import androidx.annotation.NonNull; +import androidx.appcompat.app.AppCompatActivity; +import androidx.core.app.ActivityCompat; +import androidx.recyclerview.widget.LinearLayoutManager; +import androidx.recyclerview.widget.RecyclerView; + +import java.util.ArrayList; +import java.util.List; +import java.util.Locale; + +public class MainActivity extends AppCompatActivity { + + private static final String TAG = "ChatApp"; + private static final int PICK_IMAGE_REQUEST = 30311; + private static final int REQUEST_RECORD_AUDIO_PERMISSION = 200; + private static final int READ_EXTERNAL_STORAGE_PERMISSION = 303; + + private RecyclerView chatsRV; + private ImageButton selectImageButton; + private ImageButton sendMsgIB; + private EditText userMsgEdt; + private String justSelectedImageUri; + + private LinearLayout linearLayout; + private TextView titleAfterChatTextView; + private RecyclerView recyclerView; + + private ArrayList messageModalArrayList; + private MessageRVAdapter messageRVAdapter; + private MessageHandler messageHandler; + private LlamaBridge llamaBridge; + private SpeechRecognizer speechRecognizer; + + @Override + protected void onCreate(Bundle savedInstanceState) { + super.onCreate(savedInstanceState); + setContentView(R.layout.activity_main); + + Log.d(TAG, "onCreate: Starting MainActivity"); + + initializeViews(); + setupRecyclerView(); + 
initializeLlamaBridge(); + createSpeechRecognizerIntent(); + setupClickListeners(); + + Log.d(TAG, "onCreate: MainActivity setup complete"); + } + + private void initializeViews() { + chatsRV = findViewById(R.id.idRVChats); + selectImageButton = findViewById(R.id.btnUploadImage); + sendMsgIB = findViewById(R.id.idIBSend); + userMsgEdt = findViewById(R.id.idEdtMessage); + linearLayout = findViewById(R.id.idLayoutBeforeChat); + titleAfterChatTextView = findViewById(R.id.textView); + recyclerView = findViewById(R.id.idRVChats); + } + + private void setupRecyclerView() { + messageModalArrayList = new ArrayList<>(); + messageRVAdapter = new MessageRVAdapter(messageModalArrayList, this); + chatsRV.setLayoutManager(new LinearLayoutManager(this, RecyclerView.VERTICAL, false)); + chatsRV.setAdapter(messageRVAdapter); + messageHandler = new MessageHandler(messageModalArrayList, messageRVAdapter, recyclerView); + } + + private void initializeLlamaBridge() { + llamaBridge = new LlamaBridge(this, messageHandler); + if (!llamaBridge.areModelsAvailable()) { + Toast.makeText(this, "Required model files are not available", Toast.LENGTH_LONG).show(); + return; + } + llamaBridge.loadModel(); + } + + private void setupClickListeners() { + selectImageButton.setOnClickListener(v -> { + Intent intent = new Intent(Intent.ACTION_PICK, MediaStore.Images.Media.EXTERNAL_CONTENT_URI); + startActivityForResult(intent, PICK_IMAGE_REQUEST); + }); + + sendMsgIB.setOnClickListener(v -> { + hideKeyboard(v); + sendTextMessage(); + }); + } + + private void updateChatBotDisplay() { + linearLayout.setVisibility(View.GONE); + titleAfterChatTextView.setVisibility(View.VISIBLE); + recyclerView.setVisibility(View.VISIBLE); + } + + private void sendTextMessage() { + updateChatBotDisplay(); + + String userMessage = userMsgEdt.getText().toString().trim(); + if (!userMessage.isEmpty()) { + Log.d(TAG, "Sending message: " + userMessage); + messageHandler.addMessage(new MessageModal(userMessage, "user", null)); + + if (justSelectedImageUri == null) { + messageHandler.addMessage(new MessageModal("Please select an image first.", "bot", null)); + return; + } + + // Use LlamaBridge for inference + llamaBridge.processMessage(userMessage, justSelectedImageUri, new LlamaBridge.InferenceCallback() { + @Override + public void onStart() { + // Optional: Show loading indicator + } + + @Override + public void onToken(String token) { + // Update the UI with each token as it comes in + runOnUiThread(() -> { + messageHandler.updateLastBotMessage(token); + }); + } + + @Override + public void onComplete(String fullResponse) { + // Final update with complete response + runOnUiThread(() -> { + messageHandler.finalizeLastBotMessage(fullResponse); + }); + } + + @Override + public void onError(String error) { + runOnUiThread(() -> { + Toast.makeText(MainActivity.this, "Error: " + error, Toast.LENGTH_SHORT).show(); + messageHandler.addMessage(new MessageModal("Error processing message: " + error, "assistant", null)); + }); + } + }); + + userMsgEdt.setText(""); // Clear the input field after sending + justSelectedImageUri = null; // Clear the image URI after sending + } else { + Toast.makeText(MainActivity.this, "Please enter your message.", Toast.LENGTH_SHORT).show(); + } + } + + private void sendImageAsMessage(String imageUri) { + updateChatBotDisplay(); + messageHandler.addMessage(new MessageModal("", "user", imageUri)); + justSelectedImageUri = imageUri; + } + + @Override + protected void onDestroy() { + super.onDestroy(); + if (llamaBridge != null) { + 
llamaBridge.shutdown(); + } + if (speechRecognizer != null) { + speechRecognizer.destroy(); + } + } + + private void createSpeechRecognizerIntent() { + requestMicrophonePermission(); + + ImageButton btnStart = findViewById(R.id.btnStart); + + speechRecognizer = SpeechRecognizer.createSpeechRecognizer(this); + + Intent speechRecognizerIntent = new Intent(RecognizerIntent.ACTION_RECOGNIZE_SPEECH); + speechRecognizerIntent.putExtra(RecognizerIntent.EXTRA_LANGUAGE_MODEL, RecognizerIntent.LANGUAGE_MODEL_FREE_FORM); + speechRecognizerIntent.putExtra(RecognizerIntent.EXTRA_LANGUAGE, Locale.getDefault()); + speechRecognizerIntent.putExtra(RecognizerIntent.EXTRA_PARTIAL_RESULTS, true); + + speechRecognizer.setRecognitionListener(new android.speech.RecognitionListener() { + @Override + public void onReadyForSpeech(Bundle params) { + } + + @Override + public void onBeginningOfSpeech() { + } + + @Override + public void onRmsChanged(float rmsdB) { + } + + @Override + public void onBufferReceived(byte[] buffer) { + } + + @Override + public void onEndOfSpeech() { + } + + @Override + public void onError(int error) { + String errorMessage = getErrorText(error); + Log.d("SpeechRecognition", "Error occurred: " + errorMessage); + } + + public String getErrorText(int errorCode) { + String message; + switch (errorCode) { + case SpeechRecognizer.ERROR_AUDIO: + message = "Audio recording error"; + break; + case SpeechRecognizer.ERROR_CLIENT: + message = "Client side error"; + break; + case SpeechRecognizer.ERROR_INSUFFICIENT_PERMISSIONS: + message = "Insufficient permissions"; + break; + case SpeechRecognizer.ERROR_NETWORK: + message = "Network error"; + break; + case SpeechRecognizer.ERROR_NETWORK_TIMEOUT: + message = "Network timeout"; + break; + case SpeechRecognizer.ERROR_NO_MATCH: + message = "No match"; + break; + case SpeechRecognizer.ERROR_RECOGNIZER_BUSY: + message = "RecognitionService busy"; + break; + case SpeechRecognizer.ERROR_SERVER: + message = "Error from server"; + break; + case SpeechRecognizer.ERROR_SPEECH_TIMEOUT: + message = "No speech input"; + break; + default: + message = "Didn't understand, please try again."; + break; + } + return message; + } + + @Override + public void onResults(Bundle results) { + ArrayList matches = results.getStringArrayList(SpeechRecognizer.RESULTS_RECOGNITION); + if (matches != null && !matches.isEmpty()) { + userMsgEdt.setText(matches.get(0)); // Set the recognized text to the EditText + sendTextMessage(); + } + } + + @Override + public void onPartialResults(Bundle partialResults) { + // This is called for partial results + ArrayList partialMatches = partialResults.getStringArrayList(SpeechRecognizer.RESULTS_RECOGNITION); + if (partialMatches != null && !partialMatches.isEmpty()) { + userMsgEdt.setText(partialMatches.get(0)); // Update EditText with the partial result + } + } + + @Override + public void onEvent(int eventType, Bundle params) { + } + }); + + btnStart.setOnTouchListener(new View.OnTouchListener() { + @Override + public boolean onTouch(View v, MotionEvent event) { + switch (event.getAction()) { + case MotionEvent.ACTION_DOWN: + // Button is pressed + speechRecognizer.startListening(speechRecognizerIntent); + return true; // Return true to indicate the event was handled + case MotionEvent.ACTION_UP: + // Button is released + speechRecognizer.stopListening(); + return true; // Return true to indicate the event was handled + } + return false; // Return false for other actions + } + }); + } + + private void requestMicrophonePermission() { + 
ActivityCompat.requestPermissions(this, new String[]{Manifest.permission.RECORD_AUDIO}, REQUEST_RECORD_AUDIO_PERMISSION); + } + + @Override + public void onRequestPermissionsResult(int requestCode, @NonNull String[] permissions, @NonNull int[] grantResults) { + super.onRequestPermissionsResult(requestCode, permissions, grantResults); + switch (requestCode) { + case READ_EXTERNAL_STORAGE_PERMISSION: + if (grantResults.length > 0 && grantResults[0] == PackageManager.PERMISSION_GRANTED) { + Toast.makeText(this, "Read External Storage Permission Granted", Toast.LENGTH_SHORT).show(); + Intent intent = new Intent(Intent.ACTION_PICK, MediaStore.Images.Media.EXTERNAL_CONTENT_URI); + startActivityForResult(intent, PICK_IMAGE_REQUEST); + } else { + Toast.makeText(this, "Read External Storage Permission Denied", Toast.LENGTH_SHORT).show(); + } + break; + default: + break; + } + + } + + @Override + protected void onActivityResult(int requestCode, int resultCode, Intent data) { + super.onActivityResult(requestCode, resultCode, data); + if (requestCode == PICK_IMAGE_REQUEST && resultCode == RESULT_OK && data != null) { + Uri selectedImage = data.getData(); + if (selectedImage != null) { + String imageUriString = selectedImage.toString(); + sendImageAsMessage(imageUriString); + } + } + } + + public void hideKeyboard(View view) { + InputMethodManager inputMethodManager = (InputMethodManager) getSystemService(Context.INPUT_METHOD_SERVICE); + if (inputMethodManager != null) { + inputMethodManager.hideSoftInputFromWindow(view.getWindowToken(), InputMethodManager.HIDE_NOT_ALWAYS); + } + } + +} \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MessageHandler.java b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MessageHandler.java new file mode 100644 index 00000000..39720c1f --- /dev/null +++ b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MessageHandler.java @@ -0,0 +1,127 @@ +package ai.nexa.app_java; + +import androidx.recyclerview.widget.RecyclerView; +import android.os.Handler; +import android.os.Looper; + +import java.util.ArrayList; + +public class MessageHandler { + private final ArrayList messageModalArrayList; + private final MessageRVAdapter messageRVAdapter; + private final RecyclerView recyclerView; + private final Handler mainHandler; + + public MessageHandler(ArrayList messageModalArrayList, MessageRVAdapter messageRVAdapter, RecyclerView recyclerView) { + this.messageModalArrayList = messageModalArrayList; + this.messageRVAdapter = messageRVAdapter; + this.recyclerView = recyclerView; + this.mainHandler = new Handler(Looper.getMainLooper()); + } + + /** + * Add a new message to the chat + */ + public void addMessage(MessageModal message) { + ensureMainThread(() -> { + messageModalArrayList.add(message); + messageRVAdapter.notifyItemInserted(messageModalArrayList.size() - 1); + scrollToBottom(); + }); + } + + /** + * Update the last bot message with new token + */ + public void updateLastBotMessage(String newToken) { + ensureMainThread(() -> { + if (!messageModalArrayList.isEmpty()) { + int lastIndex = messageModalArrayList.size() - 1; + MessageModal lastMessage = messageModalArrayList.get(lastIndex); + + // If last message is from bot, update it + if ("bot".equals(lastMessage.getSender())) { + String currentMessage = lastMessage.getMessage(); + lastMessage.setMessage(currentMessage + newToken); + messageRVAdapter.notifyItemChanged(lastIndex); + } else { + // Create new bot message + MessageModal newMessage = 
new MessageModal(newToken, "bot", null); + messageModalArrayList.add(newMessage); + messageRVAdapter.notifyItemInserted(messageModalArrayList.size() - 1); + } + scrollToBottom(); + } + }); + } + + /** + * Finalize the last bot message with complete response + */ + public void finalizeLastBotMessage(String completeMessage) { + ensureMainThread(() -> { + if (!messageModalArrayList.isEmpty()) { + int lastIndex = messageModalArrayList.size() - 1; + MessageModal lastMessage = messageModalArrayList.get(lastIndex); + + if ("bot".equals(lastMessage.getSender())) { + lastMessage.setMessage(completeMessage); + messageRVAdapter.notifyItemChanged(lastIndex); + } else { + MessageModal newMessage = new MessageModal(completeMessage, "bot", null); + messageModalArrayList.add(newMessage); + messageRVAdapter.notifyItemInserted(messageModalArrayList.size() - 1); + } + scrollToBottom(); + } + }); + } + + /** + * Clear all messages from the chat + */ + public void clearMessages() { + ensureMainThread(() -> { + messageModalArrayList.clear(); + messageRVAdapter.notifyDataSetChanged(); + }); + } + + /** + * Get the last message in the chat + */ + public MessageModal getLastMessage() { + if (!messageModalArrayList.isEmpty()) { + return messageModalArrayList.get(messageModalArrayList.size() - 1); + } + return null; + } + + /** + * Check if the last message is from the bot + */ + public boolean isLastMessageFromBot() { + MessageModal lastMessage = getLastMessage(); + return lastMessage != null && "bot".equals(lastMessage.getSender()); + } + + /** + * Scroll the RecyclerView to the bottom + */ + private void scrollToBottom() { + if (messageModalArrayList.size() > 1) { + recyclerView.smoothScrollToPosition(messageModalArrayList.size() - 1); + } + } + + /** + * Ensure all UI updates happen on the main thread + */ + private void ensureMainThread(Runnable action) { + if (Looper.myLooper() == Looper.getMainLooper()) { + action.run(); + } else { + mainHandler.post(action); + } + } +} \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MessageModal.java b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MessageModal.java new file mode 100644 index 00000000..1e60921b --- /dev/null +++ b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MessageModal.java @@ -0,0 +1,42 @@ +package ai.nexa.app_java; + +public class MessageModal { + + + private String message; + private String sender; + + private String imageUri; + + public MessageModal(String message, String sender, String imageUri) { + this.message = message; + this.sender = sender; + this.imageUri = imageUri; + } + + + public String getMessage() { + return message; + } + + public void setMessage(String message) { + this.message = message; + } + + public String getSender() { + return sender; + } + + public void setSender(String sender) { + this.sender = sender; + } + + public String getImageUri() { + return imageUri; + } + + public void setImageUri(String imageUri) { + this.imageUri = imageUri; + } +} + diff --git a/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MessageRVAdapter.java b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MessageRVAdapter.java new file mode 100644 index 00000000..90977681 --- /dev/null +++ b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/MessageRVAdapter.java @@ -0,0 +1,102 @@ +package ai.nexa.app_java; + +import android.content.Context; +import android.view.LayoutInflater; +import android.view.View; +import android.view.ViewGroup; 
+import android.widget.ImageView; +import android.widget.TextView; + +import androidx.annotation.NonNull; +import androidx.recyclerview.widget.RecyclerView; + +import com.bumptech.glide.Glide; + +import java.util.ArrayList; + +public class MessageRVAdapter extends RecyclerView.Adapter { + + private ArrayList messageModalArrayList; + private Context context; + + public MessageRVAdapter(ArrayList messageModalArrayList, Context context) { + this.messageModalArrayList = messageModalArrayList; + this.context = context; + } + + @NonNull + @Override + public RecyclerView.ViewHolder onCreateViewHolder(@NonNull ViewGroup parent, int viewType) { + View view; + switch (viewType) { + case 0: + view = LayoutInflater.from(parent.getContext()).inflate(R.layout.user_msg, parent, false); + return new UserViewHolder(view); + case 1: + view = LayoutInflater.from(parent.getContext()).inflate(R.layout.bot_msg, parent, false); + return new BotViewHolder(view); + } + return null; + } + + @Override + public void onBindViewHolder(@NonNull RecyclerView.ViewHolder holder, int position) { + MessageModal modal = messageModalArrayList.get(position); + switch (modal.getSender()) { + case "user": + UserViewHolder userHolder = (UserViewHolder) holder; + if (modal.getImageUri() != null && !modal.getImageUri().isEmpty()) { + userHolder.userImage.setVisibility(View.VISIBLE); + userHolder.userTV.setVisibility(View.GONE); + Glide.with(userHolder.itemView.getContext()) + .load(modal.getImageUri()) + .into(userHolder.userImage); + } else { + userHolder.userImage.setVisibility(View.GONE); + userHolder.userTV.setVisibility(View.VISIBLE); + userHolder.userTV.setText(modal.getMessage()); + } + break; + case "bot": + ((BotViewHolder) holder).botTV.setText(modal.getMessage()); + break; + } + } + + @Override + public int getItemCount() { + return messageModalArrayList.size(); + } + + @Override + public int getItemViewType(int position) { + switch (messageModalArrayList.get(position).getSender()) { + case "user": + return 0; + case "bot": + return 1; + default: + return -1; + } + } + + public static class UserViewHolder extends RecyclerView.ViewHolder { + TextView userTV; + ImageView userImage; + + public UserViewHolder(@NonNull View itemView) { + super(itemView); + userTV = itemView.findViewById(R.id.idTVUser); + userImage = itemView.findViewById(R.id.idIVUserImage); + } + } + + public static class BotViewHolder extends RecyclerView.ViewHolder { + TextView botTV; + + public BotViewHolder(@NonNull View itemView) { + super(itemView); + botTV = itemView.findViewById(R.id.idTVBot); + } + } +} diff --git a/android/llama.android/app-java/src/main/java/ai/nexa/app_java/VlmModelManager.java b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/VlmModelManager.java new file mode 100644 index 00000000..9ebd8d45 --- /dev/null +++ b/android/llama.android/app-java/src/main/java/ai/nexa/app_java/VlmModelManager.java @@ -0,0 +1,125 @@ +package ai.nexa.app_java; + +import android.content.Context; +import android.os.Environment; +import android.util.Log; + +import java.io.File; +import java.io.IOException; + +public class VlmModelManager { + private static final String TAG = "LlamaBridge"; + private static final String MODELS_DIR = "models"; + private static final String MODEL_TEXT_FILENAME = "nanollava-text-model-q4_0.gguf"; + private static final String MODEL_MMPROJ_FILENAME = "nanollava-mmproj-f16.gguf"; + + private final Context context; + private File textModelFile; + private File mmProjModelFile; + private final File externalModelDir; + 
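+    // The model files named above are located at runtime by findExistingModel(),
+    // which checks, in order: the app-specific directory under Android/data,
+    // the public Downloads folder, getExternalFilesDir(null)/models, and
+    // getFilesDir()/models, returning the first readable match.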
+ public VlmModelManager(Context context) { + this.context = context; + this.externalModelDir = new File(Environment.getExternalStorageDirectory(), + "Android/data/" + context.getPackageName() + "/files"); + } + + /** + * Search for model in common locations + * @param modelFilename The name of the model file to find + * @return File path to the model if found, null otherwise + */ + private String findExistingModel(String modelFilename) { + // List of possible locations to check + File[] locations = { + // External storage specific path + new File(externalModelDir, modelFilename), + // Downloads folder + new File(Environment.getExternalStoragePublicDirectory( + Environment.DIRECTORY_DOWNLOADS), modelFilename), + // App's private external storage + new File(context.getExternalFilesDir(null), MODELS_DIR + "/" + modelFilename), + // App's private internal storage + new File(context.getFilesDir(), MODELS_DIR + "/" + modelFilename) + }; + + for (File location : locations) { + if (location.exists() && location.canRead()) { + Log.d(TAG, "Found model at: " + location.getAbsolutePath()); + return location.getAbsolutePath(); + } + } + return null; + } + + /** + * Get text model path, searching in storage locations + * @return Path to the model file + * @throws IOException if model cannot be found or accessed + */ + public String getTextModelPath() throws IOException { + // If we already have a valid model file, return it + if (textModelFile != null && textModelFile.exists() && textModelFile.canRead()) { + return textModelFile.getAbsolutePath(); + } + + // Search for existing model + String path = findExistingModel(MODEL_TEXT_FILENAME); + if (path != null) { + textModelFile = new File(path); + return path; + } + + throw new IOException("Text model not found in any storage location"); + } + + /** + * Get mmproj model path, searching in storage locations + * @return Path to the model file + * @throws IOException if model cannot be found or accessed + */ + public String getMmProjModelPath() throws IOException { + // If we already have a valid model file, return it + if (mmProjModelFile != null && mmProjModelFile.exists() && mmProjModelFile.canRead()) { + return mmProjModelFile.getAbsolutePath(); + } + + // Search for existing model + String path = findExistingModel(MODEL_MMPROJ_FILENAME); + if (path != null) { + mmProjModelFile = new File(path); + return path; + } + + throw new IOException("MMProj model not found in any storage location"); + } + + /** + * Check if both required models exist in any location + * @return true if both models are found + */ + public boolean areModelsAvailable() { + try { + getTextModelPath(); + getMmProjModelPath(); + return true; + } catch (IOException e) { + Log.w(TAG, "Models not available: " + e.getMessage()); + return false; + } + } + + /** + * Get the directory containing the models + * @return File object for the models directory, or null if models aren't found + */ + public File getModelsDirectory() { + try { + String textModelPath = getTextModelPath(); + return new File(textModelPath).getParentFile(); + } catch (IOException e) { + Log.w(TAG, "Could not determine models directory: " + e.getMessage()); + return null; + } + } +} diff --git a/android/llama.android/app-java/src/main/res/drawable-hdpi/ic_menu_send.png b/android/llama.android/app-java/src/main/res/drawable-hdpi/ic_menu_send.png new file mode 100644 index 00000000..f34a9658 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/drawable-hdpi/ic_menu_send.png differ diff --git 
a/android/llama.android/app-java/src/main/res/drawable-mdpi/ic_menu_send.png b/android/llama.android/app-java/src/main/res/drawable-mdpi/ic_menu_send.png new file mode 100644 index 00000000..e83f6010 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/drawable-mdpi/ic_menu_send.png differ diff --git a/android/llama.android/app-java/src/main/res/drawable-v24/ic_launcher_foreground.xml b/android/llama.android/app-java/src/main/res/drawable-v24/ic_launcher_foreground.xml new file mode 100644 index 00000000..2b068d11 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable-v24/ic_launcher_foreground.xml @@ -0,0 +1,30 @@ + + + + + + + + + + + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/drawable-xhdpi/ic_menu_send.png b/android/llama.android/app-java/src/main/res/drawable-xhdpi/ic_menu_send.png new file mode 100644 index 00000000..882722eb Binary files /dev/null and b/android/llama.android/app-java/src/main/res/drawable-xhdpi/ic_menu_send.png differ diff --git a/android/llama.android/app-java/src/main/res/drawable-xxhdpi/ic_menu_send.png b/android/llama.android/app-java/src/main/res/drawable-xxhdpi/ic_menu_send.png new file mode 100644 index 00000000..08108e76 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/drawable-xxhdpi/ic_menu_send.png differ diff --git a/android/llama.android/app-java/src/main/res/drawable-xxxhdpi/ic_menu_send.png b/android/llama.android/app-java/src/main/res/drawable-xxxhdpi/ic_menu_send.png new file mode 100644 index 00000000..8f7eb62c Binary files /dev/null and b/android/llama.android/app-java/src/main/res/drawable-xxxhdpi/ic_menu_send.png differ diff --git a/android/llama.android/app-java/src/main/res/drawable/bg_send_message.xml b/android/llama.android/app-java/src/main/res/drawable/bg_send_message.xml new file mode 100644 index 00000000..972981d8 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/bg_send_message.xml @@ -0,0 +1,9 @@ + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/bot_message.xml b/android/llama.android/app-java/src/main/res/drawable/bot_message.xml new file mode 100644 index 00000000..8dda5f87 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/bot_message.xml @@ -0,0 +1,11 @@ + + + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/gradient_background.xml b/android/llama.android/app-java/src/main/res/drawable/gradient_background.xml new file mode 100644 index 00000000..6d9a5345 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/gradient_background.xml @@ -0,0 +1,8 @@ + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/ic_bot.xml b/android/llama.android/app-java/src/main/res/drawable/ic_bot.xml new file mode 100644 index 00000000..660ed4e0 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/ic_bot.xml @@ -0,0 +1,171 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/ic_launcher.png b/android/llama.android/app-java/src/main/res/drawable/ic_launcher.png new file mode 100644 index 00000000..e3c90853 Binary files /dev/null and 
b/android/llama.android/app-java/src/main/res/drawable/ic_launcher.png differ diff --git a/android/llama.android/app-java/src/main/res/drawable/ic_launcher_background.xml b/android/llama.android/app-java/src/main/res/drawable/ic_launcher_background.xml new file mode 100644 index 00000000..07d5da9c --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/ic_launcher_background.xml @@ -0,0 +1,170 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/ic_launcher_fav_background.xml b/android/llama.android/app-java/src/main/res/drawable/ic_launcher_fav_background.xml new file mode 100644 index 00000000..ca3826a4 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/ic_launcher_fav_background.xml @@ -0,0 +1,74 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/ic_user.xml b/android/llama.android/app-java/src/main/res/drawable/ic_user.xml new file mode 100644 index 00000000..725adb58 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/ic_user.xml @@ -0,0 +1,22 @@ + + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/input_text_box.xml b/android/llama.android/app-java/src/main/res/drawable/input_text_box.xml new file mode 100644 index 00000000..1c132b0b --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/input_text_box.xml @@ -0,0 +1,10 @@ + + + + + + + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/drawable/microphone.xml b/android/llama.android/app-java/src/main/res/drawable/microphone.xml new file mode 100644 index 00000000..75fe9341 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/microphone.xml @@ -0,0 +1,13 @@ + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/octopus_background.xml b/android/llama.android/app-java/src/main/res/drawable/octopus_background.xml new file mode 100644 index 00000000..ca3826a4 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/octopus_background.xml @@ -0,0 +1,74 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/octopus_menu_send.xml b/android/llama.android/app-java/src/main/res/drawable/octopus_menu_send.xml new file mode 100644 index 00000000..4254a34f --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/octopus_menu_send.xml @@ -0,0 +1,11 @@ + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/octopus_original.xml b/android/llama.android/app-java/src/main/res/drawable/octopus_original.xml new file mode 100644 index 00000000..92048641 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/octopus_original.xml @@ -0,0 +1,171 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/ocutopus_v3_full_size.png b/android/llama.android/app-java/src/main/res/drawable/ocutopus_v3_full_size.png new file mode 100644 index 00000000..de1bb864 Binary files /dev/null and 
b/android/llama.android/app-java/src/main/res/drawable/ocutopus_v3_full_size.png differ diff --git a/android/llama.android/app-java/src/main/res/drawable/roundcorner.xml b/android/llama.android/app-java/src/main/res/drawable/roundcorner.xml new file mode 100644 index 00000000..5c795c41 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/roundcorner.xml @@ -0,0 +1,9 @@ + + + + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/title.xml b/android/llama.android/app-java/src/main/res/drawable/title.xml new file mode 100644 index 00000000..a7bad4f8 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/title.xml @@ -0,0 +1,11 @@ + + + + + + + + + diff --git a/android/llama.android/app-java/src/main/res/drawable/upload_image_icon.xml b/android/llama.android/app-java/src/main/res/drawable/upload_image_icon.xml new file mode 100644 index 00000000..f4a86832 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/drawable/upload_image_icon.xml @@ -0,0 +1,13 @@ + + + diff --git a/android/llama.android/app-java/src/main/res/font/abhaya_libre_bold.ttf b/android/llama.android/app-java/src/main/res/font/abhaya_libre_bold.ttf new file mode 100644 index 00000000..6f4a231d Binary files /dev/null and b/android/llama.android/app-java/src/main/res/font/abhaya_libre_bold.ttf differ diff --git a/android/llama.android/app-java/src/main/res/font/alegreya_sans_sc_extrabold.xml b/android/llama.android/app-java/src/main/res/font/alegreya_sans_sc_extrabold.xml new file mode 100644 index 00000000..8112a231 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/font/alegreya_sans_sc_extrabold.xml @@ -0,0 +1,7 @@ + + + diff --git a/android/llama.android/app-java/src/main/res/layout/activity_main.xml b/android/llama.android/app-java/src/main/res/layout/activity_main.xml new file mode 100644 index 00000000..625d9923 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/layout/activity_main.xml @@ -0,0 +1,115 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/layout/bot_msg.xml b/android/llama.android/app-java/src/main/res/layout/bot_msg.xml new file mode 100644 index 00000000..5ee58e1d --- /dev/null +++ b/android/llama.android/app-java/src/main/res/layout/bot_msg.xml @@ -0,0 +1,35 @@ + + + + + + + + + + diff --git a/android/llama.android/app-java/src/main/res/layout/user_msg.xml b/android/llama.android/app-java/src/main/res/layout/user_msg.xml new file mode 100644 index 00000000..20aa126a --- /dev/null +++ b/android/llama.android/app-java/src/main/res/layout/user_msg.xml @@ -0,0 +1,55 @@ + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/ic_launcher.xml b/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/ic_launcher.xml new file mode 100644 index 00000000..036d09bc --- /dev/null +++ b/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/ic_launcher.xml @@ -0,0 +1,5 @@ + + + + + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml b/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml new file mode 100644 index 00000000..036d09bc --- /dev/null +++ b/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/ic_launcher_round.xml @@ -0,0 +1,5 @@ + + + + + \ No newline at end of file diff --git 
a/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/octopus.xml b/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/octopus.xml new file mode 100644 index 00000000..2e533e65 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/octopus.xml @@ -0,0 +1,5 @@ + + + + + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/octopus_round.xml b/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/octopus_round.xml new file mode 100644 index 00000000..2e533e65 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/mipmap-anydpi-v26/octopus_round.xml @@ -0,0 +1,5 @@ + + + + + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/mipmap-hdpi/ic_launcher.png b/android/llama.android/app-java/src/main/res/mipmap-hdpi/ic_launcher.png new file mode 100644 index 00000000..cf0c3458 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-hdpi/ic_launcher.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-hdpi/ic_launcher_foreground.png b/android/llama.android/app-java/src/main/res/mipmap-hdpi/ic_launcher_foreground.png new file mode 100644 index 00000000..8acbf0ea Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-hdpi/ic_launcher_foreground.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-hdpi/ic_launcher_round.png b/android/llama.android/app-java/src/main/res/mipmap-hdpi/ic_launcher_round.png new file mode 100644 index 00000000..12580bdb Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-hdpi/ic_launcher_round.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-hdpi/octopus.webp b/android/llama.android/app-java/src/main/res/mipmap-hdpi/octopus.webp new file mode 100644 index 00000000..29daecf1 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-hdpi/octopus.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-hdpi/octopus_foreground.webp b/android/llama.android/app-java/src/main/res/mipmap-hdpi/octopus_foreground.webp new file mode 100644 index 00000000..88bf3149 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-hdpi/octopus_foreground.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-hdpi/octopus_round.webp b/android/llama.android/app-java/src/main/res/mipmap-hdpi/octopus_round.webp new file mode 100644 index 00000000..0883ba1c Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-hdpi/octopus_round.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-mdpi/ic_launcher.png b/android/llama.android/app-java/src/main/res/mipmap-mdpi/ic_launcher.png new file mode 100644 index 00000000..b3990457 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-mdpi/ic_launcher.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-mdpi/ic_launcher_foreground.png b/android/llama.android/app-java/src/main/res/mipmap-mdpi/ic_launcher_foreground.png new file mode 100644 index 00000000..b8a59f47 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-mdpi/ic_launcher_foreground.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-mdpi/ic_launcher_round.png b/android/llama.android/app-java/src/main/res/mipmap-mdpi/ic_launcher_round.png new file mode 100644 index 00000000..75aec75a 
Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-mdpi/ic_launcher_round.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-mdpi/octopus.webp b/android/llama.android/app-java/src/main/res/mipmap-mdpi/octopus.webp new file mode 100644 index 00000000..c192866e Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-mdpi/octopus.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-mdpi/octopus_foreground.webp b/android/llama.android/app-java/src/main/res/mipmap-mdpi/octopus_foreground.webp new file mode 100644 index 00000000..34251871 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-mdpi/octopus_foreground.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-mdpi/octopus_round.webp b/android/llama.android/app-java/src/main/res/mipmap-mdpi/octopus_round.webp new file mode 100644 index 00000000..edb57427 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-mdpi/octopus_round.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xhdpi/ic_launcher.png b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/ic_launcher.png new file mode 100644 index 00000000..a6324636 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/ic_launcher.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xhdpi/ic_launcher_foreground.png b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/ic_launcher_foreground.png new file mode 100644 index 00000000..98708fa5 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/ic_launcher_foreground.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xhdpi/ic_launcher_round.png b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/ic_launcher_round.png new file mode 100644 index 00000000..30de3067 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/ic_launcher_round.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xhdpi/octopus.webp b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/octopus.webp new file mode 100644 index 00000000..372b8bdb Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/octopus.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xhdpi/octopus_foreground.webp b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/octopus_foreground.webp new file mode 100644 index 00000000..fcdd6ddf Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/octopus_foreground.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xhdpi/octopus_round.webp b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/octopus_round.webp new file mode 100644 index 00000000..5b864a66 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xhdpi/octopus_round.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/ic_launcher.png b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/ic_launcher.png new file mode 100644 index 00000000..196c1ef5 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/ic_launcher.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/ic_launcher_foreground.png b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/ic_launcher_foreground.png 
new file mode 100644 index 00000000..34fc4e7e Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/ic_launcher_foreground.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/ic_launcher_round.png b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/ic_launcher_round.png new file mode 100644 index 00000000..984bb8d9 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/ic_launcher_round.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/octopus.webp b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/octopus.webp new file mode 100644 index 00000000..ad3daafc Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/octopus.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/octopus_foreground.webp b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/octopus_foreground.webp new file mode 100644 index 00000000..ca878a67 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/octopus_foreground.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/octopus_round.webp b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/octopus_round.webp new file mode 100644 index 00000000..fd780d66 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxhdpi/octopus_round.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/ic_launcher.png b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/ic_launcher.png new file mode 100644 index 00000000..1f10f330 Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/ic_launcher.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/ic_launcher_foreground.png b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/ic_launcher_foreground.png new file mode 100644 index 00000000..13f3147e Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/ic_launcher_foreground.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/ic_launcher_round.png b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/ic_launcher_round.png new file mode 100644 index 00000000..b81a70ba Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/ic_launcher_round.png differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/octopus.webp b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/octopus.webp new file mode 100644 index 00000000..ef8923ce Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/octopus.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/octopus_foreground.webp b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/octopus_foreground.webp new file mode 100644 index 00000000..e8b6489c Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/octopus_foreground.webp differ diff --git a/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/octopus_round.webp b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/octopus_round.webp new file mode 100644 index 00000000..d0b5881a Binary files /dev/null and b/android/llama.android/app-java/src/main/res/mipmap-xxxhdpi/octopus_round.webp differ diff --git 
a/android/llama.android/app-java/src/main/res/values-night/themes.xml b/android/llama.android/app-java/src/main/res/values-night/themes.xml new file mode 100644 index 00000000..2bd72d37 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/values-night/themes.xml @@ -0,0 +1,11 @@ + + + + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/values/colors.xml b/android/llama.android/app-java/src/main/res/values/colors.xml new file mode 100644 index 00000000..b15af47b --- /dev/null +++ b/android/llama.android/app-java/src/main/res/values/colors.xml @@ -0,0 +1,17 @@ + + + #FF000000 + #FFFFFFFF + #813BBA + #FF202020 + #17CE92 + #E5E5E5 + #0A1528 + #313D50 + #03070D + #03070D + #03070D + #03070D + #FFFFFF + #B00020 + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/values/font_certs.xml b/android/llama.android/app-java/src/main/res/values/font_certs.xml new file mode 100644 index 00000000..d2226ac0 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/values/font_certs.xml @@ -0,0 +1,17 @@ + + + + @array/com_google_android_gms_fonts_certs_dev + @array/com_google_android_gms_fonts_certs_prod + + + + MIIEqDCCA5CgAwIBAgIJANWFuGx90071MA0GCSqGSIb3DQEBBAUAMIGUMQswCQYDVQQGEwJVUzETMBEGA1UECBMKQ2FsaWZvcm5pYTEWMBQGA1UEBxMNTW91bnRhaW4gVmlldzEQMA4GA1UEChMHQW5kcm9pZDEQMA4GA1UECxMHQW5kcm9pZDEQMA4GA1UEAxMHQW5kcm9pZDEiMCAGCSqGSIb3DQEJARYTYW5kcm9pZEBhbmRyb2lkLmNvbTAeFw0wODA0MTUyMzM2NTZaFw0zNTA5MDEyMzM2NTZaMIGUMQswCQYDVQQGEwJVUzETMBEGA1UECBMKQ2FsaWZvcm5pYTEWMBQGA1UEBxMNTW91bnRhaW4gVmlldzEQMA4GA1UEChMHQW5kcm9pZDEQMA4GA1UECxMHQW5kcm9pZDEQMA4GA1UEAxMHQW5kcm9pZDEiMCAGCSqGSIb3DQEJARYTYW5kcm9pZEBhbmRyb2lkLmNvbTCCASAwDQYJKoZIhvcNAQEBBQADggENADCCAQgCggEBANbOLggKv+IxTdGNs8/TGFy0PTP6DHThvbbR24kT9ixcOd9W+EaBPWW+wPPKQmsHxajtWjmQwWfna8mZuSeJS48LIgAZlKkpFeVyxW0qMBujb8X8ETrWy550NaFtI6t9+u7hZeTfHwqNvacKhp1RbE6dBRGWynwMVX8XW8N1+UjFaq6GCJukT4qmpN2afb8sCjUigq0GuMwYXrFVee74bQgLHWGJwPmvmLHC69EH6kWr22ijx4OKXlSIx2xT1AsSHee70w5iDBiK4aph27yH3TxkXy9V89TDdexAcKk/cVHYNnDBapcavl7y0RiQ4biu8ymM8Ga/nmzhRKya6G0cGw8CAQOjgfwwgfkwHQYDVR0OBBYEFI0cxb6VTEM8YYY6FbBMvAPyT+CyMIHJBgNVHSMEgcEwgb6AFI0cxb6VTEM8YYY6FbBMvAPyT+CyoYGapIGXMIGUMQswCQYDVQQGEwJVUzETMBEGA1UECBMKQ2FsaWZvcm5pYTEWMBQGA1UEBxMNTW91bnRhaW4gVmlldzEQMA4GA1UEChMHQW5kcm9pZDEQMA4GA1UECxMHQW5kcm9pZDEQMA4GA1UEAxMHQW5kcm9pZDEiMCAGCSqGSIb3DQEJARYTYW5kcm9pZEBhbmRyb2lkLmNvbYIJANWFuGx90071MAwGA1UdEwQFMAMBAf8wDQYJKoZIhvcNAQEEBQADggEBABnTDPEF+3iSP0wNfdIjIz1AlnrPzgAIHVvXxunW7SBrDhEglQZBbKJEk5kT0mtKoOD1JMrSu1xuTKEBahWRbqHsXclaXjoBADb0kkjVEJu/Lh5hgYZnOjvlba8Ld7HCKePCVePoTJBdI4fvugnL8TsgK05aIskyY0hKI9L8KfqfGTl1lzOv2KoWD0KWwtAWPoGChZxmQ+nBli+gwYMzM1vAkP+aayLe0a1EQimlOalO762r0GXO0ks+UeXde2Z4e+8S/pf7pITEI/tP+MxJTALw9QUWEv9lKTk+jkbqxbsh8nfBUapfKqYn0eidpwq2AzVp3juYl7//fKnaPhJD9gs= + + + + + 
MIIEQzCCAyugAwIBAgIJAMLgh0ZkSjCNMA0GCSqGSIb3DQEBBAUAMHQxCzAJBgNVBAYTAlVTMRMwEQYDVQQIEwpDYWxpZm9ybmlhMRYwFAYDVQQHEw1Nb3VudGFpbiBWaWV3MRQwEgYDVQQKEwtHb29nbGUgSW5jLjEQMA4GA1UECxMHQW5kcm9pZDEQMA4GA1UEAxMHQW5kcm9pZDAeFw0wODA4MjEyMzEzMzRaFw0zNjAxMDcyMzEzMzRaMHQxCzAJBgNVBAYTAlVTMRMwEQYDVQQIEwpDYWxpZm9ybmlhMRYwFAYDVQQHEw1Nb3VudGFpbiBWaWV3MRQwEgYDVQQKEwtHb29nbGUgSW5jLjEQMA4GA1UECxMHQW5kcm9pZDEQMA4GA1UEAxMHQW5kcm9pZDCCASAwDQYJKoZIhvcNAQEBBQADggENADCCAQgCggEBAKtWLgDYO6IIrgqWbxJOKdoR8qtW0I9Y4sypEwPpt1TTcvZApxsdyxMJZ2JORland2qSGT2y5b+3JKkedxiLDmpHpDsz2WCbdxgxRczfey5YZnTJ4VZbH0xqWVW/8lGmPav5xVwnIiJS6HXk+BVKZF+JcWjAsb/GEuq/eFdpuzSqeYTcfi6idkyugwfYwXFU1+5fZKUaRKYCwkkFQVfcAs1fXA5V+++FGfvjJ/CxURaSxaBvGdGDhfXE28LWuT9ozCl5xw4Yq5OGazvV24mZVSoOO0yZ31j7kYvtwYK6NeADwbSxDdJEqO4k//0zOHKrUiGYXtqw/A0LFFtqoZKFjnkCAQOjgdkwgdYwHQYDVR0OBBYEFMd9jMIhF1Ylmn/Tgt9r45jk14alMIGmBgNVHSMEgZ4wgZuAFMd9jMIhF1Ylmn/Tgt9r45jk14aloXikdjB0MQswCQYDVQQGEwJVUzETMBEGA1UECBMKQ2FsaWZvcm5pYTEWMBQGA1UEBxMNTW91bnRhaW4gVmlldzEUMBIGA1UEChMLR29vZ2xlIEluYy4xEDAOBgNVBAsTB0FuZHJvaWQxEDAOBgNVBAMTB0FuZHJvaWSCCQDC4IdGZEowjTAMBgNVHRMEBTADAQH/MA0GCSqGSIb3DQEBBAUAA4IBAQBt0lLO74UwLDYKqs6Tm8/yzKkEu116FmH4rkaymUIE0P9KaMftGlMexFlaYjzmB2OxZyl6euNXEsQH8gjwyxCUKRJNexBiGcCEyj6z+a1fuHHvkiaai+KL8W1EyNmgjmyy8AW7P+LLlkR+ho5zEHatRbM/YAnqGcFh5iZBqpknHf1SKMXFh4dd239FJ1jWYfbMDMy3NS5CTMQ2XFI1MvcyUTdZPErjQfTbQe3aDQsQcafEQPD+nqActifKZ0Np0IS9L9kR/wbNvyz6ENwPiTrjV2KRkEjH78ZMcUQXg0L3BYHJ3lc69Vs5Ddf9uUGGMYldX3WfMBEmh/9iFBDAaTCK + + + diff --git a/android/llama.android/app-java/src/main/res/values/ic_launcher_background.xml b/android/llama.android/app-java/src/main/res/values/ic_launcher_background.xml new file mode 100644 index 00000000..c5d5899f --- /dev/null +++ b/android/llama.android/app-java/src/main/res/values/ic_launcher_background.xml @@ -0,0 +1,4 @@ + + + #FFFFFF + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/values/preloaded_fonts.xml b/android/llama.android/app-java/src/main/res/values/preloaded_fonts.xml new file mode 100644 index 00000000..56657f17 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/values/preloaded_fonts.xml @@ -0,0 +1,6 @@ + + + + @font/alegreya_sans_sc_extrabold + + diff --git a/android/llama.android/app-java/src/main/res/values/strings.xml b/android/llama.android/app-java/src/main/res/values/strings.xml new file mode 100644 index 00000000..2ff67712 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/values/strings.xml @@ -0,0 +1,4 @@ + + LayoutTest + User Message + \ No newline at end of file diff --git a/android/llama.android/app-java/src/main/res/values/styles.xml b/android/llama.android/app-java/src/main/res/values/styles.xml new file mode 100644 index 00000000..864fcf30 --- /dev/null +++ b/android/llama.android/app-java/src/main/res/values/styles.xml @@ -0,0 +1,16 @@ + + + + diff --git a/android/llama.android/app-java/src/main/res/values/themes.xml b/android/llama.android/app-java/src/main/res/values/themes.xml new file mode 100644 index 00000000..2ef46f0c --- /dev/null +++ b/android/llama.android/app-java/src/main/res/values/themes.xml @@ -0,0 +1,13 @@ + + + + + - """, - unsafe_allow_html=True, -) -st.title("Nexa AI Image Generation") -st.caption("Powered by Nexa AI SDK🐙") + default_model = sys.argv[1] + is_local_path = sys.argv[2].lower() == "true" + hf = sys.argv[3].lower() == "true" + + # UI setup: + st.set_page_config(page_title="Nexa AI Image Generation", layout="wide") + st.markdown( + r""" + + """, + unsafe_allow_html=True, + ) + st.title("Nexa AI Image Generation") + 
st.caption("Powered by Nexa AI SDK🐙") + + # force refresh model options on every page load: + if 'model_options' not in st.session_state: + st.session_state.model_options = get_model_options(specified_run_type, model_map) + else: + update_model_options(specified_run_type, model_map) -st.sidebar.header("Model Configuration") -model_path = st.sidebar.text_input("Model path", default_model) + # init session state variables: + if 'initialized' not in st.session_state: + st.session_state.current_model_path = None + st.session_state.current_local_path = None + st.session_state.current_hub_model = None + + if not is_local_path and not hf: + try: + with st.spinner(f"Loading model: {default_model}"): + st.session_state.nexa_model = load_model(default_model) + if st.session_state.nexa_model: + st.session_state.current_hub_model = default_model + except Exception as e: + st.error(f"Error loading default model: {str(e)}") + + if default_model not in st.session_state.model_options: + st.session_state.current_model_index = st.session_state.model_options.index("Use Model From Nexa Model Hub 🔍") + else: + try: + st.session_state.current_model_index = st.session_state.model_options.index(default_model) + except ValueError: + st.session_state.current_model_index = 0 + + st.session_state.initialized = True + + # model selection sidebar: + st.sidebar.header("Model Configuration") + + # update selectbox index based on current model + if 'nexa_model' in st.session_state: + if st.session_state.current_hub_model: + current_index = st.session_state.model_options.index("Use Model From Nexa Model Hub 🔍") + elif st.session_state.current_local_path: + current_index = st.session_state.model_options.index("Local Model 📁") + elif st.session_state.current_model_path: + current_index = st.session_state.model_options.index(st.session_state.current_model_path) + else: + current_index = st.session_state.current_model_index + else: + current_index = st.session_state.current_model_index -if not model_path: - st.warning( - "Please enter a valid path or identifier for the model in Nexa Model Hub to proceed." 
+ model_path = st.sidebar.selectbox( + "Select a Model", + st.session_state.model_options, + index=current_index, + key='model_selectbox' ) - st.stop() - -if ( - "current_model_path" not in st.session_state - or st.session_state.current_model_path != model_path -): - st.session_state.current_model_path = model_path - st.session_state.nexa_model = load_model(model_path) - if st.session_state.nexa_model is None: - st.stop() - -st.sidebar.header("Generation Parameters") -num_inference_steps = st.sidebar.slider( - "Number of Inference Steps", - 1, - 100, - st.session_state.nexa_model.params["num_inference_steps"], -) -height = st.sidebar.slider( - "Height", 64, 1024, st.session_state.nexa_model.params["height"] -) -width = st.sidebar.slider( - "Width", 64, 1024, st.session_state.nexa_model.params["width"] -) -guidance_scale = st.sidebar.slider( - "Guidance Scale", 0.0, 20.0, st.session_state.nexa_model.params["guidance_scale"] -) -random_seed = st.sidebar.slider( - "Random Seed", 0, 10000, st.session_state.nexa_model.params["random_seed"] -) -st.session_state.nexa_model.params.update( - { - "num_inference_steps": num_inference_steps, - "height": height, - "width": width, - "guidance_scale": guidance_scale, - "random_seed": random_seed, - } -) + # handle model path input: + if model_path == "Local Model 📁": + local_model_path = st.sidebar.text_input("Enter local model path") + if not local_model_path: + st.warning("Please enter a valid local model path to proceed.") + st.stop() + local_model_path = local_model_path.strip() # remove spaces -prompt = st.text_input("Enter your prompt:") -negative_prompt = st.text_input("Enter your negative prompt (optional):") + # handle local model path changes: + if 'nexa_model' not in st.session_state or st.session_state.current_local_path != local_model_path: + with st.spinner("Loading local model..."): + st.session_state.nexa_model = load_local_model(local_model_path) + st.session_state.current_local_path = local_model_path + + elif model_path == "Use Model From Nexa Model Hub 🔍": + initial_value = default_model if not is_local_path and not hf else "" + hub_model_name = st.sidebar.text_input( + "Enter model name from Nexa Model Hub", + value=initial_value + ) + + # empty string check: + if not hub_model_name: + st.warning(""" + How to add a model from Nexa Model Hub: + \n1. Visit [Nexa Model Hub](https://nexaai.com/models) + \n2. Find a vision model using the task filters + \n3. Select your desired model and copy either: + \n - The full nexa run command, or (e.g., nexa run stable-diffusion-v1-4:q4_0) + \n - Simply the model name (e.g., stable-diffusion-v1-4:q4_0) + \n4. 
Paste it into the field on the sidebar and press enter + """) + st.stop() + + # process the input after checking it's not empty: + if hub_model_name.startswith("nexa run"): + hub_model_name = hub_model_name.split("nexa run")[-1].strip() + else: + hub_model_name = hub_model_name.strip() + + # handle hub model name changes: + if 'nexa_model' not in st.session_state or st.session_state.current_hub_model != hub_model_name: + with st.spinner("Loading model from hub..."): + st.session_state.nexa_model = load_model(hub_model_name) + if st.session_state.nexa_model: # only update if load was successful + st.session_state.current_hub_model = hub_model_name -if st.button("Generate Image"): - if not prompt: - st.warning("Please enter a prompt to proceed.") else: - with st.spinner("Generating images..."): - images = generate_images( - st.session_state.nexa_model, prompt, negative_prompt - ) - st.success("Images generated successfully!") - for i, image in enumerate(images): - st.image(image, caption=f"Generated Image", use_column_width=True) - - img_byte_arr = io.BytesIO() - image.save(img_byte_arr, format='PNG') - img_byte_arr = img_byte_arr.getvalue() - - st.download_button( - label=f"Download Image", - data=img_byte_arr, - file_name=f"generated_image.png", - mime="image/png" + # load selected model if it's not already loaded: + if ('nexa_model' not in st.session_state or getattr(st.session_state, 'current_model_path', None) != model_path): + with st.spinner(f"Loading model: {model_path}"): + st.session_state.nexa_model = load_model(model_path) + if st.session_state.nexa_model: # only update if load was successful + st.session_state.current_model_path = model_path + + # generation params: + if 'nexa_model' in st.session_state and st.session_state.nexa_model: + st.sidebar.header("Generation Parameters") + + model_to_check = (st.session_state.current_hub_model if st.session_state.current_hub_model else st.session_state.current_local_path if st.session_state.current_local_path else st.session_state.current_model_path) + + # get model specific defaults: + default_params = get_default_params(model_to_check) + + # adjust step range based on model type: + max_steps = 100 + if "lcm-dreamshaper" in model_to_check or "flux" in model_to_check: + max_steps = 8 # 4-8 steps + elif "sdxl-turbo" in model_to_check: + max_steps = 10 # 5-10 steps + + # adjust guidance scale range based on model type: + max_guidance = 20.0 + if "lcm-dreamshaper" in model_to_check or "flux" in model_to_check: + max_guidance = 2.0 # 1.0-2.0 + elif "sdxl-turbo" in model_to_check: + max_guidance = 10.0 # 5.0-10.0 + + num_inference_steps = st.sidebar.slider( + "Number of Inference Steps", + 1, + max_steps, + default_params["num_inference_steps"] + ) + height = st.sidebar.slider( + "Height", + 64, + 1024, + default_params["height"] + ) + width = st.sidebar.slider( + "Width", + 64, + 1024, + default_params["width"] + ) + guidance_scale = st.sidebar.slider( + "Guidance Scale", + 0.0, + max_guidance, + default_params["guidance_scale"] + ) + random_seed = st.sidebar.slider( + "Random Seed", + 0, + 10000, + default_params["random_seed"] + ) + + st.session_state.nexa_model.params.update({ + "num_inference_steps": num_inference_steps, + "height": height, + "width": width, + "guidance_scale": guidance_scale, + "random_seed": random_seed, + }) + + # image generation interface: + prompt = st.text_input("Enter your prompt:") + negative_prompt = st.text_input("Enter your negative prompt (optional):") + + if st.button("Generate Image"): + if not prompt: + 
st.warning("Please enter a prompt to proceed.") + else: + with st.spinner("Generating images..."): + images = generate_images( + st.session_state.nexa_model, + prompt, + negative_prompt ) + st.success("Images generated successfully!") + for i, image in enumerate(images): + st.image(image, caption=f"Generated Image", use_column_width=True) + + img_byte_arr = io.BytesIO() + image.save(img_byte_arr, format='PNG') + img_byte_arr = img_byte_arr.getvalue() + + st.download_button( + label=f"Download Image", + data=img_byte_arr, + file_name=f"generated_image.png", + mime="image/png" + ) + +except Exception as e: + st.error(f"An unexpected error occurred: {str(e)}") + import traceback + st.error(f"Traceback: {traceback.format_exc()}") diff --git a/nexa/gguf/streamlit/streamlit_text_chat.py b/nexa/gguf/streamlit/streamlit_text_chat.py index 542e8059..4adf60e3 100644 --- a/nexa/gguf/streamlit/streamlit_text_chat.py +++ b/nexa/gguf/streamlit/streamlit_text_chat.py @@ -1,112 +1,313 @@ import sys -from typing import Iterator - +import subprocess +import re +from typing import Iterator, List import streamlit as st from nexa.general import pull_model from nexa.gguf.nexa_inference_text import NexaTextInference +from nexa.utils import ( + get_model_options, + update_model_options, +) +from nexa.constants import ( + DEFAULT_TEXT_GEN_PARAMS, + NEXA_RUN_MODEL_MAP_TEXT, +) -default_model = sys.argv[1] -is_local_path = False if sys.argv[2] == "False" else True -hf = False if sys.argv[3] == "False" else True - -@st.cache_resource -def load_model(model_path): - st.session_state.messages = [] - if is_local_path: - local_path = model_path - elif hf: - local_path, _ = pull_model(model_path, hf=True) - else: - local_path, run_type = pull_model(model_path) - nexa_model = NexaTextInference(model_path=model_path, local_path=local_path) - return nexa_model +specified_run_type = 'NLP' +model_map = NEXA_RUN_MODEL_MAP_TEXT + +# init: +DEFAULT_PARAMS = DEFAULT_TEXT_GEN_PARAMS.copy() + +@st.cache_resource(show_spinner=False) +def load_model(model_path: str, is_local: bool = False, is_hf: bool = False): + """Load model with proper error handling and state management.""" + try: + st.session_state.messages = [] + + if is_local: + local_path = model_path + elif is_hf: + try: + local_path, _ = pull_model(model_path, hf=True) + update_model_options(specified_run_type, model_map) # update options after successful pull + except Exception as e: + st.error(f"Error pulling HuggingFace model: {str(e)}") + return None + else: + try: + # model hub case: + local_path, run_type = pull_model(model_path) + if not local_path or not run_type: + st.error(f"Failed to pull model {model_path} from Nexa Model Hub") + return None + update_model_options(specified_run_type, model_map) # update options after successful pull + except ValueError as e: + st.error(f"Error pulling model from Nexa Model Hub: {str(e)}") + return None + except Exception as e: + st.error(f"Unexpected error while pulling model: {str(e)}") + return None + + try: + nexa_model = NexaTextInference( + model_path=model_path, + local_path=local_path, + **DEFAULT_PARAMS + ) + + # force refresh of model options after successful load: + update_model_options(specified_run_type, model_map) + + # reset the model index to include the new model: + if model_path in st.session_state.model_options: + st.session_state.current_model_index = st.session_state.model_options.index(model_path) + return nexa_model + + except Exception as e: + st.error(f"Error initializing model: {str(e)}") + return None + 
except Exception as e: + st.error(f"Error in load_model: {str(e)}") + return None + +@st.cache_resource(show_spinner=False) +def load_local_model(local_path: str): + """Load local model with default parameters.""" + try: + st.session_state.messages = [] + nexa_model = NexaTextInference( + model_path="local_model", + local_path=local_path, + **DEFAULT_PARAMS + ) + update_model_options(specified_run_type, model_map) # update options after successful local model load + return nexa_model + except Exception as e: + st.error(f"Error loading local model: {str(e)}") + return None def generate_response(nexa_model: NexaTextInference) -> Iterator: + """Generate response from the model.""" user_input = st.session_state.messages[-1]["content"] if hasattr(nexa_model, "chat_format") and nexa_model.chat_format: return nexa_model._chat(user_input) else: return nexa_model._complete(user_input) -st.markdown( - r""" - - """, - unsafe_allow_html=True, -) -st.title("Nexa AI Text Generation") -st.caption("Powered by Nexa AI SDK🐙") +# main execution: +try: + # get command line arguments with proper error handling: + if len(sys.argv) < 4: + st.error("Missing required command line arguments.") + sys.exit(1) # program terminated with an error -st.sidebar.header("Model Configuration") -model_path = st.sidebar.text_input("Model path", default_model) + default_model = sys.argv[1] + is_local_path = sys.argv[2].lower() == "true" + hf = sys.argv[3].lower() == "true" -if not model_path: - st.warning( - "Please enter a valid path or identifier for the model in Nexa Model Hub to proceed." + # UI setup: + st.set_page_config(page_title="Nexa AI Text Generation", layout="wide") + st.markdown( + r""" + + """, + unsafe_allow_html=True, ) - st.stop() - -if ( - "current_model_path" not in st.session_state - or st.session_state.current_model_path != model_path -): - st.session_state.current_model_path = model_path - st.session_state.nexa_model = load_model(model_path) - if st.session_state.nexa_model is None: - st.stop() - -st.sidebar.header("Generation Parameters") -temperature = st.sidebar.slider( - "Temperature", 0.0, 1.0, st.session_state.nexa_model.params["temperature"] -) -max_new_tokens = st.sidebar.slider( - "Max New Tokens", 1, 500, st.session_state.nexa_model.params["max_new_tokens"] -) -top_k = st.sidebar.slider("Top K", 1, 100, st.session_state.nexa_model.params["top_k"]) -top_p = st.sidebar.slider( - "Top P", 0.0, 1.0, st.session_state.nexa_model.params["top_p"] -) + st.title("Nexa AI Text Generation") + st.caption("Powered by Nexa AI SDK🐙") -st.session_state.nexa_model.params.update( - { - "temperature": temperature, - "max_new_tokens": max_new_tokens, - "top_k": top_k, - "top_p": top_p, - } -) + # force refresh model options on every page load: + if 'model_options' not in st.session_state: + st.session_state.model_options = get_model_options(specified_run_type, model_map) + else: + update_model_options(specified_run_type, model_map) + + # init session state variables: + if 'initialized' not in st.session_state: + st.session_state.messages = [] + st.session_state.current_model_path = None + st.session_state.current_local_path = None + st.session_state.current_hub_model = None + + if not is_local_path and not hf: + try: + with st.spinner(f"Loading model: {default_model}"): + st.session_state.nexa_model = load_model(default_model) + if st.session_state.nexa_model: + st.session_state.current_hub_model = default_model + except Exception as e: + st.error(f"Error loading default model: {str(e)}") + + # set to model hub 
option if not found in list: + if default_model not in st.session_state.model_options: + st.session_state.current_model_index = st.session_state.model_options.index("Use Model From Nexa Model Hub 🔍") + else: + try: + st.session_state.current_model_index = st.session_state.model_options.index(default_model) + except ValueError: + st.session_state.current_model_index = 0 + + st.session_state.initialized = True + + # model selection sidebar: + st.sidebar.header("Model Configuration") + + # update the selectbox index based on the currently loaded model: + if 'nexa_model' in st.session_state: + if st.session_state.current_hub_model: + # if we have a hub model loaded, select the hub option: + current_index = st.session_state.model_options.index("Use Model From Nexa Model Hub 🔍") + elif st.session_state.current_local_path: + # if we have a local model loaded, select the local option: + current_index = st.session_state.model_options.index("Local Model 📁") + elif st.session_state.current_model_path: + # if we have a listed model loaded, find its index: + current_index = st.session_state.model_options.index(st.session_state.current_model_path) + else: + current_index = st.session_state.current_model_index + else: + current_index = st.session_state.current_model_index + + model_path = st.sidebar.selectbox( + "Select a Model", + st.session_state.model_options, + index=current_index, + key='model_selectbox' + ) + + # update current model index when selection changes: + current_index = st.session_state.model_options.index(model_path) + if current_index != st.session_state.current_model_index: + st.session_state.current_model_index = current_index + if 'nexa_model' in st.session_state: + del st.session_state.nexa_model + st.session_state.messages = [] + st.session_state.current_model_path = None + st.session_state.current_local_path = None + st.session_state.current_hub_model = None + + # handle model loading based on selection: + if model_path == "Local Model 📁": + local_model_path = st.sidebar.text_input("Enter local model path") + if not local_model_path: + st.warning("Please enter a valid local model path to proceed.") + st.stop() + + local_model_path = local_model_path.strip() # remove spaces + if 'nexa_model' not in st.session_state or st.session_state.current_local_path != local_model_path: + with st.spinner("Loading local model..."): + st.session_state.nexa_model = load_local_model(local_model_path) + st.session_state.current_local_path = local_model_path + + elif model_path == "Use Model From Nexa Model Hub 🔍": + initial_value = default_model if not is_local_path and not hf else "" + hub_model_name = st.sidebar.text_input( + "Enter model name from Nexa Model Hub", + value=initial_value + ) + + # empty string check: + if not hub_model_name: + st.warning(f""" + How to add a model from Nexa Model Hub: + \n1. Visit [Nexa Model Hub](https://nexaai.com/models) + \n2. Find a NLP model using the task filters (chat, uncensored, etc.) + \n3. Select your desired model and copy either: + \n - The full nexa run command (e.g., nexa run Sao10K/MN-BackyardAI-Party-12B-v1:gguf-q4_K_M), or + \n - Simply the model name (e.g., Sao10K/MN-BackyardAI-Party-12B-v1:gguf-q4_K_M) + \n4. 
Paste it into the "Enter model name from Nexa Model Hub" field on the sidebar and press enter + """) + st.stop() + + # process the input after checking it's not empty: + if hub_model_name.startswith("nexa run"): + hub_model_name = hub_model_name.split("nexa run")[-1].strip() + else: + hub_model_name = hub_model_name.strip() + + if 'nexa_model' not in st.session_state or st.session_state.current_hub_model != hub_model_name: + with st.spinner("Loading model from hub..."): + st.session_state.nexa_model = load_model(hub_model_name) + if st.session_state.nexa_model: # only update if load was successful + st.session_state.current_hub_model = hub_model_name + + else: + # load selected model if it's not already loaded: + if ('nexa_model' not in st.session_state or + getattr(st.session_state, 'current_model_path', None) != model_path): + with st.spinner(f"Loading model: {model_path}"): + st.session_state.nexa_model = load_model(model_path) + if st.session_state.nexa_model: # only update if load was successful + st.session_state.current_model_path = model_path + + # generation params: + if 'nexa_model' in st.session_state and st.session_state.nexa_model: + st.sidebar.header("Generation Parameters") + model_params = st.session_state.nexa_model.params + + temperature = st.sidebar.slider( + "Temperature", 0.0, 1.0, model_params.get("temperature", DEFAULT_PARAMS["temperature"]) + ) + max_new_tokens = st.sidebar.slider( + "Max New Tokens", 1, 500, model_params.get("max_new_tokens", DEFAULT_PARAMS["max_new_tokens"]) + ) + top_k = st.sidebar.slider( + "Top K", 1, 100, model_params.get("top_k", DEFAULT_PARAMS["top_k"]) + ) + top_p = st.sidebar.slider( + "Top P", 0.0, 1.0, model_params.get("top_p", DEFAULT_PARAMS["top_p"]) + ) + nctx = st.sidebar.slider( + "Context length", 1000, 9999, model_params.get("nctx", DEFAULT_PARAMS["nctx"]) + ) + + st.session_state.nexa_model.params.update({ + "temperature": temperature, + "max_new_tokens": max_new_tokens, + "top_k": top_k, + "top_p": top_p, + "nctx": nctx, + }) + + # chat interface: + for message in st.session_state.messages: + with st.chat_message(message["role"]): + st.markdown(message["content"]) + + if prompt := st.chat_input("Say something..."): + if 'nexa_model' not in st.session_state or not st.session_state.nexa_model: + st.error("Please wait for the model to load or select a valid model.") + else: + st.session_state.messages.append({"role": "user", "content": prompt}) + with st.chat_message("user"): + st.markdown(prompt) + + with st.chat_message("assistant"): + response_placeholder = st.empty() + full_response = "" + for chunk in generate_response(st.session_state.nexa_model): + choice = chunk["choices"][0] + if "delta" in choice: + delta = choice["delta"] + content = delta.get("content", "") + elif "text" in choice: + delta = choice["text"] + content = delta + + full_response += content + response_placeholder.markdown(full_response, unsafe_allow_html=True) + response_placeholder.markdown(full_response) + + st.session_state.messages.append({"role": "assistant", "content": full_response}) -if "messages" not in st.session_state: - st.session_state.messages = [] - -for message in st.session_state.messages: - with st.chat_message(message["role"]): - st.markdown(message["content"]) - -if prompt := st.chat_input("Say something..."): - st.session_state.messages.append({"role": "user", "content": prompt}) - with st.chat_message("user"): - st.markdown(prompt) - - with st.chat_message("assistant"): - response_placeholder = st.empty() - full_response = "" - for 
chunk in generate_response(st.session_state.nexa_model): - choice = chunk["choices"][0] - if "delta" in choice: - delta = choice["delta"] - content = delta.get("content", "") - elif "text" in choice: - delta = choice["text"] - content = delta - - full_response += content - response_placeholder.markdown(full_response, unsafe_allow_html=True) - response_placeholder.markdown(full_response) - - st.session_state.messages.append({"role": "assistant", "content": full_response}) +except Exception as e: + st.error(f"An unexpected error occurred: {str(e)}") + import traceback + st.error(f"Traceback: {traceback.format_exc()}") diff --git a/nexa/gguf/streamlit/streamlit_vlm.py b/nexa/gguf/streamlit/streamlit_vlm.py index 25f48d0e..a581b167 100644 --- a/nexa/gguf/streamlit/streamlit_vlm.py +++ b/nexa/gguf/streamlit/streamlit_vlm.py @@ -1,40 +1,65 @@ import sys import tempfile -from typing import Iterator - +import subprocess +import re +from typing import List, Iterator import streamlit as st from PIL import Image from nexa.general import pull_model from nexa.gguf.nexa_inference_vlm import NexaVLMInference +from nexa.utils import ( + get_model_options, + update_model_options, +) +from nexa.constants import NEXA_RUN_MODEL_MAP_VLM -default_model = sys.argv[1] -is_local_path = False if sys.argv[2] == "False" else True -hf = False if sys.argv[3] == "False" else True -projector_local_path = sys.argv[4] if len(sys.argv) > 4 else None +specified_run_type = 'Multimodal' +model_map = NEXA_RUN_MODEL_MAP_VLM +# init from command line args: +try: + default_model = sys.argv[1] + is_local_path = sys.argv[2].lower() == "true" + hf = sys.argv[3].lower() == "true" + projector_local_path = sys.argv[4] if len(sys.argv) > 4 else None +except IndexError: + st.error("Missing required command line arguments.") + sys.exit(1) # terminate with an error -@st.cache_resource -def load_model(model_path): - if is_local_path: - local_path = model_path - elif hf: - local_path, _ = pull_model(model_path, hf=True) - else: - local_path, run_type = pull_model(model_path) - - if is_local_path: - nexa_model = NexaVLMInference(model_path=model_path, local_path=local_path, projector_local_path=projector_local_path) - else: - nexa_model = NexaVLMInference(model_path=model_path, local_path=local_path) - return nexa_model - +@st.cache_resource(show_spinner=False) +def load_model(model_path, is_local=False, is_hf=False, projector_path=None): + """Load model with model mapping logic.""" + try: + if is_local: + local_path = model_path + nexa_model = NexaVLMInference( + model_path=model_path, + local_path=local_path, + projector_local_path=projector_path + ) + elif is_hf: + local_path, _ = pull_model(model_path, hf=True) + nexa_model = NexaVLMInference(model_path=model_path, local_path=local_path) + else: + # get the actual model name from the mapping if it exists: + if model_path in NEXA_RUN_MODEL_MAP_VLM: + real_model_path = NEXA_RUN_MODEL_MAP_VLM[model_path] + local_path, run_type = pull_model(real_model_path) + else: + local_path, run_type = pull_model(model_path) + nexa_model = NexaVLMInference(model_path=model_path, local_path=local_path) + return nexa_model + except Exception as e: + st.error(f"Error loading model: {str(e)}") + return None def generate_response( nexa_model: NexaVLMInference, image_path: str, user_input: str ) -> Iterator: return nexa_model._chat(user_input, image_path) - +# UI setup: +st.set_page_config(page_title="Nexa AI Multimodal Generation", layout="wide") st.markdown( r""" + """, + unsafe_allow_html=True, +) 
+st.title("Nexa AI Omni VLM Generation") +st.caption("Powered by Nexa AI SDK🐙") + +st.sidebar.header("Model Configuration") +model_path = st.sidebar.text_input("Model path", default_model) + +if not model_path: + st.warning( + "Please enter a valid path or identifier for the model in Nexa Model Hub to proceed." + ) + st.stop() + +if ( + "current_model_path" not in st.session_state + or st.session_state.current_model_path != model_path +): + st.session_state.current_model_path = model_path + st.session_state.nexa_model = load_model(model_path) + if st.session_state.nexa_model is None: + st.stop() + +user_input = st.text_input("Enter your text input:") +uploaded_file = st.file_uploader("Upload an image", type=["png", "jpg", "jpeg"]) + +generate_button = st.button("Send") +spinner_placeholder = st.empty() +success_label = st.empty() +response_placeholder = st.empty() +image_placeholder = st.empty() + +if uploaded_file: + image_placeholder.image(uploaded_file, caption="Uploaded Image") + +if generate_button: + if not user_input and not uploaded_file: + st.warning("Please enter text input and upload an image to proceed.") + else: + with spinner_placeholder: + with st.spinner("Generating description..."): + with tempfile.NamedTemporaryFile() as image_path: + full_path = None + if uploaded_file: + ext = uploaded_file.name.split(".")[-1] + full_path = f"{image_path.name}.{ext}" + with Image.open(uploaded_file) as img: + img.save(full_path) + + response = generate_response( + st.session_state.nexa_model, full_path, user_input + ) + + response_placeholder.write(response) + success_label.success("Response generated successfully.") \ No newline at end of file diff --git a/nexa/gguf/streamlit/streamlit_voice_chat.py b/nexa/gguf/streamlit/streamlit_voice_chat.py index 77c4b3c1..750217f9 100644 --- a/nexa/gguf/streamlit/streamlit_voice_chat.py +++ b/nexa/gguf/streamlit/streamlit_voice_chat.py @@ -2,30 +2,56 @@ import os import sys import tempfile - -import librosa +import subprocess +import re +from typing import List import streamlit as st from st_audiorec import st_audiorec - from nexa.general import pull_model from nexa.gguf.nexa_inference_voice import NexaVoiceInference +from nexa.utils import ( + get_model_options, + update_model_options, +) +from nexa.constants import NEXA_RUN_MODEL_MAP_VOICE -default_model = sys.argv[1] -is_local_path = False if sys.argv[2] == "False" else True -hf = False if sys.argv[3] == "False" else True - +specified_run_type = 'Audio' +model_map = NEXA_RUN_MODEL_MAP_VOICE -@st.cache_resource -def load_model(model_path): - if is_local_path: - local_path = model_path - elif hf: - local_path, _ = pull_model(model_path, hf=True) - else: - local_path, run_type = pull_model(model_path) - nexa_model = NexaVoiceInference(model_path=model_path, local_path=local_path) - return nexa_model +# init from command line args: +try: + default_model = sys.argv[1] + is_local_path = sys.argv[2].lower() == "true" + hf = sys.argv[3].lower() == "true" +except IndexError: + st.error("Missing required command line arguments.") + sys.exit(1) # terminate with an error +@st.cache_resource(show_spinner=False) +def load_model(model_path, is_local=False, is_hf=False): + """Load model with model mapping logic.""" + try: + if is_local: + # for local paths, use the path directly: + nexa_model = NexaVoiceInference(model_path=model_path, local_path=model_path) + else: + # for non-local paths: + if is_hf: + local_path, _ = pull_model(model_path, hf=True) + nexa_model = NexaVoiceInference(model_path=model_path, 
local_path=local_path) + else: + # handle Model Hub models: + if model_path in NEXA_RUN_MODEL_MAP_VOICE: + real_model_path = NEXA_RUN_MODEL_MAP_VOICE[model_path] + local_path, _ = pull_model(real_model_path) + nexa_model = NexaVoiceInference(model_path=real_model_path, local_path=local_path) + else: + local_path, _ = pull_model(model_path) + nexa_model = NexaVoiceInference(model_path=model_path, local_path=local_path) + return nexa_model + except Exception as e: + st.error(f"Error loading model: {str(e)}") + return None def transcribe_audio(nexa_model, audio_file): with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_audio: @@ -50,105 +76,223 @@ def transcribe_audio(nexa_model, audio_file): finally: os.unlink(temp_audio_path) - +# UI setup: +st.set_page_config(page_title="Nexa AI Voice Transcription", layout="wide") st.title("Nexa AI Voice Transcription") st.caption("Powered by Nexa AI SDK🐙") +# force refresh model options on every page load: +if 'model_options' not in st.session_state: + st.session_state.model_options = get_model_options(specified_run_type, model_map) +else: + update_model_options(specified_run_type, model_map) + +# init session state variables: +if 'initialized' not in st.session_state: + st.session_state.model_options = get_model_options(specified_run_type, model_map) + st.session_state.current_model_path = default_model + st.session_state.current_local_path = None + st.session_state.current_hub_model = None + + # init with default model: + if is_local_path: + try: + with st.spinner(f"Loading local model: {default_model}"): + st.session_state.nexa_model = load_model( + default_model, + is_local=True, + is_hf=hf + ) + if st.session_state.nexa_model: + st.session_state.current_local_path = default_model + st.session_state.current_model_path = default_model + except Exception as e: + st.error(f"Error loading local model: {str(e)}") + elif hf: + try: + with st.spinner(f"Loading HuggingFace model: {default_model}"): + st.session_state.nexa_model = load_model(default_model, is_hf=True) + if st.session_state.nexa_model: + st.session_state.current_hub_model = default_model + st.session_state.current_model_path = default_model + except Exception as e: + st.error(f"Error loading HuggingFace model: {str(e)}") + + else: + try: + with st.spinner(f"Loading model: {default_model}"): + st.session_state.nexa_model = load_model(default_model) + if st.session_state.nexa_model: + st.session_state.current_model_path = default_model + st.session_state.current_hub_model = default_model + except Exception as e: + st.error(f"Error loading model: {str(e)}") + + st.session_state.initialized = True + +# model selection UI: st.sidebar.header("Model Configuration") -model_path = st.sidebar.text_input("Model path", default_model) - -if not model_path: - st.warning("Please enter a valid S3 model filename to proceed.") - st.stop() - -# Initialize or update the model when the path changes -if ( - "current_model_path" not in st.session_state - or st.session_state.current_model_path != model_path -): - st.session_state.current_model_path = model_path - st.session_state.nexa_model = load_model(model_path) - if st.session_state.nexa_model is None: - st.stop() -# Add sidebar options for new parameters -st.sidebar.header("Transcription Parameters") -beam_size = st.sidebar.slider( - "Beam Size", - 1, 10, - st.session_state.nexa_model.params["beam_size"] -) -task = st.sidebar.selectbox( - "Task", - ["transcribe", "translate"], - index=0 if st.session_state.nexa_model.params["task"] == 
"transcribe" else 1 -) -temperature = st.sidebar.slider( - "Temperature", - 0.0, 1.0, - st.session_state.nexa_model.params["temperature"], - step=0.1 +# update selectbox index based on current model: +current_index = st.session_state.model_options.index("Use Model From Nexa Model Hub 🔍") +if 'nexa_model' in st.session_state: + if st.session_state.current_model_path in st.session_state.model_options: + current_index = st.session_state.model_options.index(st.session_state.current_model_path) + elif st.session_state.current_hub_model: + current_index = st.session_state.model_options.index("Use Model From Nexa Model Hub 🔍") + elif st.session_state.current_local_path: + current_index = st.session_state.model_options.index("Local Model 📁") + +selected_option = st.sidebar.selectbox( + "Select a Model", + st.session_state.model_options, + index=current_index ) -# Update model parameters -st.session_state.nexa_model.params.update( - { +# handle model selection: +if selected_option == "Local Model 📁": + model_path = st.sidebar.text_input( + "Enter local model path", + value=st.session_state.current_local_path if hasattr(st.session_state, 'current_local_path') else "", + help="Enter the full path to your local model directory (e.g., /home/user/.cache/nexa/hub/official/model-name)" + ) + + if not model_path: + st.warning("Please enter a valid local model path to proceed.") + st.stop() + + if (not hasattr(st.session_state, 'current_local_path') or + st.session_state.current_local_path != model_path): + with st.spinner("Loading local model..."): + st.session_state.nexa_model = load_model( + model_path, # use the user input path + is_local=True, + is_hf=hf + ) + if st.session_state.nexa_model: + st.session_state.current_local_path = model_path + st.session_state.current_model_path = model_path + +elif selected_option == "Use Model From Nexa Model Hub 🔍": + model_path = st.sidebar.text_input( + "Enter model name from Nexa Model Hub", + value=st.session_state.current_hub_model if hasattr(st.session_state, 'current_hub_model') else default_model + ) + if not model_path: + st.warning(""" + How to add a model from Nexa Model Hub: + \n1. Visit [Nexa Model Hub](https://nexaai.com/models) + \n2. Find an audio model using the task filters + \n3. Select your desired model and copy either: + \n - The full nexa run command (e.g., nexa run faster-whisper-tiny:bin-cpu-fp16), or + \n - Simply the model name (e.g., faster-whisper-tiny:bin-cpu-fp16) + \n4. 
Paste it into the field on the sidebar and press enter + """) + st.stop() + + # process the input after checking it's not empty: + if model_path.startswith("nexa run"): + model_path = model_path.split("nexa run")[-1].strip() + + if (not hasattr(st.session_state, 'current_hub_model') or st.session_state.current_hub_model != model_path): + with st.spinner("Loading model from hub..."): + st.session_state.nexa_model = load_model(model_path, is_local=False, is_hf=False) + if st.session_state.nexa_model: + st.session_state.current_hub_model = model_path + st.session_state.current_model_path = model_path + st.session_state.current_local_path = None # clear local path state when switching to hub model + +else: + model_path = selected_option + if (not hasattr(st.session_state, 'current_model_path') or + st.session_state.current_model_path != model_path): + with st.spinner(f"Loading model: {model_path}"): + st.session_state.nexa_model = load_model(model_path, is_local=False, is_hf=False) + if st.session_state.nexa_model: + st.session_state.current_model_path = model_path + st.session_state.current_local_path = None + st.session_state.current_hub_model = None + +# only show transcription parameters if model is loaded: +if hasattr(st.session_state, 'nexa_model') and st.session_state.nexa_model: + # transcription parameters: + st.sidebar.header("Transcription Parameters") + beam_size = st.sidebar.slider( + "Beam Size", + 1, 10, + st.session_state.nexa_model.params["beam_size"] + ) + task = st.sidebar.selectbox( + "Task", + ["transcribe", "translate"], + index=0 if st.session_state.nexa_model.params["task"] == "transcribe" else 1 + ) + temperature = st.sidebar.slider( + "Temperature", + 0.0, 1.0, + st.session_state.nexa_model.params["temperature"], + step=0.1 + ) + + # update model parameters: + st.session_state.nexa_model.params.update({ "beam_size": beam_size, "task": task, "temperature": temperature, - } -) + }) -# Option 1: Upload Audio File -st.header("Option 1: Upload Audio File") -uploaded_file = st.file_uploader("Choose an audio file", type=["wav", "mp3"]) - -if uploaded_file is not None: - st.audio(uploaded_file, format="audio/wav") - - if st.button("Transcribe Uploaded Audio"): - with st.spinner("Transcribing audio..."): - transcription = transcribe_audio(st.session_state.nexa_model, uploaded_file) - - if transcription: - st.subheader("Transcription:") - st.write(transcription) - - # Provide a download button for the transcription - transcription_bytes = transcription.encode() - st.download_button( - label="Download Transcription", - data=transcription_bytes, - file_name="transcription.txt", - mime="text/plain", - ) - else: - st.error( - "Transcription failed. Please try again with a different audio file." - ) - -# Option 2: Real-time Recording -st.header("Option 2: Record Audio") -wav_audio_data = st_audiorec() - -if wav_audio_data: - if st.button("Transcribe Recorded Audio"): - with st.spinner("Transcribing audio..."): - transcription = transcribe_audio(st.session_state.nexa_model, io.BytesIO(wav_audio_data)) - - if transcription: - st.subheader("Transcription:") - st.write(transcription) - - # Provide a download button for the transcription - transcription_bytes = transcription.encode() - st.download_button( - label="Download Transcription", - data=transcription_bytes, - file_name="transcription.txt", - mime="text/plain", - ) - else: - st.error("Transcription failed. 
Please try recording again.") + # Option 1: Upload Audio File + st.header("Option 1: Upload Audio File") + uploaded_file = st.file_uploader("Choose an audio file", type=["wav", "mp3"]) + + if uploaded_file is not None: + st.audio(uploaded_file, format="audio/wav") + + if st.button("Transcribe Uploaded Audio"): + with st.spinner("Transcribing audio..."): + transcription = transcribe_audio(st.session_state.nexa_model, uploaded_file) + + if transcription: + st.subheader("Transcription:") + st.write(transcription) + + # Provide a download button for the transcription + transcription_bytes = transcription.encode() + st.download_button( + label="Download Transcription", + data=transcription_bytes, + file_name="transcription.txt", + mime="text/plain", + ) + else: + st.error( + "Transcription failed. Please try again with a different audio file." + ) + + # Option 2: Real-time Recording + st.header("Option 2: Record Audio") + wav_audio_data = st_audiorec() + + if wav_audio_data: + if st.button("Transcribe Recorded Audio"): + with st.spinner("Transcribing audio..."): + transcription = transcribe_audio(st.session_state.nexa_model, io.BytesIO(wav_audio_data)) + + if transcription: + st.subheader("Transcription:") + st.write(transcription) + + # Provide a download button for the transcription + transcription_bytes = transcription.encode() + st.download_button( + label="Download Transcription", + data=transcription_bytes, + file_name="transcription.txt", + mime="text/plain", + ) + else: + st.error("Transcription failed. Please try recording again.") + else: + st.warning("No audio recorded. Please record some audio before transcribing.") else: - st.warning("No audio recorded. Please record some audio before transcribing.") + st.warning("Please select or load a model to proceed.") diff --git a/nexa/onnx/nexa_inference_image.py b/nexa/onnx/nexa_inference_image.py index 8392aa31..b38be335 100644 --- a/nexa/onnx/nexa_inference_image.py +++ b/nexa/onnx/nexa_inference_image.py @@ -64,10 +64,8 @@ def __init__(self, model_path=None, local_path=None, **kwargs): self.params.update(kwargs) self.pipeline = None - def run(self): - if self.download_onnx_folder is None: - self.download_onnx_folder, run_type = pull_model(self.model_path, **kwargs) + self.download_onnx_folder, _ = pull_model(self.model_path, **kwargs) if self.download_onnx_folder is None: logging.error( @@ -76,17 +74,19 @@ def run(self): ) exit(1) - self._load_model(self.download_onnx_folder) + self._load_model() + + def run(self): self._dialogue_mode() @SpinningCursorAnimation() - def _load_model(self, model_path): + def _load_model(self): """ Load the model from the given model path using the appropriate pipeline. 
""" - logging.debug(f"Loading model from {model_path}") + logging.debug(f"Loading model from {self.download_onnx_folder}") try: - model_index_path = os.path.join(model_path, "model_index.json") + model_index_path = os.path.join(self.download_onnx_folder, "model_index.json") with open(model_index_path, "r") as index_file: model_index = json.load(index_file) @@ -96,7 +96,7 @@ def _load_model(self, model_path): PipelineClass = ORT_PIPELINES_MAPPING.get( pipeline_class_name, ORTStableDiffusionPipeline ) - self.pipeline = PipelineClass.from_pretrained(model_path) + self.pipeline = PipelineClass.from_pretrained(self.download_onnx_folder) logging.debug(f"Model loaded successfully using {pipeline_class_name}") except Exception as e: logging.error(f"Error loading model: {e}") diff --git a/nexa/onnx/nexa_inference_text.py b/nexa/onnx/nexa_inference_text.py index fdb6db5f..f9a767e9 100644 --- a/nexa/onnx/nexa_inference_text.py +++ b/nexa/onnx/nexa_inference_text.py @@ -53,9 +53,21 @@ def __init__(self, model_path=None, local_path=None, **kwargs): self.downloaded_onnx_folder = local_path self.timings = kwargs.get("timings", False) self.device = "cpu" + + if self.downloaded_onnx_folder is None: + self.downloaded_onnx_folder, _ = pull_model(self.model_path, **kwargs) + + if self.downloaded_onnx_folder is None: + logging.error( + f"Model ({model_path}) is not applicable. Please refer to our docs for proper usage.", + exc_info=True, + ) + exit(1) + + self._load_model_and_tokenizer() @SpinningCursorAnimation() - def _load_model_and_tokenizer(self) -> Tuple[Any, Any, Any, bool]: + def _load_model_and_tokenizer(self): logging.debug(f"Loading model from {self.downloaded_onnx_folder}") start_time = time.time() self.tokenizer = AutoTokenizer.from_pretrained(self.downloaded_onnx_folder) @@ -148,18 +160,6 @@ def run(self): if self.params.get("streamlit"): self.run_streamlit() else: - if self.downloaded_onnx_folder is None: - self.downloaded_onnx_folder, run_type = pull_model(self.model_path, **kwargs) - - if self.downloaded_onnx_folder is None: - logging.error( - f"Model ({model_path}) is not applicable. Please refer to our docs for proper usage.", - exc_info=True, - ) - exit(1) - - self._load_model_and_tokenizer() - if self.model is None or self.tokenizer is None or self.streamer is None: logging.error( "Failed to load model or tokenizer. Exiting.", exc_info=True diff --git a/nexa/onnx/nexa_inference_tts.py b/nexa/onnx/nexa_inference_tts.py index fb1f2f9a..26c6d3e4 100644 --- a/nexa/onnx/nexa_inference_tts.py +++ b/nexa/onnx/nexa_inference_tts.py @@ -50,8 +50,8 @@ def __init__(self, model_path=None, local_path=None, **kwargs): self.downloaded_onnx_folder = local_path if self.downloaded_onnx_folder is None: - self.downloaded_onnx_folder, run_type = pull_model(self.model_path, **kwargs) - + self.downloaded_onnx_folder, _ = pull_model(self.model_path, **kwargs) + if self.downloaded_onnx_folder is None: logging.error( f"Model ({model_path}) is not applicable. 
Please refer to our docs for proper usage.", @@ -69,12 +69,10 @@ def _load_model(self): logging.debug(f"Loading model from {self.downloaded_onnx_folder}") try: self.tokenizer = TTSTokenizer(self.config["token"]["list"]) - print(self.tokenizer) self.model = onnxruntime.InferenceSession( os.path.join(self.downloaded_onnx_folder, "model.onnx"), providers=["CPUExecutionProvider"], ) - print(self.model) logging.debug("Model and tokenizer loaded successfully") except Exception as e: logging.error(f"Error loading model or tokenizer: {e}") diff --git a/nexa/onnx/nexa_inference_voice.py b/nexa/onnx/nexa_inference_voice.py index e6d7d696..c0f56ab4 100644 --- a/nexa/onnx/nexa_inference_voice.py +++ b/nexa/onnx/nexa_inference_voice.py @@ -43,9 +43,8 @@ def __init__(self, model_path=None, local_path=None, **kwargs): self.model = None self.processor = None - def run(self): if self.downloaded_onnx_folder is None: - self.downloaded_onnx_folder, run_type = pull_model(self.model_path, **kwargs) + self.downloaded_onnx_folder, _ = pull_model(self.model_path, **kwargs) if self.downloaded_onnx_folder is None: logging.error( @@ -54,14 +53,16 @@ def run(self): ) exit(1) - self._load_model(self.downloaded_onnx_folder) + self._load_model() + + def run(self): self._dialogue_mode() - def _load_model(self, model_path): - logging.debug(f"Loading model from {model_path}") + def _load_model(self): + logging.debug(f"Loading model from {self.downloaded_onnx_folder}") try: - self.processor = AutoProcessor.from_pretrained(model_path) - self.model = ORTModelForSpeechSeq2Seq.from_pretrained(model_path) + self.processor = AutoProcessor.from_pretrained(self.downloaded_onnx_folder) + self.model = ORTModelForSpeechSeq2Seq.from_pretrained(self.downloaded_onnx_folder) logging.debug("Model and processor loaded successfully") except Exception as e: logging.error(f"Error loading model or processor: {e}") diff --git a/nexa/utils.py b/nexa/utils.py index e7761ece..28440cac 100644 --- a/nexa/utils.py +++ b/nexa/utils.py @@ -5,8 +5,97 @@ import time from functools import partial, wraps from importlib.metadata import PackageNotFoundError, distribution +from typing import Dict, List +import json +import logging +import streamlit as st +from nexa.constants import ( + EXIT_COMMANDS, + EXIT_REMINDER, + NEXA_MODEL_LIST_PATH, +) + + +def get_available_models() -> Dict[str, dict]: + """Get list of available computer vision (cv) models from the model list JSON file.""" + # check whether the model list file exists: + if not NEXA_MODEL_LIST_PATH.exists(): + st.error("Model list file not found") + return {} # empty dict + + try: + # read model list from the JSON file: + with open(NEXA_MODEL_LIST_PATH, "r") as f: + available_models = json.load(f) + return available_models + + except json.JSONDecodeError as e: + logging.error(f"Invalid JSON in model list file: {e}") + return {} + except Exception as e: + logging.error(f"Error loading available models: {e}") + return {} + + +def filter_available_models( + models: Dict[str, dict], + specified_run_type: str, + model_map: Dict[str, str] +) -> List[str]: + """Filter available models by run type and apply model mapping.""" + if not models: + return [] + + filtered_models = set() # to avoid duplicates + + for model_name, model_info in models.items(): + # skip if run_type doesn't match: + if model_info.get('run_type') != specified_run_type or 'projector' in model_name: + continue + + if model_name in model_map.values(): + # find short form from mapping: + for short_name, full_name in model_map.items(): + if 
full_name == model_name: + filtered_models.add(short_name) + break + else: + filtered_models.add(model_name) + + return sorted(list(filtered_models)) -from nexa.constants import EXIT_COMMANDS, EXIT_REMINDER + +def get_model_options( + specified_run_type: str, + model_map: Dict[str, str] +) -> List[str]: + """Get list of model options including special options.""" + available_models = get_available_models() + models_list = filter_available_models(available_models, specified_run_type, model_map) + # add special options at the end of the dropdown menu: + models_list.extend(["Use Model From Nexa Model Hub 🔍", "Local Model 📁"]) + return models_list + + +def update_model_options( + specified_run_type: str, + model_map: Dict[str, str] +) -> None: + """Update the model options in session state and force a refresh.""" + try: + fresh_options = get_model_options(specified_run_type, model_map) + st.session_state.model_options = fresh_options # update session state with new options + + if hasattr(st.session_state, 'current_model_path') and st.session_state.current_model_path: + if st.session_state.current_model_path in fresh_options: + st.session_state.current_model_index = fresh_options.index(st.session_state.current_model_path) + else: + # if current model not in list, reset to Model Hub option: + hub_index = fresh_options.index("Use Model From Nexa Model Hub 🔍") + st.session_state.current_model_index = hub_index + + except Exception as e: + logging.error(f"Error updating model options: {e}") def is_package_installed(package_name: str) -> bool: @@ -84,14 +173,14 @@ def nexa_prompt(placeholder: str = "Send a message ...") -> str: try: hint = light_text(placeholder) hint_length = len(strip_ansi(hint)) - + # Print the prompt with placeholder print(f">>> {hint}", end='', flush=True) - + # Move cursor back to the start of the line print('\r', end='', flush=True) print(">>> ", end='', flush=True) - + user_input = "" while True: char = msvcrt.getch().decode() @@ -108,7 +197,7 @@ def nexa_prompt(placeholder: str = "Send a message ...") -> str: else: user_input += char print(char, end='', flush=True) - + if len(user_input) == 1: # Clear hint after first character print('\r' + ' ' * (hint_length + 4), end='', flush=True) print(f'\r>>> {user_input}', end='', flush=True) diff --git a/pyproject.toml b/pyproject.toml index 071faca5..24b6ee35 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,5 +1,5 @@ [build-system] -requires = ["scikit-build-core"] +requires = ["scikit-build-core", "setuptools>=64.0"] build-backend = "scikit_build_core.build" [project] @@ -22,6 +22,7 @@ dependencies = [ "pydantic", "pillow", "huggingface_hub", + "modelscope", "prompt_toolkit", "tqdm", # Shared dependencies "tabulate", @@ -105,6 +106,7 @@ wheel.packages = [ "nexa.onnx.streamlit", "nexa.onnx.server", "nexa.eval", + "nexa.transformers", ] sdist.include = [ "CMakeLists.txt", diff --git a/requirements.txt b/requirements.txt index 978b8c1d..6e732a0e 100644 --- a/requirements.txt +++ b/requirements.txt @@ -19,6 +19,7 @@ pydantic pillow python-multipart huggingface_hub +modelscope # For onnx optimum[onnxruntime] # for CPU version diff --git a/swift/README.md b/swift/README.md new file mode 100644 index 00000000..0b284330 --- /dev/null +++ b/swift/README.md @@ -0,0 +1,84 @@ +# NexaSwift + +**NexaSwift** is a Swift wrapper for the [llama.cpp](https://github.com/ggerganov/llama.cpp.git) library. This repository provides a Swifty API, allowing Swift developers to easily integrate and use `llama.cpp` models in their projects. 
+**NOTE:** NexaSwift currently supports text inference only.
+
+## Installation
+
+To add NexaSwift to your Swift project, add the following dependency in your `Package.swift` file:
+
+```swift
+.package(url: "https://github.com/NexaAI/nexa-sdk.git", .branch("main"))
+```
+
+## Usage
+
+### 1. Initialize NexaSwift with a Model Path
+
+Create a configuration and initialize NexaSwift with the path to your model file:
+
+```swift
+let configuration = NexaSwift.Configuration(
+    maxNewToken: 128,
+    stopTokens: []
+)
+let modelPath = "path/to/your/model"
+let nexaSwift = try NexaSwift.NexaTextInference(modelPath: modelPath, modelConfiguration: configuration)
+```
+
+### 2. Chat Completion API
+
+#### Build messages
+
+```swift
+var messages: [ChatCompletionRequestMessage] = []
+let userMessage = ChatCompletionRequestMessage.user(
+    ChatCompletionRequestUserMessage(content: .text("user input"))
+)
+messages.append(userMessage)
+```
+
+#### Non-Streaming Mode
+
+In non-streaming mode, call `createChatCompletion` with your messages; the complete response is returned once generation finishes.
+
+```swift
+let response = try await nexaSwift.createChatCompletion(for: messages)
+print(response.choices[0].message.content ?? "")
+```
+
+#### Streaming Mode
+
+In streaming mode, you can process the response in real time as it is generated:
+
+```swift
+for try await response in await nexaSwift.createChatCompletionStream(for: messages) {
+    print(response.choices[0].delta.content ?? "")
+}
+```
+
+### 3. Completion API
+
+#### Non-Streaming Mode
+
+```swift
+let prompt = "your prompt text"
+if let response = try? await nexaSwift.createCompletion(for: prompt) {
+    print(response.choices[0].text)
+}
+```
+
+#### Streaming Mode
+
+```swift
+for try await response in await nexaSwift.createCompletionStream(for: prompt) {
+    print(response.choices[0].text)
+}
+```
+
+## Quick Start
+
+Open the [swift test project](../examples/swift-test/) folder in Xcode and run the project.
+
+## Download Models
+
+NexaSwift supports all models compatible with llama.cpp. You can download models from the [Nexa AI ModelHub](https://nexa.ai/models).
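+## End-to-End Example
+
+As a rough end-to-end sketch, the snippet below ties the pieces above together: it configures `NexaTextInference`, builds a single chat message, and streams the reply. The `@main` wrapper, the model path, and the prompt text are illustrative placeholders rather than part of the library; adapt them to your project.
+
+```swift
+import Foundation
+import NexaSwift
+
+@main
+struct ChatExample {
+    static func main() async throws {
+        // Generation settings; values here are illustrative defaults.
+        let configuration = NexaSwift.Configuration(
+            temperature: 0.7,
+            maxNewToken: 256,
+            stopTokens: []
+        )
+
+        // Path to a llama.cpp-compatible model file on disk (placeholder).
+        let modelPath = "path/to/your/model.gguf"
+        let nexaSwift = try NexaSwift.NexaTextInference(modelPath: modelPath, modelConfiguration: configuration)
+
+        // Build the conversation with a single user message.
+        var messages: [ChatCompletionRequestMessage] = []
+        messages.append(.user(
+            ChatCompletionRequestUserMessage(content: .text("Write a haiku about the ocean."))
+        ))
+
+        // Stream the chat completion and print each delta as it arrives.
+        for try await chunk in await nexaSwift.createChatCompletionStream(for: messages) {
+            print(chunk.choices[0].delta.content ?? "", terminator: "")
+        }
+        print()
+    }
+}
+```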
diff --git a/swift/Sources/NexaSwift/LlamaModel.swift b/swift/Sources/NexaSwift/LlamaModel.swift new file mode 100644 index 00000000..d8bc6f68 --- /dev/null +++ b/swift/Sources/NexaSwift/LlamaModel.swift @@ -0,0 +1,207 @@ +import Foundation +import llama + +class LlamaModel { + private let model: Model + public var configuration: Configuration + private let context: OpaquePointer + private var sampler: UnsafeMutablePointer + private var batch: Batch + private var tokens: [Token] + private var temporaryInvalidCChars: [CChar] = [] + private var generatedTokenAccount: Int32 = 0 + private var totalTokensProcessed: Int32 = 0 + private var ended = false + private let n_ctx: Int32 + public var arch: String { + return getModelDetails().arch + } + public var modelType: String { + return getModelDetails().modelType + } + public var modelFtype: String { + return getModelDetails().modelFtype + } + + var shouldContinue: Bool { + generatedTokenAccount < configuration.maxNewToken && !ended + } + + public func reset() { + generatedTokenAccount = 0 + ended = false + } + + init(path: String, configuration: Configuration = .init()) throws { + self.configuration = configuration + llama_backend_init() + llama_numa_init(GGML_NUMA_STRATEGY_DISABLED) + var model_params = llama_model_default_params() + #if os(iOS) || targetEnvironment(simulator) + model_params.n_gpu_layers = 0 + #endif + guard let model = llama_load_model_from_file(path, model_params) else { + throw NexaSwiftError.others("Cannot load model at path \(path)") + } + + self.model = model + + guard let context = llama_new_context_with_model(model, configuration.contextParameters) else { + throw NexaSwiftError.others("Cannot load model context") + } + self.context = context + self.n_ctx = Int32(llama_n_ctx(context)) + self.tokens = [] + self.sampler = llama_sampler_chain_init(llama_sampler_chain_default_params()) + self.batch = llama_batch_init(configuration.nTokens, 0, 1) + try checkContextLength() + } + + public func updateSampler() { + self.sampler = llama_sampler_chain_init(llama_sampler_chain_default_params()) + llama_sampler_chain_add(sampler, llama_sampler_init_temp(configuration.temperature)) + llama_sampler_chain_add(sampler, llama_sampler_init_top_k(configuration.topK)) + llama_sampler_chain_add(sampler, llama_sampler_init_top_p(configuration.topP, 1)) + llama_sampler_chain_add(sampler, llama_sampler_init_softmax()) + llama_sampler_chain_add(sampler, llama_sampler_init_dist(configuration.seed)) + } + + private func checkContextLength() throws { + let n_ctx_train = llama_n_ctx_train(model) + if n_ctx > n_ctx_train { + throw NexaSwiftError.others("Model was trained on \(n_ctx_train) context but tokens \(n_ctx) specified") + } + } + + private func getModelDetails() -> (arch: String, modelType: String, modelFtype: String) { + let bufSize = 256 + var buf = [CChar](repeating: 0, count: bufSize) + let result = llama_model_desc(model, &buf, bufSize) + + if result > 0 { + let modelDesc = String(cString: buf) + let components = modelDesc.components(separatedBy: " ") + let arch = components[0] ?? "Unknown" + let modelType = components[1] ?? "Unknown" + let modelFtype = components[2] ?? 
"Unknown" + return (arch, modelType, modelFtype) + } else { + return ("Unknown", "Unknown", "Unknown") + } + } + + func start(for prompt: String) throws { +// print("arch: \(arch), modelType: \(modelType), modelFtype: \(modelFtype)") + updateSampler() + ended = false + tokens = tokenize(text: prompt, addBos: true) + + // Check for token length + if tokens.count > n_ctx { + let originalCount = tokens.count + tokens = Array(tokens.prefix(Int(n_ctx))) + print(""" + WARNING: Input tokens (\(originalCount)) exceed context length (\(n_ctx)). + Truncating to first \(n_ctx) tokens. Some content at the end will be ignored. + Consider splitting your input into smaller chunks for better results. + """) + } + + temporaryInvalidCChars = [] + batch.clear() + + tokens.enumerated().forEach { index, token in + batch.add(token: token, position: Int32(index), seqIDs: [0], logit: false) + } + batch.logits[Int(batch.n_tokens) - 1] = 1 + + if llama_decode(context, batch) != 0 { + throw NexaSwiftError.decodeError + } + generatedTokenAccount = 0 + totalTokensProcessed = batch.n_tokens + } + + func `continue`() throws -> String { + if totalTokensProcessed >= n_ctx { + print("WARNING: Reached maximum context length (\(n_ctx)). Stopping generation.") + temporaryInvalidCChars.removeAll() + ended = true + return "" + } + + let newToken = llama_sampler_sample(sampler, context, batch.n_tokens - 1) + + if llama_token_is_eog(model, newToken) { + temporaryInvalidCChars.removeAll() + ended = true + return "" + } + + + let newTokenCChars = tokenToCChars(token: newToken) + temporaryInvalidCChars.append(contentsOf: newTokenCChars) + + let newTokenStr: String + if let validString = String(validating: temporaryInvalidCChars + [0], as: UTF8.self) { + newTokenStr = validString + temporaryInvalidCChars.removeAll() + } else if let suffixIndex = temporaryInvalidCChars.firstIndex(where: { $0 != 0 }), + let validSuffix = String(validating: Array(temporaryInvalidCChars.suffix(from: suffixIndex)) + [0], + as: UTF8.self) { + newTokenStr = validSuffix + temporaryInvalidCChars.removeAll() + } else { + newTokenStr = "" + } + + batch.clear() + batch.add(token: newToken, position: totalTokensProcessed, seqIDs: [0], logit: true) + generatedTokenAccount += 1 + totalTokensProcessed += 1 + + if llama_decode(context, batch) != 0 { + throw NexaSwiftError.decodeError + } + return newTokenStr.filter { $0 != "\0" } + } + + private func tokenToCChars(token: llama_token) -> [CChar] { + var length: Int32 = 8 + var piece = Array(repeating: 0, count: Int(length)) + + let nTokens = llama_token_to_piece(model, token, &piece, length, 0, false) + if nTokens >= 0 { + return Array(piece.prefix(Int(nTokens))) + } else { + length = -nTokens + piece = Array(repeating: 0, count: Int(length)) + let nNewTokens = llama_token_to_piece(model, token, &piece, length, 0, false) + return Array(piece.prefix(Int(nNewTokens))) + } + } + + private func tokenize(text: String, addBos: Bool) -> [Token] { + let utf8Count = text.utf8.count + let n_tokens = utf8Count + (addBos ? 
1 : 0) + 1 + + return Array(unsafeUninitializedCapacity: n_tokens) { buffer, initializedCount in + initializedCount = Int( + llama_tokenize(model, text, Int32(utf8Count), buffer.baseAddress, Int32(n_tokens), addBos, false) + ) + } + } + + func clear() { + tokens.removeAll() + temporaryInvalidCChars.removeAll() + llama_kv_cache_clear(context) + } + + deinit { + llama_batch_free(batch) + llama_free(context) + llama_free_model(model) + llama_backend_free() + } +} diff --git a/swift/Sources/NexaSwift/Models/Batch.swift b/swift/Sources/NexaSwift/Models/Batch.swift new file mode 100644 index 00000000..ca784716 --- /dev/null +++ b/swift/Sources/NexaSwift/Models/Batch.swift @@ -0,0 +1,23 @@ +import Foundation +import llama + +extension Batch { + mutating func clear() { + self.n_tokens = 0 + } + + mutating func add(token: Token, + position: Position, + seqIDs: [SeqID], + logit: Bool) { + let nextIndex = Int(n_tokens) + self.token[nextIndex] = token + self.pos[nextIndex] = position + self.n_seq_id[nextIndex] = Int32(seqIDs.count) + seqIDs.enumerated().forEach { index, id in + seq_id[nextIndex]?[index] = id + } + self.logits[nextIndex] = logit ? 1 : 0 + self.n_tokens += 1 + } +} diff --git a/swift/Sources/NexaSwift/Models/ChatCompletionMessage.swift b/swift/Sources/NexaSwift/Models/ChatCompletionMessage.swift new file mode 100644 index 00000000..bae89664 --- /dev/null +++ b/swift/Sources/NexaSwift/Models/ChatCompletionMessage.swift @@ -0,0 +1,517 @@ +import Foundation + + +public struct ChatCompletionRequestSystemMessage: Codable { + public var role: Role = .system + public let content: String? + + public init(content: String?) { + self.content = content + } +} + +public struct ChatCompletionRequestUserMessage: Codable { + public var role: Role = .user + public let content: UserMessageContent + + public init(content: UserMessageContent) { + self.content = content + } +} + +public enum UserMessageContent: Codable { + case text(String) + case image(ImageContent) + + enum CodingKeys: String, CodingKey { + case type, text, imageUrl + } + + enum ContentType: String, Codable { + case text + case imageUrl + } + + public init(from decoder: Decoder) throws { + let container = try decoder.container(keyedBy: CodingKeys.self) + let type = try container.decode(ContentType.self, forKey: .type) + + switch type { + case .text: + let text = try container.decode(String.self, forKey: .text) + self = .text(text) + case .imageUrl: + let imageUrl = try container.decode(ImageContent.self, forKey: .imageUrl) + self = .image(imageUrl) + } + } + + public func encode(to encoder: Encoder) throws { + var container = encoder.container(keyedBy: CodingKeys.self) + switch self { + case .text(let text): + try container.encode(ContentType.text, forKey: .type) + try container.encode(text, forKey: .text) + case .image(let imageUrl): + try container.encode(ContentType.imageUrl, forKey: .type) + try container.encode(imageUrl, forKey: .imageUrl) + } + } +} + +public struct ImageContent: Codable { + public let url: String + public let detail: String? + + public init(url: String, detail: String? = nil) { + self.url = url + self.detail = detail + } +} + +public struct ChatCompletionRequestAssistantMessage: Codable { + public var role: Role = .assistant + public let content: String? + public let toolCalls: [ChatCompletionMessageToolCall]? + public let functionCall: ChatCompletionRequestAssistantMessageFunctionCall? + + public init(content: String?, toolCalls: [ChatCompletionMessageToolCall]? 
= nil, functionCall: ChatCompletionRequestAssistantMessageFunctionCall? = nil) { + self.content = content + self.toolCalls = toolCalls + self.functionCall = functionCall + } +} + +public struct ChatCompletionRequestToolMessage: Codable { + public var role: Role = .tool + public let content: String? + public let toolCallID: String + + public init(content: String?, toolCallID: String) { + self.content = content + self.toolCallID = toolCallID + } +} + +public struct ChatCompletionRequestFunctionMessage: Codable { + public var role: Role = .function + public let content: String? + public let name: String + + public init(content: String?, name: String) { + self.content = content + self.name = name + } +} + +public struct ChatCompletionRequestAssistantMessageFunctionCall: Codable { + public let name: String + public let arguments: String + + public init(name: String, arguments: String) { + self.name = name + self.arguments = arguments + } +} + + +class ChatFormatterRegistry { + private var formatters = [String: ChatFormatter]() + + init() { + register(name: ChatCompletionModel.octopusv2.rawValue, formatter: OctopusV2Formatter()) + register(name: ChatCompletionModel.llama.rawValue, formatter: LlamaFormatter()) + register(name: ChatCompletionModel.llama3.rawValue, formatter: Llama3Formatter()) + register(name: ChatCompletionModel.gemma.rawValue, formatter: GemmaFormatter()) + register(name: ChatCompletionModel.qwen.rawValue, formatter: QwenFormatter()) + register(name: ChatCompletionModel.mistral.rawValue, formatter: MistralFormatter()) + } + + func register(name: String, formatter: ChatFormatter) { + formatters[name] = formatter + } + + func getFormatter(name: String?) -> ChatFormatter? { + return formatters[getFormatterName(name: name)] + } + + func getFormatterName(name: String?) -> String { + return name ?? ChatCompletionModel.llama.rawValue + } +} + +//formatter +public struct ChatFormatterResponse { + let prompt: String + let stop: [String] +} + +public protocol ChatFormatter { + func format(messages: [ChatCompletionRequestMessage]) -> ChatFormatterResponse +} + + +class OctopusV2Formatter: ChatFormatter { + private let systemMessage = """ + Below is the query from the users, please call the correct function and generate the parameters to call the function. + + """ + private let separator = "\n\n" + + func format(messages: [ChatCompletionRequestMessage]) -> ChatFormatterResponse { + var formattedMessages = mapRoles(messages: messages) + + // Assuming the last message should be the assistant's response + formattedMessages.append(("Response:", nil)) + + var prompt = systemMessage + for (role, content) in formattedMessages { + if let content = content { + prompt += "\(role) \(content.trimmingCharacters(in: .whitespacesAndNewlines))\(separator)" + } else { + prompt += "\(role) " + } + } + + return ChatFormatterResponse(prompt: prompt.trimmingCharacters(in: .whitespacesAndNewlines), stop: [separator]) + } + + private func mapRoles(messages: [ChatCompletionRequestMessage]) -> [(String, String?)] { + var mappedMessages = [(String, String?)]() + let roleMapping: [Role: String] = [ + .user: "Query:", + .assistant: "Response:" + ] + + for message in messages { + var rolePrefix = "" + var content: String? = nil + + switch message { + case .system(let systemMessage): + // Include system message if necessary + continue + case .user(let userMessage): + rolePrefix = roleMapping[.user] ?? 
"Query:" + switch userMessage.content { + case .text(let text): + content = text + case .image(let imageContent): + content = imageContent.detail ?? imageContent.url + } + case .assistant(let assistantMessage): + rolePrefix = roleMapping[.assistant] ?? "Response:" + content = assistantMessage.content + case .tool(let toolMessage): + rolePrefix = "Tool:" + content = toolMessage.content + case .function(let functionMessage): + rolePrefix = "Function:" + content = functionMessage.content + } + + mappedMessages.append((rolePrefix, content)) + } + + return mappedMessages + } +} + + +//https://www.llama.com/docs/model-cards-and-prompt-formats/meta-llama-2/ +class LlamaFormatter: ChatFormatter { + private let systemTemplate = "<>\n{system_message}\n<>\n\n" + private let roles: [String: String] = [ + "user": "[INST] ", + "assistant": " [/INST] " + ] + private let endToken = "" + + func format(messages: [ChatCompletionRequestMessage]) -> ChatFormatterResponse { + let formattedMessages = mapRoles(messages: messages) + let systemMessage = getSystemMessage(messages) + let formattedSystemMessage = systemMessage.map { msg in + systemTemplate.replacingOccurrences(of: "{system_message}", with: msg) + } + let prompt = formatPrompt(systemMessage: formattedSystemMessage, messages: formattedMessages) + return ChatFormatterResponse(prompt: prompt, stop: [endToken]) + } + + private func getSystemMessage(_ messages: [ChatCompletionRequestMessage]) -> String? { + for message in messages { + if case .system(let systemMessage) = message { + return systemMessage.content + } + } + return nil + } + + private func mapRoles(messages: [ChatCompletionRequestMessage]) -> [(String, String?)] { + return messages.compactMap { message in + switch message { + case .system: + return nil + case .user(let userMessage): + let content: String? + switch userMessage.content { + case .text(let text): + content = text + case .image(let imageContent): + content = imageContent.detail + } + return (roles["user"] ?? "", content) + case .assistant(let assistantMessage): + return (roles["assistant"] ?? "", assistantMessage.content) + case .tool, .function: + return nil + } + } + } + + private func formatPrompt(systemMessage: String?, messages: [(String, String?)]) -> String { + var conversations: [String] = [] + var currentConversation = "" + + for (index, (role, content)) in messages.enumerated() { + if index % 2 == 0 { // User message + if !currentConversation.isEmpty { + conversations.append(currentConversation + " " + endToken) + } + currentConversation = role // [INST] + if index == 0 && systemMessage != nil { + currentConversation += systemMessage! + content! + } else { + currentConversation += content ?? "" + } + } else { // Assistant message + if let content = content { + currentConversation += role + content // [/INST] response + } + } + } + + // Add the last conversation if it's a user message without response + if messages.count % 2 != 0 { + currentConversation += roles["assistant"]! 
+            conversations.append(currentConversation)
+        } else if !currentConversation.isEmpty {
+            conversations.append(currentConversation + endToken)
+        }
+
+        return conversations.joined(separator: "\n")
+    }
+}
+
+//https://www.llama.com/docs/model-cards-and-prompt-formats/meta-llama-3/
+class Llama3Formatter: ChatFormatter {
+    private let roles: [String: String] = [
+        "system": "<|start_header_id|>system<|end_header_id|>\n\n",
+        "user": "<|start_header_id|>user<|end_header_id|>\n\n",
+        "assistant": "<|start_header_id|>assistant<|end_header_id|>\n\n"
+    ]
+    private let endToken = "<|eot_id|>"
+
+    func format(messages: [ChatCompletionRequestMessage]) -> ChatFormatterResponse {
+        var formattedMessages = mapRoles(messages: messages)
+
+        formattedMessages.append((roles["assistant"] ?? "", nil))
+
+        let prompt = formatPrompt(formattedMessages)
+
+        return ChatFormatterResponse(prompt: prompt, stop: [endToken])
+    }
+
+    private func mapRoles(messages: [ChatCompletionRequestMessage]) -> [(String, String?)] {
+        return messages.map { message in
+            var rolePrefix = ""
+            var content: String? = ""
+
+            switch message {
+            case .system(let systemMessage):
+                rolePrefix = roles["system"] ?? ""
+                content = systemMessage.content
+            case .user(let userMessage):
+                rolePrefix = roles["user"] ?? ""
+                switch userMessage.content {
+                case .text(let text):
+                    content = text
+                case .image(let imageContent):
+                    content = imageContent.detail
+                }
+            case .assistant(let assistantMessage):
+                rolePrefix = roles["assistant"] ?? ""
+                content = assistantMessage.content
+            case .tool(let toolMessage):
+                rolePrefix = roles["tool"] ?? ""
+                content = toolMessage.content
+            case .function(let functionMessage):
+                rolePrefix = roles["function"] ?? ""
+                content = functionMessage.content
+            }
+
+            return (rolePrefix, content)
+        }
+    }
+
+    private func formatPrompt(_ formattedMessages: [(String, String?)]) -> String {
+        var prompt = "<|begin_of_text|>"
+        for (role, content) in formattedMessages {
+            if let content = content {
+                prompt += "\(role)\(content.trimmingCharacters(in: .whitespacesAndNewlines))\(endToken)"
+            } else {
+                prompt += "\(role) "
+            }
+        }
+        return prompt.trimmingCharacters(in: .whitespacesAndNewlines)
+    }
+}
+
+
+//https://ai.google.dev/gemma/docs/formatting
+class GemmaFormatter: ChatFormatter {
+    private let roles: [String: String] = [
+        "user": "<start_of_turn>user\n",
+        "assistant": "<start_of_turn>model\n"
+    ]
+
+    private let endToken = "<end_of_turn>"
+    private let separator = "<end_of_turn>\n"
+
+    func format(messages: [ChatCompletionRequestMessage]) -> ChatFormatterResponse {
+        var formattedMessages = mapRoles(messages: messages)
+        formattedMessages.append((roles["assistant"]!, nil))
+        let prompt = formatPrompt(formattedMessages)
+
+        return ChatFormatterResponse(prompt: prompt, stop: [endToken])
+    }
+
+    private func mapRoles(messages: [ChatCompletionRequestMessage]) -> [(String, String?)] {
+        return messages.compactMap { message in
+            switch message {
+            case .system:
+                return nil
+            case .user(let userMessage):
+                let content: String?
+                switch userMessage.content {
+                case .text(let text):
+                    content = text
+                case .image(let imageContent):
+                    content = imageContent.detail
+                }
+                return (roles["user"] ?? "", content)
+            case .assistant(let assistantMessage):
+                return (roles["assistant"] ?? "", assistantMessage.content)
+            case .tool, .function:
+                return nil
+            }
+        }
+    }
+
+    private func formatPrompt(_ formattedMessages: [(String, String?)]) -> String {
+        var prompt = ""
+
+        for (index, (role, content)) in formattedMessages.enumerated() {
+            if index == formattedMessages.count - 1 {
+                prompt += role
+            } else if let content = content {
+                prompt += "\(role)\(content)\(separator)"
+            }
+        }
+        return prompt.trimmingCharacters(in: .whitespacesAndNewlines)
+    }
+}
+
+// https://qwen.readthedocs.io/zh-cn/latest/getting_started/concepts.html#control-tokens-chat-template
+class QwenFormatter: ChatFormatter {
+    private let roles: [String: String] = [
+        "user": "<|im_start|>user",
+        "assistant": "<|im_start|>assistant"
+    ]
+
+    private let systemTemplate = "<|im_start|>system\n{system_message}"
+    private let defaultSystemMessage = "You are a helpful assistant."
+    private let separator = "<|im_end|>"
+    private let endToken = "<|endoftext|>"
+
+    func format(messages: [ChatCompletionRequestMessage]) -> ChatFormatterResponse {
+        let systemMessage = formatSystemMessage()
+        var formattedMessages = mapRoles(messages: messages)
+        formattedMessages.append((roles["assistant"]!, nil))
+        let prompt = formatChatML(systemMessage: systemMessage, messages: formattedMessages)
+        return ChatFormatterResponse(prompt: prompt, stop: [endToken])
+    }
+
+    private func formatSystemMessage() -> String {
+        return systemTemplate.replacingOccurrences(of: "{system_message}", with: defaultSystemMessage)
+    }
+
+    private func mapRoles(messages: [ChatCompletionRequestMessage]) -> [(String, String?)] {
+        return messages.compactMap { message in
+            switch message {
+            case .user(let userMessage):
+                let content: String?
+                switch userMessage.content {
+                case .text(let text):
+                    content = text
+                case .image(let imageContent):
+                    content = imageContent.detail
+                }
+                return (roles["user"]!, content)
+            case .assistant(let assistantMessage):
+                return (roles["assistant"]!, assistantMessage.content)
+            case .system, .tool, .function:
+                return nil
+            }
+        }
+    }
+
+    private func formatChatML(systemMessage: String, messages: [(String, String?)]) -> String {
+        var prompt = systemMessage.isEmpty ? "" : "\(systemMessage)\(separator)\n"
+        for (role, content) in messages {
+            if let content = content {
+                prompt += "\(role)\n\(content)\(separator)\n"
+            } else {
+                prompt += "\(role)\n"
+            }
+        }
+        return prompt.trimmingCharacters(in: .whitespacesAndNewlines)
+    }
+}
+
+// https://www.promptingguide.ai/models/mistral-7b#chat-template-for-mistral-7b-instruct
+class MistralFormatter: ChatFormatter {
+    private let endToken = "</s>"
+    private let conversationStart = "<s>"
+    private let instructStart = "[INST] "
+    private let instructEnd = " [/INST] "
+
+    func format(messages: [ChatCompletionRequestMessage]) -> ChatFormatterResponse {
+        var prompt = conversationStart // Add only once at the start
+
+        for (index, message) in messages.enumerated() {
+            switch message {
+            case .user(let userMessage):
+                switch userMessage.content {
+                case .text(let text):
+                    prompt += "\(instructStart)\(text)"
+                case .image:
+                    continue
+                }
+
+            case .assistant(let assistantMessage):
+                if let content = assistantMessage.content {
+                    prompt += "\(instructEnd)\(content)\(endToken)"
+                }
+            default:
+                continue
+            }
+        }
+
+        // Add instructEnd if the last message was from user (waiting for AI response)
+        if messages.last.map({ if case .user = $0 { return true } else { return false } }) ??
false { + prompt += instructEnd + } + + return ChatFormatterResponse(prompt: prompt, stop: [endToken]) + } +} diff --git a/swift/Sources/NexaSwift/Models/ChatCompletionResponse.swift b/swift/Sources/NexaSwift/Models/ChatCompletionResponse.swift new file mode 100644 index 00000000..396dba5c --- /dev/null +++ b/swift/Sources/NexaSwift/Models/ChatCompletionResponse.swift @@ -0,0 +1,91 @@ +import Foundation + + +public struct ChatCompletionMessageToolCallFunction: Codable { + public let name: String + public let arguments: String + + public init(name: String, arguments: String) { + self.name = name + self.arguments = arguments + } +} + +public struct ChatCompletionMessageToolCall: Codable { + public let id: String + public var type: Role = .function + public let function: ChatCompletionMessageToolCallFunction + + public init(id: String, function: ChatCompletionMessageToolCallFunction) { + self.id = id + self.function = function + } +} + +public struct ChatCompletionResponseFunctionCall:Codable{ + public let name: String + public let arguments: String +} + +public struct ChatCompletionResponseMessage: Codable{ + public let content: String? + public let toolCalls: [ChatCompletionMessageToolCall]? + public let role: String? + public let functionCall: ChatCompletionResponseFunctionCall? +} + +public struct ChatCompletionResponseChoice: Codable{ + public let index: Int + public let message: ChatCompletionResponseMessage + public let logprobs: CompletionLogprobs? + public let finishReason: FinishReason? +} + +public struct ChatCompletionResponse: Codable { + public let id: String + public let object: String + public let created: Int + public let model: String + public let choices: [ChatCompletionResponseChoice] + public let usage: CompletionUsage? + + enum CodingKeys: String, CodingKey { + case id + case object + case created + case model + case choices + case usage + } +} + +public struct ChatCompletionStreamResponseDelta: Codable { + public var content: String? + public var functionCall: ChatCompletionStreamResponseDeltaFunctionCall? // DEPRECATED + public var toolCalls: [ChatCompletionMessageToolCallChunk]? + public var role: Role? + +} + +public struct ChatCompletionStreamResponseDeltaFunctionCall: Codable { + +} + +public struct ChatCompletionMessageToolCallChunk: Codable { + +} + +public struct ChatCompletionStreamResponseChoice: Codable { + public var index: Int + public var delta: ChatCompletionStreamResponseDelta + public var finishReason: FinishReason? + public var logprobs: CompletionLogprobs? 
+} + +public struct CreateChatCompletionStreamResponse: Codable { + public var id: String + public var model: String + public var object: String + public var created: Int + public var choices: [ChatCompletionStreamResponseChoice] +} diff --git a/swift/Sources/NexaSwift/Models/Common.swift b/swift/Sources/NexaSwift/Models/Common.swift new file mode 100644 index 00000000..56cb371c --- /dev/null +++ b/swift/Sources/NexaSwift/Models/Common.swift @@ -0,0 +1,28 @@ +public enum Role: String, Codable { + case system + case user + case assistant + case tool + case function +} + +public enum ChatCompletionRequestMessage { + case system(ChatCompletionRequestSystemMessage) + case user(ChatCompletionRequestUserMessage) + case assistant(ChatCompletionRequestAssistantMessage) + case tool(ChatCompletionRequestToolMessage) + case function(ChatCompletionRequestFunctionMessage) +} + +public enum FinishReason: String, Codable { + case stop, length, toolCalls = "tool_calls", functionCall = "function_call" +} + +public enum ChatCompletionModel: String, Codable { + case octopusv2 + case llama + case llama3 + case gemma + case qwen + case mistral +} diff --git a/swift/Sources/NexaSwift/Models/CompletionResponse.swift b/swift/Sources/NexaSwift/Models/CompletionResponse.swift new file mode 100644 index 00000000..b3d16519 --- /dev/null +++ b/swift/Sources/NexaSwift/Models/CompletionResponse.swift @@ -0,0 +1,52 @@ +import Foundation + +public struct CompletionUsage: Codable { + public let promptTokens: Int + public let completionTokens: Int + public let totalTokens: Int + + enum CodingKeys: String, CodingKey { + case promptTokens = "prompt_tokens" + case completionTokens = "completion_tokens" + case totalTokens = "total_tokens" + } +} + +public struct CompletionLogprobs: Codable { + public let textOffset: [Int]? + public let tokenLogprobs: [Float?]? + public let tokens: [String]? + public let topLogprobs: [Dictionary?]? +} + +public struct CompletionChoice: Codable { + public let text: String + public let index: Int + public let logprobs: CompletionLogprobs? + public let finishReason: FinishReason? + + enum CodingKeys: String, CodingKey { + case text + case index + case logprobs + case finishReason = "finish_reason" + } +} + +public struct CompletionResponse: Codable { + public let id: String + public let object: String + public let created: Int + public let model: String + public let choices: [CompletionChoice] + public let usage: CompletionUsage? + + enum CodingKeys: String, CodingKey { + case id + case object + case created + case model + case choices + case usage + } +} diff --git a/swift/Sources/NexaSwift/Models/Configuration.swift b/swift/Sources/NexaSwift/Models/Configuration.swift new file mode 100644 index 00000000..b8c3757c --- /dev/null +++ b/swift/Sources/NexaSwift/Models/Configuration.swift @@ -0,0 +1,53 @@ +import Foundation +import llama + +public struct Configuration { + public var nTokens:Int32 + public var embd: Int32 + public var nSeqMax: Int32 + public var seed: UInt32 + public var topK: Int32 + public var topP: Float + public var nCTX: Int + public var temperature: Float + public var maxNewToken: Int + public var batchSize: Int + public var stopTokens: [String] + + public init( + nTokens:Int32 = 2048, + embd:Int32 = 512, + nSeqMax:Int32 = 2, + seed: UInt32 = 1234, + topK: Int32 = 50, + topP: Float = 1.0, + nCTX: Int = 2048, + temperature: Float = 0.7, + batchSize: Int = 2048, + stopSequence: String? 
= nil, + maxNewToken: Int = 128, + stopTokens: [String] = []) { + self.nTokens = nTokens + self.embd = embd + self.nSeqMax = nSeqMax + self.seed = seed + self.topK = topK + self.topP = topP + self.nCTX = nCTX + self.batchSize = batchSize + self.temperature = temperature + self.maxNewToken = maxNewToken + self.stopTokens = stopTokens + } +} + +extension Configuration { + var contextParameters: ContextParameters { + var params = llama_context_default_params() + let processorCount = max(1, min(16, ProcessInfo.processInfo.processorCount - 2)) + params.n_ctx = max(8, UInt32(self.nCTX)) // minimum context size is 8 + params.n_threads = Int32(processorCount) + params.n_threads_batch = Int32(processorCount) + return params + } +} diff --git a/swift/Sources/NexaSwift/Models/SwiftLlamaError.swift b/swift/Sources/NexaSwift/Models/SwiftLlamaError.swift new file mode 100644 index 00000000..37c04296 --- /dev/null +++ b/swift/Sources/NexaSwift/Models/SwiftLlamaError.swift @@ -0,0 +1,6 @@ +import Foundation + +public enum NexaSwiftError: Error { + case decodeError + case others(String) +} diff --git a/swift/Sources/NexaSwift/Models/TypeAlias.swift b/swift/Sources/NexaSwift/Models/TypeAlias.swift new file mode 100644 index 00000000..4711efc8 --- /dev/null +++ b/swift/Sources/NexaSwift/Models/TypeAlias.swift @@ -0,0 +1,10 @@ +import Foundation +import llama + +typealias Batch = llama_batch +typealias Model = OpaquePointer +typealias Context = OpaquePointer +typealias Token = llama_token +typealias Position = llama_pos +typealias SeqID = llama_seq_id +typealias ContextParameters = llama_context_params diff --git a/swift/Sources/NexaSwift/NexaSwiftActor.swift b/swift/Sources/NexaSwift/NexaSwiftActor.swift new file mode 100644 index 00000000..b295dc71 --- /dev/null +++ b/swift/Sources/NexaSwift/NexaSwiftActor.swift @@ -0,0 +1,6 @@ +import Foundation + +@globalActor +public actor NexaSwiftActor { + public static let shared = NexaSwiftActor() +} diff --git a/swift/Sources/NexaSwift/NexaTextInference.swift b/swift/Sources/NexaSwift/NexaTextInference.swift new file mode 100644 index 00000000..7c137bc7 --- /dev/null +++ b/swift/Sources/NexaSwift/NexaTextInference.swift @@ -0,0 +1,362 @@ +import Foundation +import llama +import Combine + +public class NexaTextInference { + private let model: LlamaModel + private let modelPath: String + private var generatedTokenCache = "" + private var contentStarted = false + private let chatFormatterRegistry: ChatFormatterRegistry + + var maxLengthOfStopToken: Int { + model.configuration.stopTokens.map { $0.count }.max() ?? 0 + } + + public init(modelPath: String, + modelConfiguration: Configuration = .init()) throws { + if modelPath.isEmpty { + throw NSError(domain: "InvalidParameterError", code: 400, userInfo: [NSLocalizedDescriptionKey: "Either modelPath or localPath must be provided."]) + } + self.model = try LlamaModel(path: modelPath, configuration: modelConfiguration) + self.modelPath = modelPath + self.chatFormatterRegistry = .init() + } + + private func updateConfiguration( + temperature: Float?, + maxNewToken: Int?, + topK: Int32?, + topP: Float?, + stopTokens: [String]? 
+ ) { + if let temperature = temperature { + model.configuration.temperature = temperature + } + if let maxNewToken = maxNewToken { + model.configuration.maxNewToken = maxNewToken + } + if let topK = topK { + model.configuration.topK = topK + } + if let topP = topP { + model.configuration.topP = topP + } + if let stopTokens = stopTokens { + model.configuration.stopTokens = stopTokens + } + } + + private func getFormatterForModel() -> ChatFormatter? { + let modelArch = model.arch.lowercased() + let lowerModelPath = modelPath.lowercased() + + let modelType: ChatCompletionModel? = { + switch modelArch { + case _ where modelArch.contains("gemma"): + // For Gemma-based models, check the model path + if lowerModelPath.contains("octopus-v2") || lowerModelPath.contains("octopusv2") { + return .octopusv2 + } else { + return .gemma + } + case _ where modelArch.contains("qwen"): + return .qwen + case _ where modelArch.contains("llama"): + // For Llama-based models, check the model path + if lowerModelPath.contains("llama-2") || lowerModelPath.contains("llama2") { + return .llama + } else if lowerModelPath.contains("llama-3") || lowerModelPath.contains("llama3") { + return .llama3 + } else if lowerModelPath.contains("mistral") { + return .mistral + } else { + // If can't determine specific version, default to Llama2 + print("Warning: Unable to determine specific Llama model version from path: \(modelPath). Defaulting to Llama2 format.") + return .llama + } + default: + print("Warning: Unknown model architecture: \(modelArch). Defaulting to Llama2 format.") + return .llama + } + }() + + return chatFormatterRegistry.getFormatter(name: modelType?.rawValue) + } + + private func isStopToken() -> Bool { + model.configuration.stopTokens.reduce(false) { partialResult, stopToken in + generatedTokenCache.hasSuffix(stopToken) + } + } + + private func response(for prompt: String, output: (String) -> Void, finish: () -> Void) { + func finaliseOutput() { + model.configuration.stopTokens.forEach { + generatedTokenCache = generatedTokenCache.replacingOccurrences(of: $0, with: "") + } + output(generatedTokenCache) + finish() + generatedTokenCache = "" + } + defer { model.clear() } + do { + try model.start(for: prompt) + while model.shouldContinue { + var delta = try model.continue() + if contentStarted { // remove the prefix empty spaces + if needToStop(after: delta, output: output) { + finish() + break + } + } else { + delta = delta.trimmingCharacters(in: .whitespacesAndNewlines) + if !delta.isEmpty { + contentStarted = true + if needToStop(after: delta, output: output) { + finish() + break + } + } + } + } + finaliseOutput() + } catch { + finaliseOutput() + } + } + + private func needToStop(after delta: String, output: (String) -> Void) -> Bool { + guard maxLengthOfStopToken > 0 else { + output(delta) + return false + } + generatedTokenCache += delta + + if generatedTokenCache.count >= maxLengthOfStopToken * 2 { + if let stopToken = model.configuration.stopTokens.first(where: { generatedTokenCache.contains($0) }), + let index = generatedTokenCache.range(of: stopToken) { + let outputCandidate = String(generatedTokenCache[.. AsyncThrowingStream { + return .init { continuation in + Task { + response(for: prompt) { [weak self] delta in + continuation.yield(delta) + } finish: { [weak self] in + continuation.finish() + } + } + } + } + + @NexaSwiftActor + public func createCompletion( + for prompt: String, + temperature: Float? = nil, + maxNewToken: Int? = nil, + topK: Int32? = nil, + topP: Float? 
= nil, + stopTokens: [String]? = nil) async throws -> CompletionResponse { + updateConfiguration( + temperature: temperature, + maxNewToken: maxNewToken, + topK: topK, + topP: topP, + stopTokens: stopTokens + ) + model.reset() + var result = "" + for try await value in await run(for: prompt) { + result += value + } + + let completionResponse = CompletionResponse( + id: UUID().uuidString, + object: "text_completion", + created: Int(Date().timeIntervalSince1970), + model: "", + choices: [ + CompletionChoice( + text: result, + index: 0, + logprobs: nil, + finishReason: FinishReason.stop + ) + ], + usage: CompletionUsage( + promptTokens: 0, + completionTokens: 0, + totalTokens: 0 + ) + ) + return completionResponse + } + + @NexaSwiftActor + public func createCompletionStream( + for prompt: String, + temperature: Float? = nil, + maxNewToken: Int? = nil, + topK: Int32? = nil, + topP: Float? = nil, + stopTokens: [String]? = nil) -> AsyncThrowingStream { + updateConfiguration( + temperature: temperature, + maxNewToken: maxNewToken, + topK: topK, + topP: topP, + stopTokens: stopTokens + ) + model.reset() + return .init { continuation in + Task { + var index = 0 + response(for: prompt) { text in + let completionResponse = CompletionResponse( + id: UUID().uuidString, + object: "text_completion", + created: Int(Date().timeIntervalSince1970), + model: "", + choices: [ + CompletionChoice( + text: text, + index: 0, + logprobs: nil, + finishReason: FinishReason.stop + ) + ], + usage: CompletionUsage( + promptTokens: 0, + completionTokens: 0, + totalTokens: 0 + ) + ) + + index += 1 + continuation.yield(completionResponse) + } finish: { + continuation.finish() + } + } + } + } + + @NexaSwiftActor + public func createChatCompletion( + for messages: [ChatCompletionRequestMessage], + temperature: Float? = nil, + maxNewToken: Int? = nil, + topK: Int32? = nil, + topP: Float? = nil, + stopTokens: [String]? = nil, + modelType: ChatCompletionModel? = nil) async throws -> ChatCompletionResponse { + let formatter = modelType.map { chatFormatterRegistry.getFormatter(name: $0.rawValue) } ?? getFormatterForModel() + let chatFormatter: ChatFormatterResponse? = formatter?.format(messages: messages) + // let chatFormatter: ChatFormatterResponse? = chatFormatterRegistry.getFormatter(name: modelType?.rawValue)?.format(messages: messages) ?? nil + updateConfiguration( + temperature: temperature, + maxNewToken: maxNewToken, + topK: topK, + topP: topP, + stopTokens: stopTokens ?? (!model.configuration.stopTokens.isEmpty ? model.configuration.stopTokens : chatFormatter?.stop) ?? nil + ) + model.reset() + + var result = "" + for try await value in await run(for: chatFormatter?.prompt ?? "") { + result += value + } + + let response = ChatCompletionResponse( + id: UUID().uuidString, + object: "chat.completion", + created: Int(Date().timeIntervalSince1970), + model: chatFormatterRegistry.getFormatterName(name: modelType?.rawValue), + choices: [ + ChatCompletionResponseChoice( + index: 0, + message: ChatCompletionResponseMessage( + content: result, + toolCalls: nil, + role: nil, + functionCall: nil + ), + logprobs: nil, + finishReason: FinishReason.stop + ) + ], + usage: nil + ) + + return response + } + + @NexaSwiftActor + public func createChatCompletionStream( + for messages: [ChatCompletionRequestMessage], + temperature: Float? = nil, + maxNewToken: Int? = nil, + topK: Int32? = nil, + topP: Float? = nil, + stopTokens: [String]? = nil, + modelType: ChatCompletionModel? 
= nil + ) -> AsyncThrowingStream { + model.reset() + let formatter = modelType.map { chatFormatterRegistry.getFormatter(name: $0.rawValue) } ?? getFormatterForModel() + let chatFormatter: ChatFormatterResponse? = formatter?.format(messages: messages) +// let chatFormatter: ChatFormatterResponse? = chatFormatterRegistry.getFormatter(name: modelType?.rawValue)?.format(messages: messages) ?? nil + updateConfiguration( + temperature: temperature, + maxNewToken: maxNewToken, + topK: topK, + topP: topP, + stopTokens: stopTokens ?? (!model.configuration.stopTokens.isEmpty ? model.configuration.stopTokens : chatFormatter?.stop) ?? nil + ) + return .init { continuation in + Task { + var index = 0 + response(for: chatFormatter?.prompt ?? "") { text in + let response = CreateChatCompletionStreamResponse( + id: UUID().uuidString, + model: chatFormatterRegistry.getFormatterName(name: modelType?.rawValue), + object: "chat.completion.chunk", + created: Int(Date().timeIntervalSince1970), + choices: [ + ChatCompletionStreamResponseChoice( + index: index, + delta: ChatCompletionStreamResponseDelta( + content: text, + functionCall: nil, + toolCalls: nil, + role: nil + ), + finishReason: FinishReason.stop, + logprobs: nil + ) + ] + ) + + index += 1 + continuation.yield(response) + } finish: { + continuation.finish() + } + } + } + } +} diff --git a/swift/Tests/NexaSwiftTests/NexaSwiftTests.swift b/swift/Tests/NexaSwiftTests/NexaSwiftTests.swift new file mode 100644 index 00000000..9661ba10 --- /dev/null +++ b/swift/Tests/NexaSwiftTests/NexaSwiftTests.swift @@ -0,0 +1,6 @@ +import XCTest +@testable import NexaSwift + +final class NexaSwiftTests: XCTestCase { + +} diff --git a/tests/test_tts_generation.py b/tests/test_tts_generation.py index a03195d1..2dc9c526 100644 --- a/tests/test_tts_generation.py +++ b/tests/test_tts_generation.py @@ -1,22 +1,24 @@ -from nexa.gguf import NexaTTSInference +# Temporarily disabled since version v0.0.9.3 -def test_tts_generation(): - tts = NexaTTSInference( - model_path="bark-small", - local_path=None, - n_threads=4, - seed=42, - sampling_rate=24000, - verbosity=1 - ) +# from nexa.gguf import NexaTTSInference + +# def test_tts_generation(): +# tts = NexaTTSInference( +# model_path="bark-small", +# local_path=None, +# n_threads=4, +# seed=42, +# sampling_rate=24000, +# verbosity=2 +# ) - # Generate audio from prompt - prompt = "Hello, this is a test of the Bark text to speech system." - audio_data = tts.audio_generation(prompt) +# # Generate audio from prompt +# prompt = "Hello, this is a test of the Bark text to speech system." +# audio_data = tts.audio_generation(prompt) - # Save the generated audio - tts._save_audio(audio_data, tts.sampling_rate, "tts_output") - print("TTS generation test completed successfully!") +# # Save the generated audio +# tts._save_audio(audio_data, tts.sampling_rate, "tts_output") +# print("TTS generation test completed successfully!") -if __name__ == "__main__": - test_tts_generation() \ No newline at end of file +# if __name__ == "__main__": +# test_tts_generation() \ No newline at end of file