diff --git a/dependency/llama.cpp b/dependency/llama.cpp index 20b9f02c..b535cd94 160000 --- a/dependency/llama.cpp +++ b/dependency/llama.cpp @@ -1 +1 @@ -Subproject commit 20b9f02cee483d09d15832c35e6117e5a020f517 +Subproject commit b535cd941e657ac1984d8022dd5f0c98f2b9e265 diff --git a/nexa/constants.py b/nexa/constants.py index 04ec51fb..67511eaa 100644 --- a/nexa/constants.py +++ b/nexa/constants.py @@ -112,6 +112,7 @@ class ModelType(Enum): NEXA_RUN_MODEL_MAP_AUDIO_LM = { "qwen2audio": "Qwen2-Audio-7.8B-Instruct:model-q4_0", "Qwen2-Audio-7.8B-Instruct:fp16": "Qwen2-Audio-7.8B-Instruct:model-fp16", + "Qwen2-Audio-7.8B-Instruct:q8_0": "Qwen2-Audio-7.8B-Instruct:model-q8_0", "Qwen2-Audio-7.8B-Instruct:q4_0": "Qwen2-Audio-7.8B-Instruct:model-q4_0", "omniaudio": "Octo-omni-audio:model-fp16", "Octo-omni-audio:fp16": "Octo-omni-audio:model-fp16", @@ -185,6 +186,7 @@ class ModelType(Enum): NEXA_RUN_AUDIO_LM_PROJECTOR_MAP = { "qwen2audio": "Qwen2-Audio-7.8B-Instruct:projector-q4_0", "Qwen2-Audio-7.8B-Instruct:fp16": "Qwen2-Audio-7.8B-Instruct:projector-fp16", + "Qwen2-Audio-7.8B-Instruct:q8_0": "Qwen2-Audio-7.8B-Instruct:projector-q8_0", "Qwen2-Audio-7.8B-Instruct:q4_0": "Qwen2-Audio-7.8B-Instruct:projector-q4_0", "omniaudio": "Octo-omni-audio:projector-fp16", "Octo-omni-audio:fp16": "Octo-omni-audio:projector-fp16",