diff --git a/dependency/llama.cpp b/dependency/llama.cpp index ed459776..5859733c 160000 --- a/dependency/llama.cpp +++ b/dependency/llama.cpp @@ -1 +1 @@ -Subproject commit ed459776811d0928ce55a001e9e5a6bc3bf22ca4 +Subproject commit 5859733cb86dbd61091a8045203b33df056e536a diff --git a/nexa/__init__.py b/nexa/__init__.py index af51d3c5..d526f5d5 100644 --- a/nexa/__init__.py +++ b/nexa/__init__.py @@ -1 +1 @@ -__version__ = "0.0.9.6" +__version__ = "0.0.9.7" diff --git a/nexa/constants.py b/nexa/constants.py index 51d6e051..5f6beb69 100644 --- a/nexa/constants.py +++ b/nexa/constants.py @@ -127,9 +127,11 @@ class ModelType(Enum): "Qwen2-Audio-7.8B-Instruct:q6_K": "Qwen2-Audio-7.8B-Instruct:model-q6_K", "Qwen2-Audio-7.8B-Instruct:q8_0": "Qwen2-Audio-7.8B-Instruct:model-q8_0", "Qwen2-Audio-7.8B-Instruct:fp16": "Qwen2-Audio-7.8B-Instruct:model-fp16", - "omniaudio": "omniaudio:model-fp16", - "omniaudio:fp16": "omniaudio:model-fp16", - "omniaudio:q4_0": "omniaudio:model-q4_0", + "omniaudio": "OmniAudio-2.6B:model-q4_K_M", + "OmniAudio-2.6B:fp16": "OmniAudio-2.6B:model-fp16", + "OmniAudio-2.6B:q8_0": "OmniAudio-2.6B:model-q8_0", + "OmniAudio-2.6B:q4_K_M": "OmniAudio-2.6B:model-q4_K_M", + "OmniAudio-2.6B:q4_0": "OmniAudio-2.6B:model-q4_0", } NEXA_RUN_MODEL_MAP_VOICE = { @@ -188,8 +190,10 @@ class ModelType(Enum): "omnivision-preview": "omnivision-preview:projector-fp16", "omnivision-preview:fp16": "omnivision-preview:projector-fp16", "omnivision-preview:q4_0": "omnivision-preview:projector-q4_0", + "omnivlm": "omniVLM:projector-fp16", "omniVLM": "omniVLM:projector-fp16", "omniVLM:fp16": "omniVLM:projector-fp16", + "omniVLM:q8_0": "omniVLM:projector-q8_0", "omnivision-ocr": "omnivision-ocr:projector-fp16", "omnivision-ocr:fp16": "omnivision-ocr:projector-fp16", } @@ -198,8 +202,10 @@ class ModelType(Enum): "omnivision-preview": "omnivision-preview:model-fp16", "omnivision-preview:fp16": "omnivision-preview:model-fp16", "omnivision-preview:q4_0": "omnivision-preview:model-q4_0", + "omnivlm": "omniVLM:model-fp16", "omniVLM": "omniVLM:model-fp16", "omniVLM:fp16": "omniVLM:model-fp16", + "omniVLM:q8_0": "omniVLM:model-q8_0", "omnivision-ocr": "omnivision-ocr:model-fp16", "omnivision-ocr:fp16": "omnivision-ocr:model-fp16", } @@ -221,9 +227,11 @@ class ModelType(Enum): "Qwen2-Audio-7.8B-Instruct:q6_K": "Qwen2-Audio-7.8B-Instruct:projector-q6_K", "Qwen2-Audio-7.8B-Instruct:q8_0": "Qwen2-Audio-7.8B-Instruct:projector-q8_0", "Qwen2-Audio-7.8B-Instruct:fp16": "Qwen2-Audio-7.8B-Instruct:projector-fp16", - "omniaudio": "omniaudio:projector-fp16", - "omniaudio:fp16": "omniaudio:projector-fp16", - "omniaudio:q4_0": "omniaudio:projector-q4_0", + "omniaudio": "OmniAudio-2.6B:projector-q4_K_M", + "OmniAudio-2.6B:fp16": "OmniAudio-2.6B:projector-fp16", + "OmniAudio-2.6B:q8_0": "OmniAudio-2.6B:projector-q8_0", + "OmniAudio-2.6B:q4_K_M": "OmniAudio-2.6B:projector-q4_K_M", + "OmniAudio-2.6B:q4_0": "OmniAudio-2.6B:projector-q4_0", } NEXA_RUN_T5XXL_MAP = { @@ -468,8 +476,8 @@ class ModelType(Enum): "llava-v1.6-vicuna-7b": ModelType.MULTIMODAL, "llava-phi-3-mini": ModelType.MULTIMODAL, "llava-llama-3-8b-v1.1": ModelType.MULTIMODAL, - "omniaudio": ModelType.AUDIOLM, "Qwen2-Audio-7.8B-Instruct": ModelType.AUDIOLM, + "OmniAudio-2.6B": ModelType.AUDIOLM, "faster-whisper-tiny.en": ModelType.AUDIO, "faster-whisper-tiny": ModelType.AUDIO, "faster-whisper-small.en": ModelType.AUDIO,