Skip to content

Commit

Permalink
0.3.4
Browse files Browse the repository at this point in the history
  • Loading branch information
Benjoyo committed May 3, 2024
1 parent 5e79c15 commit 9cb513e
Show file tree
Hide file tree
Showing 3 changed files with 37 additions and 38 deletions.
4 changes: 2 additions & 2 deletions bpm_ai_inference/llm/llama_cpp/_constants.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@

-DEFAULT_MODEL = "QuantFactory/Meta-Llama-3-8B-Instruct-GGUF"
+DEFAULT_MODEL = "NousResearch/Hermes-2-Pro-Llama-3-8B-GGUF"
DEFAULT_QUANT_LARGE = "*Q8_0.gguf"
-DEFAULT_QUANT_BALANCED = "*Q4_K_M.gguf"
+DEFAULT_QUANT_BALANCED = "*Q5_K_M.gguf"
DEFAULT_QUANT_SMALL = "*Q2_K.gguf"
DEFAULT_TEMPERATURE = 0.0
DEFAULT_MAX_RETRIES = 8
65 changes: 33 additions & 32 deletions poetry.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

6 changes: 2 additions & 4 deletions pyproject.toml
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
[tool.poetry]
name = "bpm-ai-inference"
-version = "0.3.3"
+version = "0.3.4"
description = "Inference and server for local AI implementations of bpm-ai-core abstractions."
authors = ["Bennet Krause <[email protected]>"]
repository = "https://github.com/holunda-io/bpm-ai-inference"
Expand All @@ -23,9 +23,7 @@ optimum = {extras = ["onnxruntime"], version = "^1.18.0"}
gliner = "^0.1.6"
scipy = "1.10.1"
py-cpuinfo = "^9.0.0"
-llama-cpp-python = "^0.2.65"
-#fast-fit = "^1.2.0"
-#jupyter = "^1.0.0"
+llama-cpp-python = "^0.2.69"


[tool.poetry.group.test.dependencies]
Expand Down

0 comments on commit 9cb513e

Please sign in to comment.