Skip to content

Commit 9cb513e

Browse files
committed
0.3.4
1 parent 5e79c15 commit 9cb513e

File tree

3 files changed: 37 additions and 38 deletions.
Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
 
-DEFAULT_MODEL = "QuantFactory/Meta-Llama-3-8B-Instruct-GGUF"
+DEFAULT_MODEL = "NousResearch/Hermes-2-Pro-Llama-3-8B-GGUF"
 DEFAULT_QUANT_LARGE = "*Q8_0.gguf"
-DEFAULT_QUANT_BALANCED = "*Q4_K_M.gguf"
+DEFAULT_QUANT_BALANCED = "*Q5_K_M.gguf"
 DEFAULT_QUANT_SMALL = "*Q2_K.gguf"
 DEFAULT_TEMPERATURE = 0.0
 DEFAULT_MAX_RETRIES = 8

poetry.lock

Lines changed: 33 additions & 32 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

pyproject.toml

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "bpm-ai-inference"
-version = "0.3.3"
+version = "0.3.4"
 description = "Inference and server for local AI implementations of bpm-ai-core abstractions."
 authors = ["Bennet Krause <bennet.krause@holisticon.de>"]
 repository = "https://github.com/holunda-io/bpm-ai-inference"
@@ -23,9 +23,7 @@ optimum = {extras = ["onnxruntime"], version = "^1.18.0"}
 gliner = "^0.1.6"
 scipy = "1.10.1"
 py-cpuinfo = "^9.0.0"
-llama-cpp-python = "^0.2.65"
-#fast-fit = "^1.2.0"
-#jupyter = "^1.0.0"
+llama-cpp-python = "^0.2.69"
 
 
 [tool.poetry.group.test.dependencies]

0 commit comments

Comments
 (0)