Skip to content

Commit 37f6553

Browse files
committed
update llama_cpp_python version
1 parent dfdd4f7 commit 37f6553

File tree

3 files changed

+21
-15
lines changed

3 files changed

+21
-15
lines changed

ai_worker/main.py

+2-2
Original file line number | Diff line number | Diff line change
@@ -262,9 +262,9 @@ async def guess_layers(self, model_path):
262262
return max(0, est_layers - self.conf.layer_offset)
263263

264264
def clear_llama_model(self):
265-
if llama_cpp.server.app.llama:
265+
if llama_cpp.server.app._llama_proxy:
266266
# critical... must del this before creating a new app
267-
llama_cpp.server.app.llama = None
267+
llama_cpp.server.app._llama_proxy = None
268268

269269
self.llama = None
270270
self.llama_cli = None

poetry.lock

+18-12
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

pyproject.toml

+1-1
Original file line number | Diff line number | Diff line change
@@ -9,7 +9,7 @@ packages = [{include = "ai_worker"}, {include = "gguf_loader"}]
99

1010
[tool.poetry.dependencies]
1111
python = ">=3.10,<3.12"
12-
llama-cpp-python = {extras = ["server"], version = "0.2.7"}
12+
llama-cpp-python = {version = "0.2.53", extras = ["server"]}
1313
pydantic-settings = "^2.0.3"
1414
fastapi = "^0.103.1"
1515
websockets = "^11.0.3"

0 commit comments

Comments
 (0)