Skip to content

Commit c4d44a5

Browse files
committed
setting n_ctx to 0
1 parent 0d027cf commit c4d44a5

File tree

1 file changed

+1
-0
lines changed

1 file changed

+1
-0
lines changed

ai_worker/main.py

+1
Original file line number | Diff line number | Diff line change
@@ -292,6 +292,7 @@ async def load_model(self, name):
292 | 292

293 | 293
settings = LlamaSettings(model=model_path, n_gpu_layers=await self.guess_layers(model_path), seed=-1,
294 | 294
embedding=True, cache=True, port=8181,
295 +
n_ctx=0,
295 | 296
main_gpu=self.conf.main_gpu, tensor_split=sp)
296 | 297
self.llama = create_llama_app(settings)
297 | 298
assert self.llama, "Load llama failed. Try lowering layers."

0 commit comments

Comments
 (0)