diff --git a/poetry.lock b/poetry.lock
index f9f972ef6e3fc63a24ecebe6337f69ca519bf80f..a6d4c7d7cd3d0c90c26e95b6b101431f2191bd7d 100644
--- a/poetry.lock
+++ b/poetry.lock
@@ -2269,12 +2269,12 @@ files = [
 
 [[package]]
 name = "llama-cpp-python"
-version = "0.2.87"
+version = "0.2.85"
 description = "Python bindings for the llama.cpp library"
 optional = true
 python-versions = ">=3.8"
 files = [
-    {file = "llama_cpp_python-0.2.87.tar.gz", hash = "sha256:4dff585f533131aa44b7d9e79a62d60172f317aef15d7bf4bafeb074b55a48c4"},
+    {file = "llama_cpp_python-0.2.85.tar.gz", hash = "sha256:31476c2f4331784d3681f9bcd366cc4666ba97ab128bffbd23cb90ee2cebff21"},
 ]
 
 [package.dependencies]
@@ -5382,4 +5382,4 @@ vision = ["pillow", "torch", "torchvision", "transformers"]
 [metadata]
 lock-version = "2.0"
 python-versions = ">=3.9,<3.13"
-content-hash = "13067697a82e75e7e3e9211d99a2e5a7971b9d57b9a71c81a97fb72881847499"
+content-hash = "32e1158d0742323cf5e3a7262ceec1229829d80df399caa62b5b693bc430932a"
diff --git a/pyproject.toml b/pyproject.toml
index f70227a05337d8da0c0e127e0aab51391f4c5396..82dca612cf7b20245dfedcdb97efeef549f0ddad 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -29,7 +29,7 @@ pinecone-text = {version = ">=0.7.1,<0.10.0", optional = true}
 torch = {version = ">=2.1.0,<2.6.0", optional = true}
 transformers = {version = ">=4.36.2", optional = true}
 tokenizers = {version = ">=0.19", optional = true}
-llama-cpp-python = {version = "^0.2.28", optional = true}
+llama-cpp-python = {version = ">=0.2.28,<0.2.86", optional = true}
 colorama = "^0.4.6"
 pinecone-client = {version=">=3.0.0,<4.0.0", optional = true}
 regex = ">=2023.12.25"