diff --git a/libs/ragulate/colbert_chunk_size_and_k.py b/libs/ragulate/colbert_chunk_size_and_k.py index 6a602f25d..a7956cb59 100644 --- a/libs/ragulate/colbert_chunk_size_and_k.py +++ b/libs/ragulate/colbert_chunk_size_and_k.py @@ -25,8 +25,8 @@ batch_size = 640 -astra_token = os.getenv("ASTRA_DB_TOKEN") -database_id = os.getenv("ASTRA_DB_ID") +astra_token = os.environ["ASTRA_DB_TOKEN"] +database_id = os.environ["ASTRA_DB_ID"] keyspace = "colbert" @@ -38,7 +38,7 @@ def get_embedding_model(chunk_size: int) -> ColbertEmbeddingModel: - return ColbertEmbeddingModel(doc_maxlen=chunk_size, batch_size=batch_size) + return ColbertEmbeddingModel(doc_maxlen=chunk_size, chunk_batch_size=batch_size) def get_database(chunk_size: int) -> CassandraDatabase: diff --git a/libs/ragulate/poetry.lock b/libs/ragulate/poetry.lock index f375b67fa..1f423e750 100644 --- a/libs/ragulate/poetry.lock +++ b/libs/ragulate/poetry.lock @@ -3817,13 +3817,13 @@ files = [ [[package]] name = "ragstack-ai-colbert" -version = "1.0.5" +version = "1.0.6" description = "DataStax RAGStack Colbert implementation" optional = false -python-versions = "<3.13,>=3.9" +python-versions = "<4.0,>=3.9" files = [ - {file = "ragstack_ai_colbert-1.0.5-py3-none-any.whl", hash = "sha256:d496cc6469e67894cd6ba755ee649c0315154d752429e0f53f221a67c06d8791"}, - {file = "ragstack_ai_colbert-1.0.5.tar.gz", hash = "sha256:7a8fdf009c0445cac8efc550179bc5626471863a2f9628848159ccf86d873729"}, + {file = "ragstack_ai_colbert-1.0.6-py3-none-any.whl", hash = "sha256:0ac469d0cfcfb6215d6bff6a96beb1c0754accb9ab9d03bdb0a1cd06a74dc50c"}, + {file = "ragstack_ai_colbert-1.0.6.tar.gz", hash = "sha256:1551815047d3570074611da30bda0e88f68ec598b81c5fb5ea2fc6afaa59603e"}, ] [package.dependencies] @@ -3831,6 +3831,7 @@ cassio = ">=0.1.7,<0.2.0" colbert-ai = "0.2.19" pyarrow = "14.0.1" pydantic = ">=2.7.1,<3.0.0" +setuptools = {version = ">=70", markers = "python_version >= \"3.12\""} torch = "2.2.1" [[package]] @@ -6030,4 +6031,4 @@ multidict = ">=4.0" [metadata] lock-version = "2.0" python-versions = ">=3.10,<3.13" -content-hash = "62fea92af7de41cad9955d90cd7d85770be28c2d8c6e1af4cd5ca45f65bececa" +content-hash = "f2ed3737b3633a7642bba052abc99ffb88e199ea32b7bc445a57829065a8cdd9" diff --git a/libs/ragulate/pyproject.toml b/libs/ragulate/pyproject.toml index ae22727fe..5058fd3cb 100644 --- a/libs/ragulate/pyproject.toml +++ b/libs/ragulate/pyproject.toml @@ -42,7 +42,7 @@ types-seaborn = "^0.13.2" types-setuptools = "^70.0.0" types-tqdm = ">=4.66.0" pandas-stubs = ">=2.2.2" -ragstack-ai-colbert = "^1.0.5" +ragstack-ai-colbert = "^1.0.6" ragstack-ai-langchain = "^1.4.0" [build-system] @@ -62,6 +62,5 @@ show_error_codes = true show_error_context = true [[tool.mypy.overrides]] -# TODO: remove ragstack exclusions once packages containing py.typed are published -module = "trulens_eval.*,plotly.*,cerberus.*,transformers.*,ragstack_colbert.*,ragstack_langchain.*" +module = "trulens_eval.*,plotly.*,cerberus.*,transformers.*" ignore_missing_imports = true