From 10e2929d55522dc04d4b7c351ea6bcdab81fc017 Mon Sep 17 00:00:00 2001 From: frayle-ons <194791647+frayle-ons@users.noreply.github.com> Date: Thu, 5 Feb 2026 12:51:35 +0000 Subject: [PATCH 1/3] removed polars methods that required pyarrow dependency --- src/classifai/indexers/main.py | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/src/classifai/indexers/main.py b/src/classifai/indexers/main.py index d35dc2c..99d9495 100644 --- a/src/classifai/indexers/main.py +++ b/src/classifai/indexers/main.py @@ -318,7 +318,9 @@ def reverse_search(self, query: VectorStoreReverseSearchInput, n_results=100) -> ) from e # polars conversion - paired_query = pl.DataFrame({"id": query.id, "doc_id": query.doc_id}) + paired_query = pl.DataFrame( + {"id": query.id.astype(str).to_list(), "doc_id": query.doc_id.astype(str).to_list()} + ) # join query with vdb to get matches joined_table = paired_query.join(self.vectors.rename({"id": "doc_id"}), on="doc_id", how="inner") @@ -333,7 +335,7 @@ def reverse_search(self, query: VectorStoreReverseSearchInput, n_results=100) -> ] ) - result_df = VectorStoreReverseSearchOutput.from_data(final_table.to_pandas()) + result_df = VectorStoreReverseSearchOutput.from_data(final_table.to_dict(as_series=False)) # Check if there is a user defined postprocess hook for the VectorStore reverse search method if "reverse_search_postprocess" in self.hooks: @@ -444,9 +446,9 @@ def search(self, query: VectorStoreSearchInput, n_results=10, batch_size=8) -> V *self.meta_data.keys(), ] ) - # Now that polars has been used for processing convert back to pandas for user familiarity - result_df = VectorStoreSearchOutput.from_data(reordered_df.to_pandas()) + # Specify the 'use_pyarrow=False' option to avoid using pyarrow for conversion + result_df = VectorStoreSearchOutput.from_data(reordered_df.to_dict(as_series=False)) # Check if there is a user defined postprocess hook for the VectorStore search method if "search_postprocess" in self.hooks: From 498992306e8be3009dee367c2b20cb11aa98a891 Mon Sep 17 00:00:00 2001 From: frayle-ons <194791647+frayle-ons@users.noreply.github.com> Date: Thu, 5 Feb 2026 13:59:39 +0000 Subject: [PATCH 2/3] added google-genai name map to toml file for deptry and uv lock version bump --- pyproject.toml | 4 ++++ uv.lock | 2 +- 2 files changed, 5 insertions(+), 1 deletion(-) diff --git a/pyproject.toml b/pyproject.toml index 62f7016..9372b73 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -37,6 +37,10 @@ namespaces = false [tool.setuptools.package-data] classifai = [] +[tool.deptry.package_module_name_map] +ollama = "ollama" +google-genai = "google" + [project.optional-dependencies] huggingface = [ "transformers>=4.52.4", diff --git a/uv.lock b/uv.lock index 8082439..758d0b8 100644 --- a/uv.lock +++ b/uv.lock @@ -302,7 +302,7 @@ wheels = [ [[package]] name = "classifai" -version = "0.1.0" +version = "0.2.0" source = { editable = "." } dependencies = [ { name = "fastapi", extra = ["standard"] }, From ddced8e4a7999f72857d10866357c71735fffb21 Mon Sep 17 00:00:00 2001 From: frayle-ons <194791647+frayle-ons@users.noreply.github.com> Date: Thu, 5 Feb 2026 14:59:21 +0000 Subject: [PATCH 3/3] code cleanup --- src/classifai/indexers/main.py | 1 - 1 file changed, 1 deletion(-) diff --git a/src/classifai/indexers/main.py b/src/classifai/indexers/main.py index 99d9495..ced1e25 100644 --- a/src/classifai/indexers/main.py +++ b/src/classifai/indexers/main.py @@ -447,7 +447,6 @@ def search(self, query: VectorStoreSearchInput, n_results=10, batch_size=8) -> V ] ) # Now that polars has been used for processing convert back to pandas for user familiarity - # Specify the 'use_pyarrow=False' option to avoid using pyarrow for conversion result_df = VectorStoreSearchOutput.from_data(reordered_df.to_dict(as_series=False)) # Check if there is a user defined postprocess hook for the VectorStore search method