
Add numpy 2 support #434

Merged: 11 commits, Oct 17, 2024
2 changes: 1 addition & 1 deletion .pre-commit-config.yaml
@@ -15,7 +15,7 @@ repos:
- id: prettier

- repo: https://github.com/charliermarsh/ruff-pre-commit
-    rev: "v0.0.265"
+    rev: "v0.4.4"
hooks:
- id: ruff
args: [--fix, --exit-non-zero-on-fix]
10 changes: 5 additions & 5 deletions apis/python/src/tiledb/vector_search/ingestion.py
@@ -401,13 +401,13 @@ def read_source_metadata(
) -> Tuple[int, int, np.dtype]:
if source_type == "TILEDB_ARRAY":
schema = tiledb.ArraySchema.load(source_uri)
-        size = schema.domain.dim(1).domain[1] + 1
-        dimensions = schema.domain.dim(0).domain[1] + 1
+        size = np.int64(schema.domain.dim(1).domain[1]) + 1
+        dimensions = np.int64(schema.domain.dim(0).domain[1]) + 1
Comment on lines +414 to +415
@jparismorgan (Collaborator, Author) commented on Jul 12, 2024:


We make this change because of NumPy 2's changes to data type promotion.

With numpy 1 and the original code we were getting:

[ingestion@read_source_metadata] schema.domain.dim(1).domain[1]: 2147483647 <class 'numpy.int32'>
[ingestion@read_source_metadata] size: 2147483648 <class 'numpy.int64'>
[ingestion@read_source_metadata] dimensions: 3 <class 'numpy.int64'>

With numpy 2 and the original code we instead were getting:

[ingestion@read_source_metadata] schema.domain.dim(1).domain[1]: 2147483647 <class 'numpy.int32'>
[ingestion@read_source_metadata] size: -2147483648 <class 'numpy.int32'>
[ingestion@read_source_metadata] dimensions: 3 <class 'numpy.int32'>

This is because in `size = schema.domain.dim(1).domain[1] + 1`, the `+ 1` used to promote the result to int64, which is required here since 2147483647 is the int32 maximum.

As mentioned in https://numpy.org/devdocs/numpy_2_0_migration_guide.html#changes-to-numpy-data-type-promotion, numpy no longer casts automatically:

[screenshot: NumPy 2.0 migration guide excerpt on data type promotion changes]

So here we explicitly cast to int64 so that we return the same value as we did before.
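The difference can be reproduced with a small standalone sketch (this is not the ingestion code itself; the value is simply int32 max, the dtype TileDB reports for this dimension's domain bound):

```python
import numpy as np

# int32 max, matching the domain bound logged above.
bound = np.int32(2147483647)

# Under NumPy 1's value-based promotion, `bound + 1` widened to int64.
# Under NumPy 2 (NEP 50), `bound + 1` keeps int32 and wraps to -2147483648.
# Casting first makes the result identical on both versions:
size = np.int64(bound) + 1

print(size, type(size))  # 2147483648 <class 'numpy.int64'>
```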

return size, dimensions, schema.attr(0).dtype
if source_type == "TILEDB_SPARSE_ARRAY":
schema = tiledb.ArraySchema.load(source_uri)
size = schema.domain.dim(0).domain[1] + 1
dimensions = schema.domain.dim(1).domain[1] + 1
size = np.int64(schema.domain.dim(0).domain[1]) + 1
dimensions = np.int64(schema.domain.dim(1).domain[1]) + 1
return size, dimensions, schema.attr(0).dtype
if source_type == "TILEDB_PARTITIONED_ARRAY":
with tiledb.open(source_uri, "r", config=config) as source_array:
@@ -2016,7 +2016,7 @@ def consolidate_partition_udf(
prev_index = partial_indexes[0]
i = 0
for partial_index in partial_indexes[1:]:
-            s = slice(int(prev_index), int(partial_index - 1))
+            s = slice(int(prev_index), int(partial_index) - 1)
@jparismorgan (Collaborator, Author):

This change is also due to NumPy 2's new promotion rules: subtracting a Python int from a uint64 scalar now stays uint64 instead of promoting, so it can wrap around.

With numpy 1 and the original code we were getting:

[ingestion@consolidate_partition_udf] partial_indexes [  0   0   1   1   5   6  14  14  14  18  23  28  42  44  44  44  50  55
  58  60  61  61  61  66  66  81  81  84  84  86  91  94 101 108 110 114
 118 125 126 127 127 127 135 135 141 142 143 143 149 154 157 161 178 191
 200 201 209 214 214 230 233 236 240 242 243 248 257 257 275 276 278 282
 283 290 290 291 298 316 324 324 332 335 335 343 343 347 350 353 356 373
 374 379 382 391 391 391 398 399 405 412 421] <class 'numpy.ndarray'> uint64
[ingestion@consolidate_partition_udf] prev_index 0 <class 'numpy.uint64'>
[ingestion@consolidate_partition_udf] partial_index 0 <class 'numpy.uint64'>
[ingestion@consolidate_partition_udf] s slice(0, -1, None) <class 'slice'>

With numpy 2 and the original code we were getting:

[ingestion@consolidate_partition_udf] partial_indexes [  0   0   1   1   5   6  14  14  14  18  23  28  42  44  44  44  50  55
  58  60  61  61  61  66  66  81  81  84  84  86  91  94 101 108 110 114
 118 125 126 127 127 127 135 135 141 142 143 143 149 154 157 161 178 191
 200 201 209 214 214 230 233 236 240 242 243 248 257 257 275 276 278 282
 283 290 290 291 298 316 324 324 332 335 335 343 343 347 350 353 356 373
 374 379 382 391 391 391 398 399 405 412 421] <class 'numpy.ndarray'> uint64
[ingestion@consolidate_partition_udf] prev_index 0 <class 'numpy.uint64'>
[ingestion@consolidate_partition_udf] partial_index 0 <class 'numpy.uint64'>
[ingestion@consolidate_partition_udf] s slice(0, 18446744073709551615, None) <class 'slice'>

Notice that we get slice(0, 18446744073709551615, None) instead of slice(0, -1, None): `np.uint64(0) - 1` now wraps around to uint64 max. To fix this we cast to a Python int before subtracting, which we do here.
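A minimal standalone sketch of the wrap-around and the fix (using hypothetical index values of 0, as in the logs above):

```python
import numpy as np

prev_index = np.uint64(0)
partial_index = np.uint64(0)

# Broken under NumPy 2: `partial_index - 1` stays uint64 and wraps to
# 2**64 - 1, so the slice stop becomes 18446744073709551615 instead of -1.
# Fixed: convert to a plain Python int *before* subtracting.
s = slice(int(prev_index), int(partial_index) - 1)

print(s)  # slice(0, -1, None)
```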

if (
s.start <= s.stop
and s.start != np.iinfo(np.dtype("uint64")).max
15 changes: 12 additions & 3 deletions pyproject.toml
@@ -17,12 +17,14 @@ classifiers = [
"Programming Language :: Python :: 3.11",
]

# These are the runtime dependencies.
dependencies = [
-    "tiledb-cloud>=0.11",
+    "tiledb-cloud>=0.12.15",
"tiledb>=0.30.2",
"typing-extensions", # for tiledb-cloud indirect, x-ref https://github.com/TileDB-Inc/TileDB-Cloud-Py/pull/428
# scikit-learn>=1.4.2 may be needed?
"scikit-learn",
-    "numpy<2.0.0",
+    "numpy>=1.25.0",
]

[project.optional-dependencies]
@@ -34,8 +36,10 @@ benchmarks = ["boto3", "paramiko"]
homepage = "https://tiledb.com"
repository = "https://github.com/TileDB-Inc/tiledb-vector-search"

# These are the build-time dependencies.
[build-system]
-requires = ["scikit-build-core[pyproject]", "pybind11", "setuptools-scm"]
+# pybind11>=2.12 may be needed?
+requires = ["scikit-build-core[pyproject]", "pybind11", "setuptools-scm", "numpy>=2.0.0"]
build-backend = "scikit_build_core.build"

[tool.scikit-build]
@@ -65,10 +69,15 @@ TILEDB_PATH = {env="TILEDB_PATH"}
[tool.setuptools_scm]
version_file = "apis/python/src/tiledb/vector_search/version.py"

[tool.ruff.lint]
select = ["NPY201"]

[tool.ruff]
extend-select = ["I"]
ignore = ["F403", "F405", "E501", "E741"]
exclude = [".ipynb"]
# Numpy 2 rule: https://numpy.org/devdocs/numpy_2_0_migration_guide.html#ruff-plugin
# select = ["NPY201"]

[tool.ruff.isort]
known-first-party = ["tiledb"]