Skip to content

Commit 30b478d

Browse files
authoredMar 26, 2025··
Fix: Consider index passed, even if the current domain is present (#2178)
1 parent 25afe8a commit 30b478d

File tree

3 files changed

+75
-39
lines changed

3 files changed

+75
-39
lines changed
 

‎tiledb/array.py

+10-15
Original file line numberDiff line numberDiff line change
@@ -128,21 +128,6 @@ def index_domain_subarray(array, dom, idx: tuple):
128128

129129
subarray = list()
130130

131-
# In the case that current domain is non-empty, we need to consider it
132-
if (
133-
hasattr(array.schema, "current_domain")
134-
and not array.schema.current_domain.is_empty
135-
):
136-
for i in range(array.schema.domain.ndim):
137-
subarray.append(
138-
(
139-
array.schema.current_domain.ndrectangle.range(i)[0],
140-
array.schema.current_domain.ndrectangle.range(i)[1],
141-
)
142-
)
143-
144-
return subarray
145-
146131
for r in range(ndim):
147132
# extract lower and upper bounds for domain dimension extent
148133
dim = dom.dim(r)
@@ -163,6 +148,16 @@ def index_domain_subarray(array, dom, idx: tuple):
163148

164149
start, stop, step = dim_slice.start, dim_slice.stop, dim_slice.step
165150

151+
# In the case that current domain is non-empty, we need to consider it
152+
if (
153+
hasattr(array.schema, "current_domain")
154+
and not array.schema.current_domain.is_empty
155+
):
156+
if start is None:
157+
dim_lb = array.schema.current_domain.ndrectangle.range(r)[0]
158+
if stop is None:
159+
dim_ub = array.schema.current_domain.ndrectangle.range(r)[1]
160+
166161
if np.issubdtype(dim_dtype, np.str_) or np.issubdtype(dim_dtype, np.bytes_):
167162
if start is None or stop is None:
168163
if start is None:

‎tiledb/multirange_indexing.py

+43-23
Original file line numberDiff line numberDiff line change
@@ -129,18 +129,31 @@ def iter_ranges(
129129
sel: Union[Scalar, slice, Range, List[Scalar], np.ndarray, "pyarrow.Array"],
130130
sparse: bool,
131131
nonempty_domain: Optional[Range] = None,
132+
current_domain: Optional[Range] = None,
132133
) -> Iterator[Range]:
133134
if isinstance(sel, slice):
134135
if sel.step is not None:
135136
raise ValueError("Stepped slice ranges are not supported")
136137

138+
# we always want to be inside the current domain, if this is passed,
139+
# but we also don't want to fall out of the nonempty domain
137140
rstart = sel.start
138-
if rstart is None and nonempty_domain:
139-
rstart = nonempty_domain[0]
141+
if rstart is None:
142+
if current_domain and nonempty_domain:
143+
rstart = max(current_domain[0], nonempty_domain[0])
144+
elif current_domain:
145+
rstart = current_domain[0]
146+
elif nonempty_domain:
147+
rstart = nonempty_domain[0]
140148

141149
rend = sel.stop
142-
if rend is None and nonempty_domain:
143-
rend = nonempty_domain[1]
150+
if rend is None:
151+
if current_domain and nonempty_domain:
152+
rend = min(current_domain[1], nonempty_domain[1])
153+
elif current_domain:
154+
rend = current_domain[1]
155+
elif nonempty_domain:
156+
rend = nonempty_domain[1]
144157

145158
if sparse and sel.start is None and sel.stop is None:
146159
# don't set nonempty_domain for full-domain slices w/ sparse
@@ -188,11 +201,13 @@ def iter_label_range(sel: Union[Scalar, slice, Range, List[Scalar]]):
188201
yield scalar, scalar
189202

190203

191-
def dim_ranges_from_selection(selection, nonempty_domain, is_sparse):
204+
def dim_ranges_from_selection(selection, nonempty_domain, current_domain, is_sparse):
192205
# don't try to index nonempty_domain if None
193206
selection = selection if isinstance(selection, list) else [selection]
194207
return tuple(
195-
rng for sel in selection for rng in iter_ranges(sel, is_sparse, nonempty_domain)
208+
rng
209+
for sel in selection
210+
for rng in iter_ranges(sel, is_sparse, nonempty_domain, current_domain)
196211
)
197212

198213

@@ -206,27 +221,23 @@ def label_ranges_from_selection(selection):
206221
def getitem_ranges(array: Array, idx: Any) -> Sequence[Sequence[Range]]:
207222
ranges: List[Sequence[Range]] = [()] * array.schema.domain.ndim
208223

209-
# In the case that current domain is non-empty, we need to consider it
210-
if (
211-
hasattr(array.schema, "current_domain")
212-
and not array.schema.current_domain.is_empty
213-
):
214-
for i in range(array.schema.domain.ndim):
215-
ranges[i] = [
216-
(
217-
array.schema.current_domain.ndrectangle.range(i)[0],
218-
array.schema.current_domain.ndrectangle.range(i)[1],
219-
)
220-
]
221-
222-
return tuple(ranges)
223-
224224
ned = array.nonempty_domain()
225+
current_domain = (
226+
array.schema.current_domain
227+
if hasattr(array.schema, "current_domain")
228+
and not array.schema.current_domain.is_empty
229+
else None
230+
)
225231
if ned is None:
226232
ned = [None] * array.schema.domain.ndim
227233
is_sparse = array.schema.sparse
228234
for i, dim_sel in enumerate([idx] if not isinstance(idx, tuple) else idx):
229-
ranges[i] = dim_ranges_from_selection(dim_sel, ned[i], is_sparse)
235+
ranges[i] = dim_ranges_from_selection(
236+
dim_sel,
237+
ned[i],
238+
current_domain.ndrectangle.range(i) if current_domain else None,
239+
is_sparse,
240+
)
230241
return tuple(ranges)
231242

232243

@@ -236,6 +247,12 @@ def getitem_ranges_with_labels(
236247
dim_ranges: List[Sequence[Range]] = [()] * array.schema.domain.ndim
237248
label_ranges: Dict[str, Sequence[Range]] = {}
238249
ned = array.nonempty_domain()
250+
current_domain = (
251+
array.schema.current_domain
252+
if hasattr(array.schema, "current_domain")
253+
and not array.schema.current_domain.is_empty
254+
else None
255+
)
239256
if ned is None:
240257
ned = [None] * array.schema.domain.ndim
241258
is_sparse = array.schema.sparse
@@ -244,7 +261,10 @@ def getitem_ranges_with_labels(
244261
label_ranges[labels[dim_idx]] = label_ranges_from_selection(dim_sel)
245262
else:
246263
dim_ranges[dim_idx] = dim_ranges_from_selection(
247-
dim_sel, ned[dim_idx], is_sparse
264+
dim_sel,
265+
ned[dim_idx],
266+
current_domain.ndrectangle.range(dim_idx) if current_domain else None,
267+
is_sparse,
248268
)
249269
return dim_ranges, label_ranges
250270

‎tiledb/tests/test_current_domain.py

+22-1
Original file line numberDiff line numberDiff line change
@@ -304,7 +304,28 @@ def test_take_current_domain_into_account_dense_indexing_sc61914(self):
304304
)
305305

306306
assert_array_equal(A, expected_array)
307-
assert_array_equal(A.df[:], expected_df)
307+
assert_array_equal(A.df[:, :], expected_df)
308+
309+
# check indexing the array inside the range of the current domain
310+
assert_array_equal(A[11:14, 33:35]["a"], expected_array[1:4, 3:5])
311+
filtered_df = expected_df.query(
312+
"d1 >= 11 and d1 <= 14 and d2 >= 33 and d2 <= 35"
313+
).reset_index(drop=True)
314+
assert_array_equal(A.df[11:14, 33:35], filtered_df)
315+
316+
# check only one side of the range
317+
assert_array_equal(A[11:, :35]["a"], expected_array[1:, :5])
318+
filtered_df = expected_df.query("d1 >= 11 and d2 <= 35").reset_index(
319+
drop=True
320+
)
321+
assert_array_equal(A.df[11:, :35], filtered_df)
322+
323+
# check indexing the array outside the range of the current domain - should raise an error
324+
with self.assertRaises(tiledb.TileDBError):
325+
A[11:55, 33:34]
326+
327+
with self.assertRaises(tiledb.TileDBError):
328+
A.df[11:55, 33:34]
308329

309330
def test_take_current_domain_into_account_sparse_indexing_sc61914(self):
310331
uri = self.path("test_sc61914")

0 commit comments

Comments
 (0)
Please sign in to comment.