Reverted page-range granularity in RNTuple reads (clusters are always read in full)

ariostas · ariostas · commit 62aaa7d48e14 · 2025-10-02T17:02:15.000-04:00
diff --git a/src/uproot/behaviors/RNTuple.py b/src/uproot/behaviors/RNTuple.py
@@ -754,7 +754,6 @@ def arrays(
 
         for key in target_cols:
             if "column" in key and "union" not in key:
-                # TODO: Need some logic to find the start and stop pages
                 key_nr = int(key.split("-")[1])
                 # Find how many elements should be padded at the beginning
                 n_padding = self.ntuple.column_records[key_nr].first_element_index
@@ -763,7 +762,8 @@ def arrays(
                 if interpreter == "cpu":
                     content = self.ntuple.read_cluster_range(
                         key_nr,
-                        range(start_cluster_idx, stop_cluster_idx),
+                        start_cluster_idx,
+                        stop_cluster_idx,
                         missing_element_padding=n_padding,
                         array_cache=array_cache,
                     )
diff --git a/src/uproot/models/RNTuple.py b/src/uproot/models/RNTuple.py
@@ -662,53 +662,42 @@ def read_page(
     def read_cluster_range(
         self,
         col_idx,
-        cluster_range,
+        cluster_start,
+        cluster_stop,
         missing_element_padding=0,
-        first_cluster_page_start=None,
-        last_cluster_page_stop=None,
         array_cache=None,
     ):
         """
         Args:
-            ncol (int): The column id.
-            cluster_range (range): The range of cluster indices.
+            col_idx (int): The column index.
+            cluster_start (int): The first cluster to include.
+            cluster_stop (int): The first cluster to exclude (i.e. one greater than the last cluster to include).
             missing_element_padding (int): Number of padding elements to add at the start of the array.
-            first_cluster_page_start (None or int): The first page of the first cluster to include. If None, start from the beginning.
-                If negative, count from the end, like a Python slice.
-            last_cluster_page_stop (None or int): The first page of the last cluster to exclude (i.e. one greater
-                than the last page to include). If None, stop at the end. If negative,
-                count from the end, like a Python slice.
             array_cache (None, or MutableMapping): Cache of arrays. If None, do not use a cache.
 
         Returns a numpy array with the data from the column.
         """
         field_metadata = self.get_field_metadata(col_idx)
         arrays = [
-            self.read_page_range(
+            self.read_pages(
                 cluster_idx,
                 col_idx,
                 field_metadata,
-                page_start=first_cluster_page_start if i == 0 else None,
-                page_stop=(
-                    last_cluster_page_stop if i == len(cluster_range) - 1 else None
-                ),
                 array_cache=array_cache,
             )
-            for i, cluster_idx in enumerate(cluster_range)
+            for cluster_idx in range(cluster_start, cluster_stop)
         ]
         res = self.combine_cluster_arrays(
             arrays, field_metadata, missing_element_padding
         )
 
         return res
 
-    def read_page_range(
+    def read_pages(
         self,
         cluster_idx,
         col_idx,
         field_metadata,
-        page_start=None,
-        page_stop=None,
         array_cache=None,
     ):
         """
@@ -717,9 +706,6 @@ def read_page_range(
             col_idx (int): The column index.
             field_metadata (:doc:`uproot.models.RNTuple.FieldClusterMetadata`):
                 The metadata needed to read the field's pages.
-            page_start (None or int): The first page to include. If None, start from the beginning.
-            page_stop (None or int): The first page to exclude (i.e. one greater
-                than the last page to include). If None, stop at the end.
             array_cache (None or MutableMapping): Cache of arrays. If None, do not use a cache.
 
         Returns a numpy array with the data from the column.
@@ -733,7 +719,7 @@ def read_page_range(
                 col_idx
             )  # Update metadata if suppressed
         pagelist = (
-            linklist[field_metadata.ncol].pages[page_start:page_stop]
+            linklist[field_metadata.ncol].pages
             if field_metadata.ncol < len(linklist)
             else []
         )
@@ -742,9 +728,7 @@ def read_page_range(
 
         tracker = 0
         cumsum = 0
-        for page_idx, page_desc in enumerate(
-            pagelist, start=page_start if page_start is not None else 0
-        ):
+        for page_idx, page_desc in enumerate(pagelist):
             n_elements = page_desc.num_elements
             tracker_end = tracker + n_elements
             self.read_page(
diff --git a/tests/test_1191_rntuple_fixes.py b/tests/test_1191_rntuple_fixes.py
@@ -59,7 +59,7 @@ def test_multiple_page_delta_encoding():
     with uproot.open(filename) as f:
         obj = f["ntuple"]
         field_metadata = obj.get_field_metadata(0)
-        data = obj.read_page_range(0, 0, field_metadata)
+        data = obj.read_pages(0, 0, field_metadata)
         # first page has 64 elements, so this checks that data was stitched together correctly
         assert data[64] - data[63] == 2