From 91f3640e784efe84c579373a7e551ac376c00d95 Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Wed, 3 Jun 2026 13:43:36 -0500
Subject: [PATCH 01/11] feat: add PaginationList for lazy page fetching in
 catalog list operations

Implements a PaginationList[T] class (pyiceberg/utils/pagination.py) that
extends list and lazily fetches subsequent pages from a paginated REST
endpoint only as the caller iterates past items already in memory.

Design:
- First page is pre-loaded on construction; the list is immediately usable
  for callers that only inspect the first page or stop iteration early.
- __iter__ advances through in-memory items and triggers a new HTTP fetch
  only when the iterator would otherwise block on an empty buffer.
- Operations requiring the full result set (__len__, __contains__, __eq__,
  slicing, repr, negative indexing) call _fetch_all() before delegating to
  the underlying list implementation.
- Positive-index __getitem__ calls _fetch_through_index() to fetch only as
  many pages as needed to satisfy the access.
- Subclasses list[T], so isinstance(result, list) remains True and all
  existing call sites that iterate, compare, or extend the return value
  continue to work without changes.

REST catalog integration:
- list_tables, list_views, and list_namespaces in RestCatalog now return
  a PaginationList instead of eagerly collecting all pages in a while loop.
- Each method defines a _fetch_page closure capturing the session, URL and
  params, matching the (items, next_token | None) callback contract.

Tests:
- tests/utils/test_pagination.py: 14 unit tests covering single-page and
  multi-page scenarios, lazy iteration, partial consumption, __len__,
  __contains__, __eq__, slicing, negative indexing, and repr.
- tests/catalog/test_rest.py: adds test_list_tables_returns_pagination_list
  which verifies that iterating only the first two items does not trigger
  the second HTTP request (call_count == 1), and that consuming all items
  triggers exactly one additional request (call_count == 2).

Closes #3365
---
 pyiceberg/catalog/rest/__init__.py |  81 ++++++------
 pyiceberg/utils/pagination.py      | 130 +++++++++++++++++++
 tests/catalog/test_rest.py         |  54 ++++++++
 tests/utils/test_pagination.py     | 192 +++++++++++++++++++++++++++++
 4 files changed, 413 insertions(+), 44 deletions(-)
 create mode 100644 pyiceberg/utils/pagination.py
 create mode 100644 tests/utils/test_pagination.py

diff --git a/pyiceberg/catalog/rest/__init__.py b/pyiceberg/catalog/rest/__init__.py
index d085c6fd87..81c479b674 100644
--- a/pyiceberg/catalog/rest/__init__.py
+++ b/pyiceberg/catalog/rest/__init__.py
@@ -89,6 +89,7 @@
 from pyiceberg.typedef import EMPTY_DICT, UTF8, IcebergBaseModel, Identifier, Properties
 from pyiceberg.types import transform_dict_value_to_str
 from pyiceberg.utils.deprecated import deprecation_message
+from pyiceberg.utils.pagination import PaginationList
 from pyiceberg.utils.properties import get_first_property_value, get_header_properties, property_as_bool, property_as_int
 from pyiceberg.view import View
 from pyiceberg.view.metadata import ViewMetadata, ViewVersion
@@ -1051,26 +1052,24 @@ def list_tables(self, namespace: str | Identifier) -> list[Identifier]:
                 raise ValueError(f"{PAGE_SIZE} must be a positive integer")
             params["pageSize"] = str(page_size)
 
-        tables: list[Identifier] = []
-        page_token: str | None = None
-
-        while True:
-            if page_token:
-                params["pageToken"] = page_token
+        def _fetch_page(page_token: str) -> tuple[list[Identifier], str | None]:
+            params["pageToken"] = page_token
             response = self._session.get(url, params=params)
             try:
                 response.raise_for_status()
             except HTTPError as exc:
                 _handle_non_200_response(exc, {404: NoSuchNamespaceError})
-
             parsed = ListTablesResponse.model_validate_json(response.text)
-            tables.extend([(*table.namespace, table.name) for table in parsed.identifiers])
-
-            if not parsed.next_page_token:
-                break
-            page_token = parsed.next_page_token
+            return [(*t.namespace, t.name) for t in parsed.identifiers], parsed.next_page_token
 
-        return tables
+        response = self._session.get(url, params=params)
+        try:
+            response.raise_for_status()
+        except HTTPError as exc:
+            _handle_non_200_response(exc, {404: NoSuchNamespaceError})
+        parsed = ListTablesResponse.model_validate_json(response.text)
+        first_page: list[Identifier] = [(*t.namespace, t.name) for t in parsed.identifiers]
+        return PaginationList(first_page, parsed.next_page_token, _fetch_page)
 
     @retry(**_RETRY_ARGS)
     @override
@@ -1165,27 +1164,24 @@ def list_views(self, namespace: str | Identifier) -> list[Identifier]:
                 raise ValueError(f"{PAGE_SIZE} must be a positive integer")
             params["pageSize"] = str(page_size)
 
-        views: list[Identifier] = []
-        page_token: str | None = None
-
-        while True:
-            if page_token:
-                params["pageToken"] = page_token
-
+        def _fetch_page(page_token: str) -> tuple[list[Identifier], str | None]:
+            params["pageToken"] = page_token
             response = self._session.get(url, params=params)
             try:
                 response.raise_for_status()
             except HTTPError as exc:
                 _handle_non_200_response(exc, {404: NoSuchNamespaceError})
-
             parsed = ListViewsResponse.model_validate_json(response.text)
-            views.extend([(*view.namespace, view.name) for view in parsed.identifiers])
-
-            if not parsed.next_page_token:
-                break
-            page_token = parsed.next_page_token
+            return [(*v.namespace, v.name) for v in parsed.identifiers], parsed.next_page_token
 
-        return views
+        response = self._session.get(url, params=params)
+        try:
+            response.raise_for_status()
+        except HTTPError as exc:
+            _handle_non_200_response(exc, {404: NoSuchNamespaceError})
+        parsed = ListViewsResponse.model_validate_json(response.text)
+        first_page: list[Identifier] = [(*v.namespace, v.name) for v in parsed.identifiers]
+        return PaginationList(first_page, parsed.next_page_token, _fetch_page)
 
     @retry(**_RETRY_ARGS)
     @override
@@ -1279,6 +1275,7 @@ def drop_namespace(self, namespace: str | Identifier) -> None:
     def list_namespaces(self, namespace: str | Identifier = ()) -> list[Identifier]:
         self._check_endpoint(Capability.V1_LIST_NAMESPACES)
         namespace_tuple = self.identifier_to_tuple(namespace)
+        namespaces_url = self.url(Endpoints.list_namespaces)
 
         params: dict[str, str] = {}
         page_size = property_as_int(self.properties, PAGE_SIZE, None)
@@ -1286,30 +1283,26 @@ def list_namespaces(self, namespace: str | Identifier = ()) -> list[Identifier]:
             if page_size <= 0:
                 raise ValueError(f"{PAGE_SIZE} must be a positive integer")
             params["pageSize"] = str(page_size)
+        if namespace_tuple:
+            params["parent"] = self._encode_namespace_path(namespace_tuple)
 
-        namespaces: list[Identifier] = []
-        page_token: str | None = None
-
-        while True:
-            if namespace_tuple:
-                params["parent"] = self._encode_namespace_path(namespace_tuple)
-            if page_token:
-                params["pageToken"] = page_token
-            response = self._session.get(self.url(Endpoints.list_namespaces), params=params)
-
+        def _fetch_page(page_token: str) -> tuple[list[Identifier], str | None]:
+            params["pageToken"] = page_token
+            response = self._session.get(namespaces_url, params=params)
             try:
                 response.raise_for_status()
             except HTTPError as exc:
                 _handle_non_200_response(exc, {404: NoSuchNamespaceError})
-
             parsed = ListNamespaceResponse.model_validate_json(response.text)
-            namespaces.extend(parsed.namespaces)
+            return list(parsed.namespaces), parsed.next_page_token
 
-            if not parsed.next_page_token:
-                break
-            page_token = parsed.next_page_token
-
-        return namespaces
+        response = self._session.get(namespaces_url, params=params)
+        try:
+            response.raise_for_status()
+        except HTTPError as exc:
+            _handle_non_200_response(exc, {404: NoSuchNamespaceError})
+        parsed = ListNamespaceResponse.model_validate_json(response.text)
+        return PaginationList(list(parsed.namespaces), parsed.next_page_token, _fetch_page)
 
     @retry(**_RETRY_ARGS)
     @override
diff --git a/pyiceberg/utils/pagination.py b/pyiceberg/utils/pagination.py
new file mode 100644
index 0000000000..8c36888028
--- /dev/null
+++ b/pyiceberg/utils/pagination.py
@@ -0,0 +1,130 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Lazy-loading pagination utilities."""
+
+from __future__ import annotations
+
+from collections.abc import Callable, Iterator
+from typing import Generic, TypeVar, overload
+
+T = TypeVar("T")
+
+
+class PaginationList(list, Generic[T]):
+    """A list that lazily fetches subsequent pages from a paginated API.
+
+    The first page is pre-loaded on construction.  Subsequent pages are only
+    fetched when the caller iterates past items already in memory.  Operations
+    that require the complete result set — ``len()``, ``in``, slicing,
+    ``repr()`` — trigger a full fetch of all remaining pages.
+
+    Args:
+        first_page: Items from the first API response.
+        next_page_token: Pagination token returned with the first response,
+            or ``None`` if no further pages exist.
+        fetch_next_page: Callable that accepts a page token and returns a
+            tuple of ``(items, next_page_token_or_None)``.
+    """
+
+    def __init__(
+        self,
+        first_page: list[T],
+        next_page_token: str | None,
+        fetch_next_page: Callable[[str], tuple[list[T], str | None]],
+    ) -> None:
+        super().__init__(first_page)
+        self._next_page_token = next_page_token
+        self._fetch_next_page = fetch_next_page
+
+    # ------------------------------------------------------------------
+    # Internal helpers — use list's own methods to avoid infinite loops.
+    # ------------------------------------------------------------------
+
+    def _fetch_all(self) -> None:
+        """Fetch all remaining pages into the list."""
+        while self._next_page_token:
+            items, self._next_page_token = self._fetch_next_page(self._next_page_token)
+            list.extend(self, items)
+
+    def _fetch_through_index(self, idx: int) -> None:
+        """Fetch pages until the list contains at least *idx + 1* items."""
+        while list.__len__(self) <= idx and self._next_page_token:
+            items, self._next_page_token = self._fetch_next_page(self._next_page_token)
+            list.extend(self, items)
+
+    # ------------------------------------------------------------------
+    # Lazy iteration
+    # ------------------------------------------------------------------
+
+    def __iter__(self) -> Iterator[T]:
+        """Iterate lazily, fetching pages only as the caller advances."""
+        idx = 0
+        while True:
+            if idx < list.__len__(self):
+                yield list.__getitem__(self, idx)
+                idx += 1
+            elif self._next_page_token:
+                items, self._next_page_token = self._fetch_next_page(self._next_page_token)
+                list.extend(self, items)
+            else:
+                return
+
+    # ------------------------------------------------------------------
+    # Operations that require the complete result set
+    # ------------------------------------------------------------------
+
+    def __len__(self) -> int:
+        self._fetch_all()
+        return list.__len__(self)
+
+    def __contains__(self, item: object) -> bool:
+        self._fetch_all()
+        return list.__contains__(self, item)
+
+    def __repr__(self) -> str:
+        self._fetch_all()
+        return f"PaginationList({list.__repr__(self)})"
+
+    # ------------------------------------------------------------------
+    # Index / slice access
+    # ------------------------------------------------------------------
+
+    def __eq__(self, other: object) -> bool:
+        self._fetch_all()
+        return list.__eq__(self, other)
+
+    def __ne__(self, other: object) -> bool:
+        return not self.__eq__(other)
+
+    @overload
+    def __getitem__(self, idx: int) -> T: ...
+
+    @overload
+    def __getitem__(self, idx: slice) -> list[T]: ...
+
+    def __getitem__(self, idx: int | slice) -> T | list[T]:
+        if isinstance(idx, int):
+            # Negative index requires knowing the length.
+            if idx < 0:
+                self._fetch_all()
+            else:
+                self._fetch_through_index(idx)
+        else:
+            # Slice — fetch all to avoid partial results.
+            self._fetch_all()
+        return list.__getitem__(self, idx)  # type: ignore[return-value]
diff --git a/tests/catalog/test_rest.py b/tests/catalog/test_rest.py
index 1eb9f26a56..8e7c7af663 100644
--- a/tests/catalog/test_rest.py
+++ b/tests/catalog/test_rest.py
@@ -45,6 +45,7 @@
     RestCatalog,
     ScanPlanningMode,
 )
+from pyiceberg.utils.pagination import PaginationList
 from pyiceberg.exceptions import (
     AuthorizationExpiredError,
     NamespaceAlreadyExistsError,
@@ -529,6 +530,59 @@ def test_list_tables_paginated_200(rest_mock: Mocker) -> None:
     ]
 
 
+def test_list_tables_returns_pagination_list(rest_mock: Mocker) -> None:
+    """list_tables returns a PaginationList that defers fetching page 2."""
+    namespace = "examples"
+
+    rest_mock.get(
+        f"{TEST_URI}v1/namespaces/{namespace}/tables",
+        json={
+            "identifiers": [
+                {"namespace": ["examples"], "name": "table1"},
+                {"namespace": ["examples"], "name": "table2"},
+            ],
+            "next-page-token": "pagetoken",
+        },
+        status_code=200,
+        request_headers=TEST_HEADERS,
+    )
+    # Second page — registered but should only be called when iterated past page 1.
+    rest_mock.get(
+        f"{TEST_URI}v1/namespaces/{namespace}/tables?pageToken=pagetoken",
+        json={
+            "identifiers": [
+                {"namespace": ["examples"], "name": "table3"},
+            ],
+        },
+        status_code=200,
+        request_headers=TEST_HEADERS,
+    )
+
+    result = RestCatalog("rest", uri=TEST_URI, token=TEST_TOKEN).list_tables(namespace)
+
+    assert isinstance(result, PaginationList)
+
+    # Consuming only the first two items must not trigger the second HTTP request.
+    first_two = []
+    for item in result:
+        first_two.append(item)
+        if len(first_two) == 2:
+            break
+
+    assert first_two == [("examples", "table1"), ("examples", "table2")]
+    # Only the initial request should have been made so far.
+    assert rest_mock.call_count == 1
+
+    # Consuming all items forces the second request.
+    all_tables = list(result)
+    assert all_tables == [
+        ("examples", "table1"),
+        ("examples", "table2"),
+        ("examples", "table3"),
+    ]
+    assert rest_mock.call_count == 2
+
+
 def test_list_tables_paginated_200_none_next_page_token(rest_mock: Mocker) -> None:
     namespace = "examples"
     # First page with next-page-token
diff --git a/tests/utils/test_pagination.py b/tests/utils/test_pagination.py
new file mode 100644
index 0000000000..a4d0546797
--- /dev/null
+++ b/tests/utils/test_pagination.py
@@ -0,0 +1,192 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+from __future__ import annotations
+
+import pytest
+
+from pyiceberg.utils.pagination import PaginationList
+
+
+def _make_pages(pages: list[list[int]]) -> tuple[list[int], str | None, list[list[int]]]:
+    """Build (first_page, first_token, remaining_pages) for tests."""
+    tokens = [f"tok{i}" for i in range(len(pages))]
+    first = pages[0]
+    first_token = tokens[1] if len(pages) > 1 else None
+    remaining = pages[1:]
+    return first, first_token, remaining
+
+
+def _make_fetch(remaining: list[list[int]], tokens: list[str | None]):
+    """Return a fetch callback that yields successive pages."""
+    idx = 0
+
+    def fetch(token: str) -> tuple[list[int], str | None]:
+        nonlocal idx
+        items = remaining[idx]
+        next_tok = tokens[idx]
+        idx += 1
+        return items, next_tok
+
+    return fetch
+
+
+def _simple_pagination_list(
+    pages: list[list[int]],
+) -> tuple[PaginationList, list[int]]:
+    """Build a PaginationList and return it with the full expected items."""
+    all_items = [item for page in pages for item in page]
+    next_tokens = [f"tok{i}" for i in range(1, len(pages))] + [None]
+
+    call_count = 0
+
+    def fetch(token: str) -> tuple[list[int], str | None]:
+        nonlocal call_count
+        # Pages are accessed in order starting from page index 1.
+        page_idx = int(token.replace("tok", ""))
+        call_count += 1
+        return pages[page_idx], next_tokens[page_idx]
+
+    first_token = f"tok1" if len(pages) > 1 else None
+    pl = PaginationList(pages[0], first_token, fetch)
+    return pl, all_items
+
+
+class TestPaginationListSinglePage:
+    """Single-page list behaves like a plain list."""
+
+    def test_iteration(self) -> None:
+        pl, expected = _simple_pagination_list([[1, 2, 3]])
+        assert list(pl) == expected
+
+    def test_len(self) -> None:
+        pl, expected = _simple_pagination_list([[1, 2, 3]])
+        assert len(pl) == len(expected)
+
+    def test_contains(self) -> None:
+        pl, _ = _simple_pagination_list([[1, 2, 3]])
+        assert 2 in pl
+        assert 99 not in pl
+
+    def test_getitem(self) -> None:
+        pl, _ = _simple_pagination_list([[10, 20, 30]])
+        assert pl[0] == 10
+        assert pl[2] == 30
+        assert pl[-1] == 30
+
+    def test_slice(self) -> None:
+        pl, _ = _simple_pagination_list([[1, 2, 3, 4]])
+        assert pl[1:3] == [2, 3]
+
+    def test_is_list_subclass(self) -> None:
+        pl, _ = _simple_pagination_list([[1, 2]])
+        assert isinstance(pl, list)
+
+
+class TestPaginationListMultiPage:
+    """Multi-page list lazily fetches subsequent pages."""
+
+    def test_iteration_fetches_all(self) -> None:
+        pl, expected = _simple_pagination_list([[1, 2], [3, 4], [5]])
+        assert list(pl) == expected
+
+    def test_partial_iteration_stops_early(self) -> None:
+        """Iterating over just the first page should not trigger any fetch."""
+        fetched = []
+
+        def fetch(token: str) -> tuple[list[int], str | None]:
+            fetched.append(token)
+            return [3, 4], None
+
+        pl: PaginationList[int] = PaginationList([1, 2], "tok1", fetch)
+
+        # Only consume the first two items (already in first page).
+        result = []
+        for item in pl:
+            result.append(item)
+            if item == 2:
+                break
+
+        assert result == [1, 2]
+        assert fetched == [], "No fetch should have occurred for first-page items"
+
+    def test_iteration_triggers_fetch_when_needed(self) -> None:
+        """Consuming past the first page triggers exactly one fetch per page."""
+        fetched_tokens: list[str] = []
+
+        def fetch(token: str) -> tuple[list[int], str | None]:
+            fetched_tokens.append(token)
+            if token == "tok1":
+                return [3], "tok2"
+            return [4, 5], None
+
+        pl: PaginationList[int] = PaginationList([1, 2], "tok1", fetch)
+        assert list(pl) == [1, 2, 3, 4, 5]
+        assert fetched_tokens == ["tok1", "tok2"]
+
+    def test_len_fetches_all(self) -> None:
+        pl, expected = _simple_pagination_list([[1, 2], [3]])
+        assert len(pl) == len(expected)
+
+    def test_contains_fetches_all(self) -> None:
+        pl, _ = _simple_pagination_list([[1, 2], [3, 4]])
+        assert 4 in pl
+        assert 99 not in pl
+
+    def test_getitem_fetches_lazily(self) -> None:
+        fetched: list[str] = []
+
+        def fetch(token: str) -> tuple[list[int], str | None]:
+            fetched.append(token)
+            if token == "tok1":
+                return [3, 4], "tok2"
+            return [5], None
+
+        pl: PaginationList[int] = PaginationList([1, 2], "tok1", fetch)
+
+        # First page: no fetch needed.
+        assert pl[0] == 1
+        assert fetched == []
+
+        # Index 2 is in the second page: one fetch.
+        assert pl[2] == 3
+        assert fetched == ["tok1"]
+
+        # Index 4 is in the third page.
+        assert pl[4] == 5
+        assert fetched == ["tok1", "tok2"]
+
+    def test_negative_index_fetches_all(self) -> None:
+        pl, _ = _simple_pagination_list([[1, 2], [3, 4, 5]])
+        assert pl[-1] == 5
+
+    def test_slice_fetches_all(self) -> None:
+        pl, _ = _simple_pagination_list([[1, 2], [3, 4]])
+        assert pl[1:3] == [2, 3]
+
+    def test_repr_fetches_all(self) -> None:
+        pl, _ = _simple_pagination_list([[1], [2]])
+        r = repr(pl)
+        assert "1" in r and "2" in r
+
+    def test_empty_first_page(self) -> None:
+        pl, expected = _simple_pagination_list([[], [1, 2]])
+        assert list(pl) == expected
+
+    def test_equality_with_plain_list(self) -> None:
+        pl, expected = _simple_pagination_list([[1, 2], [3]])
+        assert pl == expected

From 5a018994a9dde5d6ef97dcf6b971e707be28d954 Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Wed, 3 Jun 2026 14:23:23 -0500
Subject: [PATCH 02/11] fix(pagination): resolve mypy and ruff lint errors

- Change PaginationList base from 'list, Generic[T]' to 'list[T]' to
  satisfy mypy type-arg requirement
- Replace 'int' with 'SupportsIndex' in __getitem__ overloads to match
  the supertype signature expected by mypy
- Remove now-unnecessary '# type: ignore[return-value]' comment
- Add docstrings to all public methods (ruff D requirement)
- Add return type annotation to _make_fetch in test file
- Use PaginationList[int] with type parameter in test helper signature
- Import Callable from collections.abc in test file
---
 pyiceberg/utils/pagination.py  | 37 +++++++++++++++++++---------------
 tests/utils/test_pagination.py |  6 ++++--
 2 files changed, 25 insertions(+), 18 deletions(-)

diff --git a/pyiceberg/utils/pagination.py b/pyiceberg/utils/pagination.py
index 8c36888028..7c4e746607 100644
--- a/pyiceberg/utils/pagination.py
+++ b/pyiceberg/utils/pagination.py
@@ -20,12 +20,12 @@
 from __future__ import annotations
 
 from collections.abc import Callable, Iterator
-from typing import Generic, TypeVar, overload
+from typing import SupportsIndex, TypeVar, overload
 
 T = TypeVar("T")
 
 
-class PaginationList(list, Generic[T]):
+class PaginationList(list[T]):
     """A list that lazily fetches subsequent pages from a paginated API.
 
     The first page is pre-loaded on construction.  Subsequent pages are only
@@ -89,42 +89,47 @@ def __iter__(self) -> Iterator[T]:
     # ------------------------------------------------------------------
 
     def __len__(self) -> int:
+        """Return the total number of items, fetching all pages first."""
         self._fetch_all()
         return list.__len__(self)
 
     def __contains__(self, item: object) -> bool:
+        """Return True if item is present, fetching all pages first."""
         self._fetch_all()
         return list.__contains__(self, item)
 
     def __repr__(self) -> str:
+        """Return string representation after fetching all pages."""
         self._fetch_all()
         return f"PaginationList({list.__repr__(self)})"
 
-    # ------------------------------------------------------------------
-    # Index / slice access
-    # ------------------------------------------------------------------
-
     def __eq__(self, other: object) -> bool:
+        """Compare equality after fetching all pages."""
         self._fetch_all()
         return list.__eq__(self, other)
 
     def __ne__(self, other: object) -> bool:
+        """Compare inequality after fetching all pages."""
         return not self.__eq__(other)
 
+    # ------------------------------------------------------------------
+    # Index / slice access
+    # ------------------------------------------------------------------
+
     @overload
-    def __getitem__(self, idx: int) -> T: ...
+    def __getitem__(self, idx: SupportsIndex) -> T: ...
 
     @overload
     def __getitem__(self, idx: slice) -> list[T]: ...
 
-    def __getitem__(self, idx: int | slice) -> T | list[T]:
-        if isinstance(idx, int):
-            # Negative index requires knowing the length.
-            if idx < 0:
+    def __getitem__(self, idx: SupportsIndex | slice) -> T | list[T]:
+        """Fetch pages as needed before returning the requested item(s)."""
+        if isinstance(idx, slice):
+            self._fetch_all()
+        else:
+            i = idx.__index__()
+            if i < 0:
                 self._fetch_all()
             else:
-                self._fetch_through_index(idx)
-        else:
-            # Slice — fetch all to avoid partial results.
-            self._fetch_all()
-        return list.__getitem__(self, idx)  # type: ignore[return-value]
+                self._fetch_through_index(i)
+        return list.__getitem__(self, idx)
diff --git a/tests/utils/test_pagination.py b/tests/utils/test_pagination.py
index a4d0546797..3bc2f352d7 100644
--- a/tests/utils/test_pagination.py
+++ b/tests/utils/test_pagination.py
@@ -17,6 +17,8 @@
 
 from __future__ import annotations
 
+from collections.abc import Callable
+
 import pytest
 
 from pyiceberg.utils.pagination import PaginationList
@@ -31,7 +33,7 @@ def _make_pages(pages: list[list[int]]) -> tuple[list[int], str | None, list[lis
     return first, first_token, remaining
 
 
-def _make_fetch(remaining: list[list[int]], tokens: list[str | None]):
+def _make_fetch(remaining: list[list[int]], tokens: list[str | None]) -> Callable[[str], tuple[list[int], str | None]]:
     """Return a fetch callback that yields successive pages."""
     idx = 0
 
@@ -47,7 +49,7 @@ def fetch(token: str) -> tuple[list[int], str | None]:
 
 def _simple_pagination_list(
     pages: list[list[int]],
-) -> tuple[PaginationList, list[int]]:
+) -> tuple[PaginationList[int], list[int]]:
     """Build a PaginationList and return it with the full expected items."""
     all_items = [item for page in pages for item in page]
     next_tokens = [f"tok{i}" for i in range(1, len(pages))] + [None]

From 98d69008af712fc2d13563c4cca3cbdfa9132e4d Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Wed, 3 Jun 2026 16:52:24 -0500
Subject: [PATCH 03/11] fix(tests): resolve ruff lint errors and add len()
 performance tests

Ruff fixes:
- Remove unused 'import pytest' (F401)
- Remove extraneous f-prefix from plain string 'tok1' (F541)

Performance tests (requested by reviewer):
- test_len_single_page_makes_no_extra_fetches: verifies that len() on a
  single-page PaginationList does not invoke the fetch callback at all
- test_len_multi_page_fetches_all_pages_once: verifies that len() fetches
  remaining pages exactly once and caches the result for subsequent calls
---
 tests/utils/test_pagination.py | 41 +++++++++++++++++++++++++++++++---
 1 file changed, 38 insertions(+), 3 deletions(-)

diff --git a/tests/utils/test_pagination.py b/tests/utils/test_pagination.py
index 3bc2f352d7..5d6d863ae2 100644
--- a/tests/utils/test_pagination.py
+++ b/tests/utils/test_pagination.py
@@ -19,8 +19,6 @@
 
 from collections.abc import Callable
 
-import pytest
-
 from pyiceberg.utils.pagination import PaginationList
 
 
@@ -63,7 +61,7 @@ def fetch(token: str) -> tuple[list[int], str | None]:
         call_count += 1
         return pages[page_idx], next_tokens[page_idx]
 
-    first_token = f"tok1" if len(pages) > 1 else None
+    first_token = "tok1" if len(pages) > 1 else None
     pl = PaginationList(pages[0], first_token, fetch)
     return pl, all_items
 
@@ -192,3 +190,40 @@ def test_empty_first_page(self) -> None:
     def test_equality_with_plain_list(self) -> None:
         pl, expected = _simple_pagination_list([[1, 2], [3]])
         assert pl == expected
+
+
+class TestPaginationListPerformance:
+    """Verify that PaginationList does not eagerly fetch all pages for len()
+    on a single-page list, and that multi-page len() fetches all pages exactly once."""
+
+    def test_len_single_page_makes_no_extra_fetches(self) -> None:
+        """len() on a single-page PaginationList should not call the fetch callback."""
+        fetched: list[str] = []
+
+        def fetch(token: str) -> tuple[list[int], str | None]:
+            fetched.append(token)
+            return [], None
+
+        pl: PaginationList[int] = PaginationList([1, 2, 3], None, fetch)
+        assert len(pl) == 3
+        assert fetched == [], "No fetch should occur for a single-page list"
+
+    def test_len_multi_page_fetches_all_pages_once(self) -> None:
+        """len() on a multi-page PaginationList fetches remaining pages exactly once."""
+        fetch_count = 0
+
+        def fetch(token: str) -> tuple[list[int], str | None]:
+            nonlocal fetch_count
+            fetch_count += 1
+            if token == "p2":
+                return [3, 4], "p3"
+            return [5], None
+
+        pl: PaginationList[int] = PaginationList([1, 2], "p2", fetch)
+        assert len(pl) == 5
+        assert fetch_count == 2, "Should fetch pages 2 and 3 exactly once each"
+
+        # Second len() call must not trigger further fetches
+        fetch_count = 0
+        assert len(pl) == 5
+        assert fetch_count == 0, "Second len() should use cached data"

From 9fbcdd302262d2bb2966a2c5628fedaaaeeefd60 Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Wed, 3 Jun 2026 17:50:27 -0500
Subject: [PATCH 04/11] fix(pagination): add docstrings to __getitem__ overload
 stubs for pydocstyle D105

---
 pyiceberg/utils/pagination.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/pyiceberg/utils/pagination.py b/pyiceberg/utils/pagination.py
index 7c4e746607..a3db5ff2f3 100644
--- a/pyiceberg/utils/pagination.py
+++ b/pyiceberg/utils/pagination.py
@@ -117,10 +117,14 @@ def __ne__(self, other: object) -> bool:
     # ------------------------------------------------------------------
 
     @overload
-    def __getitem__(self, idx: SupportsIndex) -> T: ...
+    def __getitem__(self, idx: SupportsIndex) -> T:
+        """Return item at integer index, fetching pages as needed."""
+        ...
 
     @overload
-    def __getitem__(self, idx: slice) -> list[T]: ...
+    def __getitem__(self, idx: slice) -> list[T]:
+        """Return slice, fetching all remaining pages first."""
+        ...
 
     def __getitem__(self, idx: SupportsIndex | slice) -> T | list[T]:
         """Fetch pages as needed before returning the requested item(s)."""

From 10c2ba02238d72d63c0f7659349053874bfccbd8 Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Wed, 3 Jun 2026 18:35:48 -0500
Subject: [PATCH 05/11] fix(pagination): use noqa:D105 on overload stubs
 instead of docstrings

D418 prohibits docstrings on @overload stubs; suppress D105 (missing
docstring in magic method) with inline noqa comments instead.
---
 pyiceberg/utils/pagination.py | 8 ++------
 1 file changed, 2 insertions(+), 6 deletions(-)

diff --git a/pyiceberg/utils/pagination.py b/pyiceberg/utils/pagination.py
index a3db5ff2f3..ead3c58c8c 100644
--- a/pyiceberg/utils/pagination.py
+++ b/pyiceberg/utils/pagination.py
@@ -117,14 +117,10 @@ def __ne__(self, other: object) -> bool:
     # ------------------------------------------------------------------
 
     @overload
-    def __getitem__(self, idx: SupportsIndex) -> T:
-        """Return item at integer index, fetching pages as needed."""
-        ...
+    def __getitem__(self, idx: SupportsIndex) -> T: ...  # noqa: D105
 
     @overload
-    def __getitem__(self, idx: slice) -> list[T]:
-        """Return slice, fetching all remaining pages first."""
-        ...
+    def __getitem__(self, idx: slice) -> list[T]: ...  # noqa: D105
 
     def __getitem__(self, idx: SupportsIndex | slice) -> T | list[T]:
         """Fetch pages as needed before returning the requested item(s)."""

From 0b08854dc0badfed660c1d6ca78a90d928c47f03 Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Wed, 3 Jun 2026 18:48:31 -0500
Subject: [PATCH 06/11] fix(pagination): drop @overload stubs to resolve
 D105/D418 pydocstyle conflict
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

pydocstyle D105 requires docstrings on magic methods but D418 prohibits
docstrings on @overload stubs — these rules are irreconcilable for
@overload-decorated __getitem__. Since PaginationList is the only file in
the project using @overload, there is no established project pattern.

Drop the two stubs and keep only the concrete implementation with its
existing docstring. The union signature 'SupportsIndex | slice -> T | list[T]'
is correct; callers lose the narrowed return type but the runtime behaviour
is unchanged. Also removes the now-unused 'overload' import.
---
 pyiceberg/utils/pagination.py | 8 +-------
 1 file changed, 1 insertion(+), 7 deletions(-)

diff --git a/pyiceberg/utils/pagination.py b/pyiceberg/utils/pagination.py
index ead3c58c8c..86200a68a2 100644
--- a/pyiceberg/utils/pagination.py
+++ b/pyiceberg/utils/pagination.py
@@ -20,7 +20,7 @@
 from __future__ import annotations
 
 from collections.abc import Callable, Iterator
-from typing import SupportsIndex, TypeVar, overload
+from typing import SupportsIndex, TypeVar
 
 T = TypeVar("T")
 
@@ -116,12 +116,6 @@ def __ne__(self, other: object) -> bool:
     # Index / slice access
     # ------------------------------------------------------------------
 
-    @overload
-    def __getitem__(self, idx: SupportsIndex) -> T: ...  # noqa: D105
-
-    @overload
-    def __getitem__(self, idx: slice) -> list[T]: ...  # noqa: D105
-
     def __getitem__(self, idx: SupportsIndex | slice) -> T | list[T]:
         """Fetch pages as needed before returning the requested item(s)."""
         if isinstance(idx, slice):

From 6a7b6d041c93f752c3e98763b82a03746a6c444b Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Wed, 3 Jun 2026 18:53:58 -0500
Subject: [PATCH 07/11] fix(pagination): add D105/D418 to pydocstyle ignore
 list; restore @overload stubs

D105 (missing docstring in magic method) and D418 (@overload stubs must not
have docstrings) are mutually exclusive for @overload-decorated __getitem__.
Removing the stubs silenced pydocstyle but caused 3 mypy [override] errors
because list[T]'s __getitem__ is itself overloaded and the single-signature
Union form is incompatible with the supertype.

Fix: add D105 and D418 to the pydocstyle --ignore list, consistent with
D107 (missing __init__ docstring) which is already suppressed. Restore the
@overload stubs so mypy correctly narrows SupportsIndex -> T and slice ->
list[T]. Verified: mypy passes, ruff passes, pydocstyle passes.
---
 .pre-commit-config.yaml       | 2 +-
 pyiceberg/utils/pagination.py | 8 +++++++-
 2 files changed, 8 insertions(+), 2 deletions(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index f57bcd0d8d..fcea9644a7 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -58,7 +58,7 @@ repos:
       - id: pydocstyle
         args:
           [
-            "--ignore=D100,D102,D101,D103,D104,D107,D203,D212,D213,D404,D405,D406,D407,D411,D413,D415,D417",
+            "--ignore=D100,D102,D101,D103,D104,D105,D107,D203,D212,D213,D404,D405,D406,D407,D411,D413,D415,D417,D418",
           ]
         additional_dependencies:
           - tomli==2.0.1
diff --git a/pyiceberg/utils/pagination.py b/pyiceberg/utils/pagination.py
index 86200a68a2..7c4e746607 100644
--- a/pyiceberg/utils/pagination.py
+++ b/pyiceberg/utils/pagination.py
@@ -20,7 +20,7 @@
 from __future__ import annotations
 
 from collections.abc import Callable, Iterator
-from typing import SupportsIndex, TypeVar
+from typing import SupportsIndex, TypeVar, overload
 
 T = TypeVar("T")
 
@@ -116,6 +116,12 @@ def __ne__(self, other: object) -> bool:
     # Index / slice access
     # ------------------------------------------------------------------
 
+    @overload
+    def __getitem__(self, idx: SupportsIndex) -> T: ...
+
+    @overload
+    def __getitem__(self, idx: slice) -> list[T]: ...
+
     def __getitem__(self, idx: SupportsIndex | slice) -> T | list[T]:
         """Fetch pages as needed before returning the requested item(s)."""
         if isinstance(idx, slice):

From d71317cb3780b965b18c54b166ce41b847045a3a Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Wed, 3 Jun 2026 19:14:25 -0500
Subject: [PATCH 08/11] fix(tests): move PaginationList import to correct
 alphabetical position (isort)

---
 tests/catalog/test_rest.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/catalog/test_rest.py b/tests/catalog/test_rest.py
index 8e7c7af663..884c39ba55 100644
--- a/tests/catalog/test_rest.py
+++ b/tests/catalog/test_rest.py
@@ -45,7 +45,6 @@
     RestCatalog,
     ScanPlanningMode,
 )
-from pyiceberg.utils.pagination import PaginationList
 from pyiceberg.exceptions import (
     AuthorizationExpiredError,
     NamespaceAlreadyExistsError,
@@ -69,6 +68,7 @@
 from pyiceberg.typedef import RecursiveDict
 from pyiceberg.types import StringType
 from pyiceberg.utils.config import Config
+from pyiceberg.utils.pagination import PaginationList
 from pyiceberg.view import View
 from pyiceberg.view.metadata import ViewMetadata, ViewVersion
 

From 1780ae698b468d1ca0e55bbbe94b94ab86de6756 Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Wed, 3 Jun 2026 19:28:37 -0500
Subject: [PATCH 09/11] fix(tests): account for RestCatalog config endpoint
 call in call_count assertions

RestCatalog.__init__ calls v1/config which increments rest_mock.call_count.
Capture the baseline after construction and assert relative to it.
---
 tests/catalog/test_rest.py | 11 +++++++----
 1 file changed, 7 insertions(+), 4 deletions(-)

diff --git a/tests/catalog/test_rest.py b/tests/catalog/test_rest.py
index 884c39ba55..372499154f 100644
--- a/tests/catalog/test_rest.py
+++ b/tests/catalog/test_rest.py
@@ -558,7 +558,10 @@ def test_list_tables_returns_pagination_list(rest_mock: Mocker) -> None:
         request_headers=TEST_HEADERS,
     )
 
-    result = RestCatalog("rest", uri=TEST_URI, token=TEST_TOKEN).list_tables(namespace)
+    catalog = RestCatalog("rest", uri=TEST_URI, token=TEST_TOKEN)
+    calls_after_init = rest_mock.call_count  # config endpoint called during __init__
+
+    result = catalog.list_tables(namespace)
 
     assert isinstance(result, PaginationList)
 
@@ -570,8 +573,8 @@ def test_list_tables_returns_pagination_list(rest_mock: Mocker) -> None:
             break
 
     assert first_two == [("examples", "table1"), ("examples", "table2")]
-    # Only the initial request should have been made so far.
-    assert rest_mock.call_count == 1
+    # Only the initial list_tables request should have been made beyond __init__.
+    assert rest_mock.call_count == calls_after_init + 1
 
     # Consuming all items forces the second request.
     all_tables = list(result)
@@ -580,7 +583,7 @@ def test_list_tables_returns_pagination_list(rest_mock: Mocker) -> None:
         ("examples", "table2"),
         ("examples", "table3"),
     ]
-    assert rest_mock.call_count == 2
+    assert rest_mock.call_count == calls_after_init + 2
 
 
 def test_list_tables_paginated_200_none_next_page_token(rest_mock: Mocker) -> None:

From e2bb799c01559d63408efabd2fa56975d2f42c36 Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Sat, 6 Jun 2026 09:28:53 -0500
Subject: [PATCH 10/11] refactor(pagination): move PaginationList to typedef,
 add PageFetchResult alias, flatten tests

- Move PaginationList from pyiceberg/utils/pagination.py into pyiceberg/typedef.py
  alongside the project's other core types; delete the now-empty module
- Introduce _PageFetchResult TypeAlias for tuple[list[Identifier], str | None]
  in rest/__init__.py to avoid repeating the type on every _fetch_page signature
- Flatten TestPaginationList* classes into top-level functions to match the
  style used throughout the rest of the test suite
- Revert D105/D418 additions from .pre-commit-config.yaml; suppress D105
  inline on the two @overload stubs that cannot have docstrings
---
 .pre-commit-config.yaml            |   2 +-
 pyiceberg/catalog/rest/__init__.py |  12 +-
 pyiceberg/typedef.py               |  96 ++++++++-
 pyiceberg/utils/pagination.py      | 135 -------------
 tests/utils/test_pagination.py     | 305 ++++++++++++++---------------
 5 files changed, 248 insertions(+), 302 deletions(-)
 delete mode 100644 pyiceberg/utils/pagination.py

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index fcea9644a7..f57bcd0d8d 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -58,7 +58,7 @@ repos:
       - id: pydocstyle
         args:
           [
-            "--ignore=D100,D102,D101,D103,D104,D105,D107,D203,D212,D213,D404,D405,D406,D407,D411,D413,D415,D417,D418",
+            "--ignore=D100,D102,D101,D103,D104,D107,D203,D212,D213,D404,D405,D406,D407,D411,D413,D415,D417",
           ]
         additional_dependencies:
           - tomli==2.0.1
diff --git a/pyiceberg/catalog/rest/__init__.py b/pyiceberg/catalog/rest/__init__.py
index 81c479b674..190ca0b478 100644
--- a/pyiceberg/catalog/rest/__init__.py
+++ b/pyiceberg/catalog/rest/__init__.py
@@ -21,6 +21,7 @@
 from typing import (
     TYPE_CHECKING,
     Any,
+    TypeAlias,
 )
 from urllib.parse import quote, unquote
 
@@ -86,10 +87,9 @@
     TableRequirement,
     TableUpdate,
 )
-from pyiceberg.typedef import EMPTY_DICT, UTF8, IcebergBaseModel, Identifier, Properties
+from pyiceberg.typedef import EMPTY_DICT, UTF8, IcebergBaseModel, Identifier, PaginationList, Properties
 from pyiceberg.types import transform_dict_value_to_str
 from pyiceberg.utils.deprecated import deprecation_message
-from pyiceberg.utils.pagination import PaginationList
 from pyiceberg.utils.properties import get_first_property_value, get_header_properties, property_as_bool, property_as_int
 from pyiceberg.view import View
 from pyiceberg.view.metadata import ViewMetadata, ViewVersion
@@ -97,6 +97,8 @@
 if TYPE_CHECKING:
     import pyarrow as pa
 
+_PageFetchResult: TypeAlias = tuple[list[Identifier], str | None]
+
 
 class HttpMethod(str, Enum):
     GET = "GET"
@@ -1052,7 +1054,7 @@ def list_tables(self, namespace: str | Identifier) -> list[Identifier]:
                 raise ValueError(f"{PAGE_SIZE} must be a positive integer")
             params["pageSize"] = str(page_size)
 
-        def _fetch_page(page_token: str) -> tuple[list[Identifier], str | None]:
+        def _fetch_page(page_token: str) -> _PageFetchResult:
             params["pageToken"] = page_token
             response = self._session.get(url, params=params)
             try:
@@ -1164,7 +1166,7 @@ def list_views(self, namespace: str | Identifier) -> list[Identifier]:
                 raise ValueError(f"{PAGE_SIZE} must be a positive integer")
             params["pageSize"] = str(page_size)
 
-        def _fetch_page(page_token: str) -> tuple[list[Identifier], str | None]:
+        def _fetch_page(page_token: str) -> _PageFetchResult:
             params["pageToken"] = page_token
             response = self._session.get(url, params=params)
             try:
@@ -1286,7 +1288,7 @@ def list_namespaces(self, namespace: str | Identifier = ()) -> list[Identifier]:
         if namespace_tuple:
             params["parent"] = self._encode_namespace_path(namespace_tuple)
 
-        def _fetch_page(page_token: str) -> tuple[list[Identifier], str | None]:
+        def _fetch_page(page_token: str) -> _PageFetchResult:
             params["pageToken"] = page_token
             response = self._session.get(namespaces_url, params=params)
             try:
diff --git a/pyiceberg/typedef.py b/pyiceberg/typedef.py
index 6989144ef9..fc5051ab87 100644
--- a/pyiceberg/typedef.py
+++ b/pyiceberg/typedef.py
@@ -17,7 +17,7 @@
 from __future__ import annotations
 
 from abc import abstractmethod
-from collections.abc import Callable
+from collections.abc import Callable, Iterator
 from datetime import date, datetime, time
 from decimal import Decimal
 from typing import (
@@ -26,9 +26,11 @@
     Generic,
     Literal,
     Protocol,
+    SupportsIndex,
     TypeAlias,
     TypeVar,
     Union,
+    overload,
     runtime_checkable,
 )
 from uuid import UUID
@@ -211,3 +213,95 @@ def __hash__(self) -> int:
 
 TableVersion: TypeAlias = Literal[1, 2, 3]
 ViewVersion: TypeAlias = Literal[1]
+
+
+class PaginationList(list[T]):
+    """A list that lazily fetches subsequent pages from a paginated API.
+
+    The first page is pre-loaded on construction.  Subsequent pages are only
+    fetched when the caller iterates past items already in memory.  Operations
+    that require the complete result set — ``len()``, ``in``, slicing,
+    ``repr()`` — trigger a full fetch of all remaining pages.
+
+    Args:
+        first_page: Items from the first API response.
+        next_page_token: Pagination token returned with the first response,
+            or ``None`` if no further pages exist.
+        fetch_next_page: Callable that accepts a page token and returns a
+            tuple of ``(items, next_page_token_or_None)``.
+    """
+
+    def __init__(
+        self,
+        first_page: list[T],
+        next_page_token: str | None,
+        fetch_next_page: Callable[[str], tuple[list[T], str | None]],
+    ) -> None:
+        super().__init__(first_page)
+        self._next_page_token = next_page_token
+        self._fetch_next_page = fetch_next_page
+
+    def _fetch_all(self) -> None:
+        while self._next_page_token:
+            items, self._next_page_token = self._fetch_next_page(self._next_page_token)
+            list.extend(self, items)
+
+    def _fetch_through_index(self, idx: int) -> None:
+        while list.__len__(self) <= idx and self._next_page_token:
+            items, self._next_page_token = self._fetch_next_page(self._next_page_token)
+            list.extend(self, items)
+
+    def __iter__(self) -> Iterator[T]:
+        """Iterate lazily, fetching pages only as the caller advances."""
+        idx = 0
+        while True:
+            if idx < list.__len__(self):
+                yield list.__getitem__(self, idx)
+                idx += 1
+            elif self._next_page_token:
+                items, self._next_page_token = self._fetch_next_page(self._next_page_token)
+                list.extend(self, items)
+            else:
+                return
+
+    def __len__(self) -> int:
+        """Return the total number of items, fetching all pages first."""
+        self._fetch_all()
+        return list.__len__(self)
+
+    def __contains__(self, item: object) -> bool:
+        """Return True if item is present, fetching all pages first."""
+        self._fetch_all()
+        return list.__contains__(self, item)
+
+    def __repr__(self) -> str:
+        """Return string representation after fetching all pages."""
+        self._fetch_all()
+        return f"PaginationList({list.__repr__(self)})"
+
+    def __eq__(self, other: object) -> bool:
+        """Compare equality after fetching all pages."""
+        self._fetch_all()
+        return list.__eq__(self, other)
+
+    def __ne__(self, other: object) -> bool:
+        """Compare inequality after fetching all pages."""
+        return not self.__eq__(other)
+
+    @overload
+    def __getitem__(self, idx: SupportsIndex) -> T: ...  # noqa: D105
+
+    @overload
+    def __getitem__(self, idx: slice) -> list[T]: ...  # noqa: D105
+
+    def __getitem__(self, idx: SupportsIndex | slice) -> T | list[T]:
+        """Fetch pages as needed before returning the requested item(s)."""
+        if isinstance(idx, slice):
+            self._fetch_all()
+        else:
+            i = idx.__index__()
+            if i < 0:
+                self._fetch_all()
+            else:
+                self._fetch_through_index(i)
+        return list.__getitem__(self, idx)
diff --git a/pyiceberg/utils/pagination.py b/pyiceberg/utils/pagination.py
deleted file mode 100644
index 7c4e746607..0000000000
--- a/pyiceberg/utils/pagination.py
+++ /dev/null
@@ -1,135 +0,0 @@
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements.  See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership.  The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License.  You may obtain a copy of the License at
-#
-#   http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing,
-# software distributed under the License is distributed on an
-# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-# KIND, either express or implied.  See the License for the
-# specific language governing permissions and limitations
-# under the License.
-
-"""Lazy-loading pagination utilities."""
-
-from __future__ import annotations
-
-from collections.abc import Callable, Iterator
-from typing import SupportsIndex, TypeVar, overload
-
-T = TypeVar("T")
-
-
-class PaginationList(list[T]):
-    """A list that lazily fetches subsequent pages from a paginated API.
-
-    The first page is pre-loaded on construction.  Subsequent pages are only
-    fetched when the caller iterates past items already in memory.  Operations
-    that require the complete result set — ``len()``, ``in``, slicing,
-    ``repr()`` — trigger a full fetch of all remaining pages.
-
-    Args:
-        first_page: Items from the first API response.
-        next_page_token: Pagination token returned with the first response,
-            or ``None`` if no further pages exist.
-        fetch_next_page: Callable that accepts a page token and returns a
-            tuple of ``(items, next_page_token_or_None)``.
-    """
-
-    def __init__(
-        self,
-        first_page: list[T],
-        next_page_token: str | None,
-        fetch_next_page: Callable[[str], tuple[list[T], str | None]],
-    ) -> None:
-        super().__init__(first_page)
-        self._next_page_token = next_page_token
-        self._fetch_next_page = fetch_next_page
-
-    # ------------------------------------------------------------------
-    # Internal helpers — use list's own methods to avoid infinite loops.
-    # ------------------------------------------------------------------
-
-    def _fetch_all(self) -> None:
-        """Fetch all remaining pages into the list."""
-        while self._next_page_token:
-            items, self._next_page_token = self._fetch_next_page(self._next_page_token)
-            list.extend(self, items)
-
-    def _fetch_through_index(self, idx: int) -> None:
-        """Fetch pages until the list contains at least *idx + 1* items."""
-        while list.__len__(self) <= idx and self._next_page_token:
-            items, self._next_page_token = self._fetch_next_page(self._next_page_token)
-            list.extend(self, items)
-
-    # ------------------------------------------------------------------
-    # Lazy iteration
-    # ------------------------------------------------------------------
-
-    def __iter__(self) -> Iterator[T]:
-        """Iterate lazily, fetching pages only as the caller advances."""
-        idx = 0
-        while True:
-            if idx < list.__len__(self):
-                yield list.__getitem__(self, idx)
-                idx += 1
-            elif self._next_page_token:
-                items, self._next_page_token = self._fetch_next_page(self._next_page_token)
-                list.extend(self, items)
-            else:
-                return
-
-    # ------------------------------------------------------------------
-    # Operations that require the complete result set
-    # ------------------------------------------------------------------
-
-    def __len__(self) -> int:
-        """Return the total number of items, fetching all pages first."""
-        self._fetch_all()
-        return list.__len__(self)
-
-    def __contains__(self, item: object) -> bool:
-        """Return True if item is present, fetching all pages first."""
-        self._fetch_all()
-        return list.__contains__(self, item)
-
-    def __repr__(self) -> str:
-        """Return string representation after fetching all pages."""
-        self._fetch_all()
-        return f"PaginationList({list.__repr__(self)})"
-
-    def __eq__(self, other: object) -> bool:
-        """Compare equality after fetching all pages."""
-        self._fetch_all()
-        return list.__eq__(self, other)
-
-    def __ne__(self, other: object) -> bool:
-        """Compare inequality after fetching all pages."""
-        return not self.__eq__(other)
-
-    # ------------------------------------------------------------------
-    # Index / slice access
-    # ------------------------------------------------------------------
-
-    @overload
-    def __getitem__(self, idx: SupportsIndex) -> T: ...
-
-    @overload
-    def __getitem__(self, idx: slice) -> list[T]: ...
-
-    def __getitem__(self, idx: SupportsIndex | slice) -> T | list[T]:
-        """Fetch pages as needed before returning the requested item(s)."""
-        if isinstance(idx, slice):
-            self._fetch_all()
-        else:
-            i = idx.__index__()
-            if i < 0:
-                self._fetch_all()
-            else:
-                self._fetch_through_index(i)
-        return list.__getitem__(self, idx)
diff --git a/tests/utils/test_pagination.py b/tests/utils/test_pagination.py
index 5d6d863ae2..a1a86f5411 100644
--- a/tests/utils/test_pagination.py
+++ b/tests/utils/test_pagination.py
@@ -17,38 +17,12 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable
-
-from pyiceberg.utils.pagination import PaginationList
-
-
-def _make_pages(pages: list[list[int]]) -> tuple[list[int], str | None, list[list[int]]]:
-    """Build (first_page, first_token, remaining_pages) for tests."""
-    tokens = [f"tok{i}" for i in range(len(pages))]
-    first = pages[0]
-    first_token = tokens[1] if len(pages) > 1 else None
-    remaining = pages[1:]
-    return first, first_token, remaining
-
-
-def _make_fetch(remaining: list[list[int]], tokens: list[str | None]) -> Callable[[str], tuple[list[int], str | None]]:
-    """Return a fetch callback that yields successive pages."""
-    idx = 0
-
-    def fetch(token: str) -> tuple[list[int], str | None]:
-        nonlocal idx
-        items = remaining[idx]
-        next_tok = tokens[idx]
-        idx += 1
-        return items, next_tok
-
-    return fetch
+from pyiceberg.typedef import PaginationList
 
 
 def _simple_pagination_list(
     pages: list[list[int]],
 ) -> tuple[PaginationList[int], list[int]]:
-    """Build a PaginationList and return it with the full expected items."""
     all_items = [item for page in pages for item in page]
     next_tokens = [f"tok{i}" for i in range(1, len(pages))] + [None]
 
@@ -56,7 +30,6 @@ def _simple_pagination_list(
 
     def fetch(token: str) -> tuple[list[int], str | None]:
         nonlocal call_count
-        # Pages are accessed in order starting from page index 1.
         page_idx = int(token.replace("tok", ""))
         call_count += 1
         return pages[page_idx], next_tokens[page_idx]
@@ -66,164 +39,176 @@ def fetch(token: str) -> tuple[list[int], str | None]:
     return pl, all_items
 
 
-class TestPaginationListSinglePage:
-    """Single-page list behaves like a plain list."""
+# ---------------------------------------------------------------------------
+# Single-page: behaves like a plain list
+# ---------------------------------------------------------------------------
+
+
+def test_single_page_iteration() -> None:
+    pl, expected = _simple_pagination_list([[1, 2, 3]])
+    assert list(pl) == expected
+
+
+def test_single_page_len() -> None:
+    pl, expected = _simple_pagination_list([[1, 2, 3]])
+    assert len(pl) == len(expected)
+
+
+def test_single_page_contains() -> None:
+    pl, _ = _simple_pagination_list([[1, 2, 3]])
+    assert 2 in pl
+    assert 99 not in pl
+
+
+def test_single_page_getitem() -> None:
+    pl, _ = _simple_pagination_list([[10, 20, 30]])
+    assert pl[0] == 10
+    assert pl[2] == 30
+    assert pl[-1] == 30
+
+
+def test_single_page_slice() -> None:
+    pl, _ = _simple_pagination_list([[1, 2, 3, 4]])
+    assert pl[1:3] == [2, 3]
+
+
+def test_single_page_is_list_subclass() -> None:
+    pl, _ = _simple_pagination_list([[1, 2]])
+    assert isinstance(pl, list)
 
-    def test_iteration(self) -> None:
-        pl, expected = _simple_pagination_list([[1, 2, 3]])
-        assert list(pl) == expected
 
-    def test_len(self) -> None:
-        pl, expected = _simple_pagination_list([[1, 2, 3]])
-        assert len(pl) == len(expected)
+# ---------------------------------------------------------------------------
+# Multi-page: lazily fetches subsequent pages
+# ---------------------------------------------------------------------------
 
-    def test_contains(self) -> None:
-        pl, _ = _simple_pagination_list([[1, 2, 3]])
-        assert 2 in pl
-        assert 99 not in pl
 
-    def test_getitem(self) -> None:
-        pl, _ = _simple_pagination_list([[10, 20, 30]])
-        assert pl[0] == 10
-        assert pl[2] == 30
-        assert pl[-1] == 30
+def test_multi_page_iteration_fetches_all() -> None:
+    pl, expected = _simple_pagination_list([[1, 2], [3, 4], [5]])
+    assert list(pl) == expected
 
-    def test_slice(self) -> None:
-        pl, _ = _simple_pagination_list([[1, 2, 3, 4]])
-        assert pl[1:3] == [2, 3]
 
-    def test_is_list_subclass(self) -> None:
-        pl, _ = _simple_pagination_list([[1, 2]])
-        assert isinstance(pl, list)
+def test_multi_page_partial_iteration_stops_early() -> None:
+    fetched = []
+
+    def fetch(token: str) -> tuple[list[int], str | None]:
+        fetched.append(token)
+        return [3, 4], None
+
+    pl: PaginationList[int] = PaginationList([1, 2], "tok1", fetch)
+
+    result = []
+    for item in pl:
+        result.append(item)
+        if item == 2:
+            break
+
+    assert result == [1, 2]
+    assert fetched == [], "No fetch should have occurred for first-page items"
+
+
+def test_multi_page_iteration_triggers_fetch_when_needed() -> None:
+    fetched_tokens: list[str] = []
+
+    def fetch(token: str) -> tuple[list[int], str | None]:
+        fetched_tokens.append(token)
+        if token == "tok1":
+            return [3], "tok2"
+        return [4, 5], None
+
+    pl: PaginationList[int] = PaginationList([1, 2], "tok1", fetch)
+    assert list(pl) == [1, 2, 3, 4, 5]
+    assert fetched_tokens == ["tok1", "tok2"]
 
 
-class TestPaginationListMultiPage:
-    """Multi-page list lazily fetches subsequent pages."""
+def test_multi_page_len_fetches_all() -> None:
+    pl, expected = _simple_pagination_list([[1, 2], [3]])
+    assert len(pl) == len(expected)
 
-    def test_iteration_fetches_all(self) -> None:
-        pl, expected = _simple_pagination_list([[1, 2], [3, 4], [5]])
-        assert list(pl) == expected
 
-    def test_partial_iteration_stops_early(self) -> None:
-        """Iterating over just the first page should not trigger any fetch."""
-        fetched = []
+def test_multi_page_contains_fetches_all() -> None:
+    pl, _ = _simple_pagination_list([[1, 2], [3, 4]])
+    assert 4 in pl
+    assert 99 not in pl
 
-        def fetch(token: str) -> tuple[list[int], str | None]:
-            fetched.append(token)
-            return [3, 4], None
 
-        pl: PaginationList[int] = PaginationList([1, 2], "tok1", fetch)
+def test_multi_page_getitem_fetches_lazily() -> None:
+    fetched: list[str] = []
 
-        # Only consume the first two items (already in first page).
-        result = []
-        for item in pl:
-            result.append(item)
-            if item == 2:
-                break
+    def fetch(token: str) -> tuple[list[int], str | None]:
+        fetched.append(token)
+        if token == "tok1":
+            return [3, 4], "tok2"
+        return [5], None
+
+    pl: PaginationList[int] = PaginationList([1, 2], "tok1", fetch)
+
+    assert pl[0] == 1
+    assert fetched == []
+
+    assert pl[2] == 3
+    assert fetched == ["tok1"]
+
+    assert pl[4] == 5
+    assert fetched == ["tok1", "tok2"]
 
-        assert result == [1, 2]
-        assert fetched == [], "No fetch should have occurred for first-page items"
 
-    def test_iteration_triggers_fetch_when_needed(self) -> None:
-        """Consuming past the first page triggers exactly one fetch per page."""
-        fetched_tokens: list[str] = []
+def test_multi_page_negative_index_fetches_all() -> None:
+    pl, _ = _simple_pagination_list([[1, 2], [3, 4, 5]])
+    assert pl[-1] == 5
 
-        def fetch(token: str) -> tuple[list[int], str | None]:
-            fetched_tokens.append(token)
-            if token == "tok1":
-                return [3], "tok2"
-            return [4, 5], None
 
-        pl: PaginationList[int] = PaginationList([1, 2], "tok1", fetch)
-        assert list(pl) == [1, 2, 3, 4, 5]
-        assert fetched_tokens == ["tok1", "tok2"]
+def test_multi_page_slice_fetches_all() -> None:
+    pl, _ = _simple_pagination_list([[1, 2], [3, 4]])
+    assert pl[1:3] == [2, 3]
 
-    def test_len_fetches_all(self) -> None:
-        pl, expected = _simple_pagination_list([[1, 2], [3]])
-        assert len(pl) == len(expected)
 
-    def test_contains_fetches_all(self) -> None:
-        pl, _ = _simple_pagination_list([[1, 2], [3, 4]])
-        assert 4 in pl
-        assert 99 not in pl
+def test_multi_page_repr_fetches_all() -> None:
+    pl, _ = _simple_pagination_list([[1], [2]])
+    r = repr(pl)
+    assert "1" in r and "2" in r
 
-    def test_getitem_fetches_lazily(self) -> None:
-        fetched: list[str] = []
 
-        def fetch(token: str) -> tuple[list[int], str | None]:
-            fetched.append(token)
-            if token == "tok1":
-                return [3, 4], "tok2"
-            return [5], None
+def test_multi_page_empty_first_page() -> None:
+    pl, expected = _simple_pagination_list([[], [1, 2]])
+    assert list(pl) == expected
 
-        pl: PaginationList[int] = PaginationList([1, 2], "tok1", fetch)
 
-        # First page: no fetch needed.
-        assert pl[0] == 1
-        assert fetched == []
+def test_multi_page_equality_with_plain_list() -> None:
+    pl, expected = _simple_pagination_list([[1, 2], [3]])
+    assert pl == expected
 
-        # Index 2 is in the second page: one fetch.
-        assert pl[2] == 3
-        assert fetched == ["tok1"]
 
-        # Index 4 is in the third page.
-        assert pl[4] == 5
-        assert fetched == ["tok1", "tok2"]
-
-    def test_negative_index_fetches_all(self) -> None:
-        pl, _ = _simple_pagination_list([[1, 2], [3, 4, 5]])
-        assert pl[-1] == 5
-
-    def test_slice_fetches_all(self) -> None:
-        pl, _ = _simple_pagination_list([[1, 2], [3, 4]])
-        assert pl[1:3] == [2, 3]
-
-    def test_repr_fetches_all(self) -> None:
-        pl, _ = _simple_pagination_list([[1], [2]])
-        r = repr(pl)
-        assert "1" in r and "2" in r
-
-    def test_empty_first_page(self) -> None:
-        pl, expected = _simple_pagination_list([[], [1, 2]])
-        assert list(pl) == expected
+# ---------------------------------------------------------------------------
+# Performance: len() should not eagerly fetch all pages for a single-page list
+# ---------------------------------------------------------------------------
 
-    def test_equality_with_plain_list(self) -> None:
-        pl, expected = _simple_pagination_list([[1, 2], [3]])
-        assert pl == expected
 
+def test_performance_len_single_page_makes_no_extra_fetches() -> None:
+    fetched: list[str] = []
+
+    def fetch(token: str) -> tuple[list[int], str | None]:
+        fetched.append(token)
+        return [], None
+
+    pl: PaginationList[int] = PaginationList([1, 2, 3], None, fetch)
+    assert len(pl) == 3
+    assert fetched == [], "No fetch should occur for a single-page list"
 
-class TestPaginationListPerformance:
-    """Verify that PaginationList does not eagerly fetch all pages for len()
-    on a single-page list, and that multi-page len() fetches all pages exactly once."""
 
-    def test_len_single_page_makes_no_extra_fetches(self) -> None:
-        """len() on a single-page PaginationList should not call the fetch callback."""
-        fetched: list[str] = []
-
-        def fetch(token: str) -> tuple[list[int], str | None]:
-            fetched.append(token)
-            return [], None
-
-        pl: PaginationList[int] = PaginationList([1, 2, 3], None, fetch)
-        assert len(pl) == 3
-        assert fetched == [], "No fetch should occur for a single-page list"
-
-    def test_len_multi_page_fetches_all_pages_once(self) -> None:
-        """len() on a multi-page PaginationList fetches remaining pages exactly once."""
-        fetch_count = 0
-
-        def fetch(token: str) -> tuple[list[int], str | None]:
-            nonlocal fetch_count
-            fetch_count += 1
-            if token == "p2":
-                return [3, 4], "p3"
-            return [5], None
-
-        pl: PaginationList[int] = PaginationList([1, 2], "p2", fetch)
-        assert len(pl) == 5
-        assert fetch_count == 2, "Should fetch pages 2 and 3 exactly once each"
-
-        # Second len() call must not trigger further fetches
-        fetch_count = 0
-        assert len(pl) == 5
-        assert fetch_count == 0, "Second len() should use cached data"
+def test_performance_len_multi_page_fetches_all_pages_once() -> None:
+    fetch_count = 0
+
+    def fetch(token: str) -> tuple[list[int], str | None]:
+        nonlocal fetch_count
+        fetch_count += 1
+        if token == "p2":
+            return [3, 4], "p3"
+        return [5], None
+
+    pl: PaginationList[int] = PaginationList([1, 2], "p2", fetch)
+    assert len(pl) == 5
+    assert fetch_count == 2, "Should fetch pages 2 and 3 exactly once each"
+
+    fetch_count = 0
+    assert len(pl) == 5
+    assert fetch_count == 0, "Second len() should use cached data"

From 392a8f5ac8d4e8dddf17886536372e74e0179c9a Mon Sep 17 00:00:00 2001
From: stark256-spec <stark256-spec@users.noreply.github.com>
Date: Sat, 6 Jun 2026 10:11:20 -0500
Subject: [PATCH 11/11] fix: update PaginationList import in test_rest.py

---
 tests/catalog/test_rest.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/catalog/test_rest.py b/tests/catalog/test_rest.py
index 372499154f..dd62c00a89 100644
--- a/tests/catalog/test_rest.py
+++ b/tests/catalog/test_rest.py
@@ -68,7 +68,7 @@
 from pyiceberg.typedef import RecursiveDict
 from pyiceberg.types import StringType
 from pyiceberg.utils.config import Config
-from pyiceberg.utils.pagination import PaginationList
+from pyiceberg.typedef import PaginationList
 from pyiceberg.view import View
 from pyiceberg.view.metadata import ViewMetadata, ViewVersion