feat: Implement automatic pagination for endpoints by parsing Link headers and abstracting page/page_size parameters from the generated API.

AmbientLighter · AmbientLighter · commit 1875cd6c9a1c · 2025-11-30T16:15:59.000+02:00
diff --git a/openapi_python_client/templates/endpoint_macros.py.jinja b/openapi_python_client/templates/endpoint_macros.py.jinja
@@ -89,7 +89,7 @@ _kwargs["json"] = {{ property.python_name }}
 {% endmacro %}
 
 {# The all the kwargs passed into an endpoint (and variants thereof)) #}
-{% macro arguments(endpoint, include_client=True) %}
+{% macro arguments(endpoint, include_client=True, skip_pagination=False) %}
 {# path parameters #}
 {% for parameter in endpoint.path_parameters %}
 {{ parameter.to_string() }},
@@ -117,7 +117,9 @@ body: Union[
 {% endif %}
 {# query parameters #}
 {% for parameter in endpoint.query_parameters %}
+{% if not skip_pagination or parameter.name not in ['page', 'page_size'] %}
 {{ parameter.to_string() }},
+{% endif %}
 {% endfor %}
 {% for parameter in endpoint.header_parameters %}
 {{ parameter.to_string() }},
@@ -129,7 +131,7 @@ body: Union[
 {% endmacro %}
 
 {# Just lists all kwargs to endpoints as name=name for passing to other functions #}
-{% macro kwargs(endpoint, include_client=True) %}
+{% macro kwargs(endpoint, include_client=True, skip_pagination=False) %}
 {% for parameter in endpoint.path_parameters %}
 {{ parameter.python_name }}={{ parameter.python_name }},
 {% endfor %}
@@ -140,7 +142,9 @@ client=client,
 body=body,
 {% endif %}
 {% for parameter in endpoint.query_parameters %}
+{% if not skip_pagination or parameter.name not in ['page', 'page_size'] %}
 {{ parameter.python_name }}={{ parameter.python_name }},
+{% endif %}
 {% endfor %}
 {% for parameter in endpoint.header_parameters %}
 {{ parameter.python_name }}={{ parameter.python_name }},
diff --git a/openapi_python_client/templates/endpoint_module.py.jinja b/openapi_python_client/templates/endpoint_module.py.jinja
@@ -7,6 +7,7 @@ from ...client import AuthenticatedClient, Client
 from ...types import Response, UNSET
 from ... import errors
 
+
 {% for relative in endpoint.relative_imports | sort %}
 {{ relative }}
 {% endfor %}
@@ -22,6 +23,10 @@ from ... import errors
 {% set parsed_responses = (endpoint.responses | length > 0) and return_string != "Any" %}
 {% endif %}
 
+{% if endpoint.name.endswith("_list") and parsed_responses and return_string.startswith("list[") %}
+from ...utils import parse_link_header
+{% endif %}
+
 def _get_kwargs(
     {{ arguments(endpoint, include_client=False) | indent(4) }}
 ) -> dict[str, Any]:
@@ -165,3 +170,162 @@ async def asyncio(
         {{ kwargs(endpoint) }}
     )).parsed
 {% endif %}
+
+{% if endpoint.name.endswith("_list") and parsed_responses and return_string.startswith("list[") %}
+def sync_all(
+    {{ arguments(endpoint, skip_pagination=True) | indent(4) }}
+) -> {{ return_string }}:
+    """Get All Pages
+
+    Fetch all pages of paginated results and return them as a single list.
+
+    Every request reuses the query parameters of the first one; only ``page`` changes,
+    taking the value found in the ``rel="next"`` URL of the previous response's ``Link``
+    header. Fetching stops when a response has no ``next`` link, when that link has no
+    ``page`` query parameter, or when it names a page that was already requested (so a
+    self-referencing or cyclic ``next`` link cannot loop forever).
+
+    Note: page_size will be set to 100 (the maximum allowed) automatically.
+
+    Args:
+{% set all_parameters = endpoint.list_all_parameters() %}
+{% if all_parameters %}
+{% for parameter in all_parameters %}
+{% if parameter.name not in ['page', 'page_size'] %}
+        {{ parameter.to_docstring() | wordwrap(90) | indent(8) }}
+{% endif %}
+{% endfor %}
+{% endif %}
+
+    Raises:
+        errors.UnexpectedStatus: If the server returns an undocumented status code.
+        httpx.TimeoutException: If the request takes longer than Client.timeout.
+
+    Returns:
+        {{ return_string }}: Combined results from all pages
+    """
+    from urllib.parse import parse_qs, urlparse
+
+    # This function is only rendered when return_string is a ``list[...]`` type, so
+    # the accumulator can be annotated with it directly.
+    all_results: {{ return_string }} = []
+
+    # Build the request once; only its query parameters change between pages.
+    kwargs = _get_kwargs(
+        {{ kwargs(endpoint, include_client=False, skip_pagination=True) }}
+    )
+
+    # Make sure a "params" mapping exists before adding pagination values to it.
+    params = kwargs.setdefault("params", {})
+    params["page_size"] = 100
+
+    # Page values already taken from a "next" link. The first request is built
+    # without a page argument, so it is not recorded here.
+    requested_pages: set[str] = set()
+
+    while True:
+        response = client.get_httpx_client().request(**kwargs)
+        parsed_response = _parse_response(client=client, response=response)
+
+        # Skip falsy results (e.g. None or an empty list) instead of extending with them.
+        if parsed_response:
+            all_results.extend(parsed_response)
+
+        links = parse_link_header(response.headers.get("Link", ""))
+        next_url = links.get("next")
+        if not next_url:
+            break
+
+        # parse_qs maps each key to a list of values and drops blank ones, so a
+        # present "page" entry always has a usable first element.
+        next_pages = parse_qs(urlparse(next_url).query).get("page")
+        if not next_pages or next_pages[0] in requested_pages:
+            break
+
+        # Update only the page parameter, keep all other params
+        page_number = next_pages[0]
+        requested_pages.add(page_number)
+        params["page"] = page_number
+
+    return all_results
+
+
+async def asyncio_all(
+    {{ arguments(endpoint, skip_pagination=True) | indent(4) }}
+) -> {{ return_string }}:
+    """Get All Pages (Async)
+
+    Fetch all pages of paginated results asynchronously and return them as a single list.
+
+    Every request reuses the query parameters of the first one; only ``page`` changes,
+    taking the value found in the ``rel="next"`` URL of the previous response's ``Link``
+    header. Fetching stops when a response has no ``next`` link, when that link has no
+    ``page`` query parameter, or when it names a page that was already requested (so a
+    self-referencing or cyclic ``next`` link cannot loop forever).
+
+    Note: page_size will be set to 100 (the maximum allowed) automatically.
+
+    Args:
+{% set all_parameters = endpoint.list_all_parameters() %}
+{% if all_parameters %}
+{% for parameter in all_parameters %}
+{% if parameter.name not in ['page', 'page_size'] %}
+        {{ parameter.to_docstring() | wordwrap(90) | indent(8) }}
+{% endif %}
+{% endfor %}
+{% endif %}
+
+    Raises:
+        errors.UnexpectedStatus: If the server returns an undocumented status code.
+        httpx.TimeoutException: If the request takes longer than Client.timeout.
+
+    Returns:
+        {{ return_string }}: Combined results from all pages
+    """
+    from urllib.parse import parse_qs, urlparse
+
+    # This function is only rendered when return_string is a ``list[...]`` type, so
+    # the accumulator can be annotated with it directly.
+    all_results: {{ return_string }} = []
+
+    # Build the request once; only its query parameters change between pages.
+    kwargs = _get_kwargs(
+        {{ kwargs(endpoint, include_client=False, skip_pagination=True) }}
+    )
+
+    # Make sure a "params" mapping exists before adding pagination values to it.
+    params = kwargs.setdefault("params", {})
+    params["page_size"] = 100
+
+    # Page values already taken from a "next" link. The first request is built
+    # without a page argument, so it is not recorded here.
+    requested_pages: set[str] = set()
+
+    while True:
+        response = await client.get_async_httpx_client().request(**kwargs)
+        parsed_response = _parse_response(client=client, response=response)
+
+        # Skip falsy results (e.g. None or an empty list) instead of extending with them.
+        if parsed_response:
+            all_results.extend(parsed_response)
+
+        links = parse_link_header(response.headers.get("Link", ""))
+        next_url = links.get("next")
+        if not next_url:
+            break
+
+        # parse_qs maps each key to a list of values and drops blank ones, so a
+        # present "page" entry always has a usable first element.
+        next_pages = parse_qs(urlparse(next_url).query).get("page")
+        if not next_pages or next_pages[0] in requested_pages:
+            break
+
+        # Update only the page parameter, keep all other params
+        page_number = next_pages[0]
+        requested_pages.add(page_number)
+        params["page"] = page_number
+
+    return all_results
+{% endif %}
+
+
diff --git a/openapi_python_client/templates/utils.py.jinja b/openapi_python_client/templates/utils.py.jinja
@@ -0,0 +1,31 @@
+def parse_link_header(link_header: str) -> dict[str, str]:
+    """Parse a Link header to extract pagination URLs.
+
+    Links are split on commas outside ``<...>``, so a comma or semicolon inside a
+    bracketed URL is kept. The ``rel`` parameter name is case-insensitive, and a value
+    listing several relation types (``rel="next last"``) maps each of them, lower-cased,
+    to the URL. Links without a ``rel`` parameter are ignored.
+
+    Args:
+        link_header: The Link header string (e.g. '<url>; rel="next"')
+
+    Returns:
+        Dictionary mapping relation types (next, prev, first, last) to URLs
+    """
+    import re
+
+    links: dict[str, str] = {}
+    # Negative lookahead: a comma followed by ">" before any "<" sits inside a URL.
+    for link in re.split(r",(?![^<>]*>)", link_header or ""):
+        link = link.strip()
+        if link.startswith("<"):  # bracketed target ends at ">", a bare one at ";"
+            url, _, params = link[1:].partition(">")
+        else:
+            url, _, params = link.partition(";")
+        for param in params.split(";"):
+            name, _, value = param.partition("=")
+            if name.strip().lower() == "rel":
+                for rel_type in value.strip().strip("\"'").split():
+                    links[rel_type.lower()] = url.strip()
+                break  # only the first rel parameter of a link is honoured
+    return links