
    q-Ph                   ^   d dl mZ d dlZd dlZd dlZd dlZd dlmZmZ d dl	m
Z
m	Z	mZmZ d dlmZmZmZ d dlmZmZ d dlmZ d dlmZ d d	lmZmZmZmZmZmZmZ d dlm Z! d d
l"m#Z$ d dl%m&Z&m'Z' d dl(m)Z)m*Z* d dl+m,Z,m-Z- d dl.m/Z/m0Z0m1Z1m2Z2 d dl3m4Z4 d dl5m6Z6m7Z7 d dl8m9Z9 d dl:m;Z; d dl<m=Z=m>Z> d dl?m@Z@mAZAmBZBmCZCmDZDmEZEmFZFmGZGmHZHmIZImJZJ d dlKmLZLmMZM d dlNmOZOmPZPmQZQmRZRmSZSmTZTmUZUmVZVmWZWmXZXmYZYmZZZm[Z[m\Z\m]Z]m^Z^m_Z_m`Z`maZambZbmcZcmdZdmeZemfZfmgZgmhZh d dlimjZj d dlkmlZlmmZmmnZn d dlkmoZp d dlkmqZr d dlsmtZt d dlumvZv d dlwmxZx d dlymzZz d dl{m|Z| d d l}m~Z~mZ d d!lmZ d d"lmZmZ  ej        e          5  d d#lmZmZ ddd           n# 1 swxY w Y   er
d dlZd d$lmZmZmZ d d%lmZ d d&lmZmZ d d'l}mZ  ej        e          5  d d(lmZmZ ddd           n# 1 swxY w Y   d d)l"mZmZmZ d d*l%mZmZmZmZmZmZmZmZmZmZmZmZmZmZmZmZm&Z&mZmZmZmZmZmZmZmZmZmZ d d+lkmZ d d,lmZ d d-lmZ ej        d.k    r	d d/lmZmZ nd d/lmZmZ ej        d0k    rd d1lmZ nd d1lmZ ej        d2k    rd d3lm1Z1 nd d3lm1Z1  ed4          Z ed5          ZdGd9ZdHd=ZdIdDZ G dE dF          ZdS )J    )annotationsN)
CollectionMapping)datedatetimetime	timedelta)	lru_cachepartialreduce)BytesIOStringIO)and_)Path)TYPE_CHECKINGAnyCallableClassVarNoReturnTypeVaroverload)	functions)ParquetMetadataPartitioningScheme)_AioDataFrameResult_GeventDataFrameResult)negate_duration_stringparse_as_duration_string)deprecate_renamed_parameterdeprecate_streaming_parameter
deprecatedissue_deprecation_warning)wrap_parquet_metadata_callback)parse_into_expressionparse_into_list_of_expressions)serialize_polars_object)LazyPolarsSlice)issue_unstable_warningunstable)_is_generatordisplay_dot_graphextend_boolfind_stacklevelis_bool_sequenceis_sequenceissue_warningnormalize_filepathparse_percentilesqualified_type_namerequire_same_type)wrap_df	wrap_expr)DTYPE_TEMPORAL_UNITSN_INFER_DEFAULTBooleanCategoricalDateDatetimeDurationEnumFloat32Float64Int8Int16Int32Int64Int128NullObjectStringTimeUInt8UInt16UInt32UInt64Unknownis_polars_dtypeparse_into_dtype)DataTypeGroup)_PYARROW_AVAILABLEimport_optional
subprocess)polars_cloud)pyarrow)PerformanceWarning)CompatLevel)	GPUEngine)LazyGroupBy)InProcessQuery)DEFAULT_QUERY_OPT_FLAGSforward_old_opt_flags)Schema)by_dtypeexpand_selector)PyLazyFrameget_engine_affinity)	AwaitableIterableSequence)IOBase)IOLiteral)QueryOptFlags)PyExprPyPartitioning)	DataFrameDataTypeExpr)AsofJoinStrategyClosedIntervalColumnNameOrSelectorCsvQuoteStyle
EngineTypeExplainFormatFillNullStrategyFrameInitTypesIntoExprIntoExprColumnIpcCompressionJoinStrategyJoinValidationLabelMaintainOrderJoinOrientationr   	PlanStagePolarsDataTypePythonDataTypeQuantileMethodSchemaDefinition
SchemaDictSerializationFormatStartBySyncOnCloseMethodUniqueKeepStrategy)numpy)CredentialProviderFunction)ParquetFieldOverwrites)   
   )Concatenate	ParamSpec)r      )Self)r      )r!   TPenginers   returnc                .    | dk    rt                      n| S )Nauto)rb   r   s    V/var/www/html/test/jupyter/venv/lib/python3.11/site-packages/polars/lazyframe/frame.py_select_enginer      s    $*f$4$4   &@    path5str | Path | IO[bytes] | IO[str] | PartitioningScheme1str | Path | IO[bytes] | IO[str] | PyPartitioningc                L   t          | t          t          f          rt          |           S t          | t          j                  r| S t          | t                    r| j        S t          t          | dd                     r| S dt          |           d}t          |          )Nwritez!`path` argument has invalid type z), and cannot be turned into a sink target)
isinstancestrr   r1   iorf   r   _py_partitioningcallablegetattrr3   	TypeError)r   msgs     r   _to_sink_targetr      s     $d$$ !$'''	D")	$	$ 		D,	-	- $$	'$..	/	/ x2Ed2K2Kxxxnnr   	streamingbool
backgroundnew_streaming_eager(Callable[[Any, int | None], None] | Nonec               0   t          | t                    x}p| dk    }|s| dv sd| }t          |          |s|s|r|rt          dt                     d}|rd}|sd S t          ddd	
          }|st                      } t          |j        |           S )Ngpu)r   cpuz	in-memoryr   old-streamingr   zInvalid engine argument engine=zUGPU engine does not support streaming or background collection, disabling GPU engine.categoryFcudf_polarsz*GPU engine requested, but required packagezPlease install using the command `pip install cudf-polars-cu12` (or `pip install --extra-index-url=https://pypi.nvidia.com cudf-polars-cu11` if your system has a CUDA 11 driver).)
err_prefixinstall_message)config)r   rY   
ValueErrorr0   UserWarningrS   r   execute_with_cudf)	r   r   r   r   r   is_config_objis_gpur   r   s	            r   _gpu_engine_callbackr      s      *&)<<<mP5FVVV222oo Z = f $ 	
 	
 	
 	

   t!?4		 	 	K  ;0@@@@r   c                     e Zd ZU dZded<    e            Zded<   	 	 ddddedd	ddZe	dd            Z
ddZddZe	ddd dd&            Ze	d'd(dd-            Zedd/            Zedd1            Zedd3            Zedd5            Zdd7Zdd:Zdd=Zdd>Zdd?Zdd@ZddAZddBZddDZddEZdddGZddJZddKZ ddLZ!ddMZ"e#	 ddNd(ddQ            Z$e#dddS            Z$e#dNd(ddU            Z$	 dd'd(ddXZ$d d`Z%	 ddbdcddiZ& e'             e(            djddddddddddddkde)dldd                        Z* e'             e(            ddddddddddddddddkdde)ddd                        Z+dddZ,dddddddZ-ddddZ. e/ddd          ddd	d            Z0 e/ddd          ddd	d            Z1 e(            ddddddddddddddke)dd
d            Z2e#dddddddddddke)ddd            Z3e#dddddddddddkde)ddd            Z3 e'             e(            dddddddddddkde)ddd                        Z3e#dke)ddd            Z4e#ddke)dddÄ            Z4 e'            ddke)dddń            Z4ddƄZ5e#ddddddddkddddNddkde)dɜdd߄            Z6e#ddddddddkdddddkde)ddd            Z6ddddddddkdddddddke)dddZ6e#dddddkddddNdke)ddd            Z7e#dddddkddddke)d
dd            Z7dddddkdddddke)dddZ7e#ddddddddddddddddkddddNdke)ddd            Z8e#ddddddddddddddddkddddke)ddd            Z8ddddddddddddddddkdddddke)dddZ8e#dddkddddNdke)d	dd            Z9e#dddkddddke)ddd	            Z9dddkdddddke)d	dd
Z9 e:d          	 ddddddddddddddd            Z;	 ddddddddddddddddZ<ddZ=ddZ>ddd dZ?d!d"dZ@ddZAddd#d!ZBd$d#ZCd$d$ZDd%d'ZEd%d(ZFdd)d&d,ZG e/dd-d.          dd/dd0d'd9            ZH e/dd-d.          dddd:d:dd;d<d(dC            ZIdddddddDdEdddddddFd)dXZJ e/dYdZd[          	 	 d*dddEd]dddddd^	d+de            ZK eL            dEdfd,dh            ZMd%diZNd%djZO e:dk          d-dm            ZPddd.dpZQddd/dsZRddtZS	 d0ddvd1dzZTdd2d|ZUd3d"d~ZVd3d"dZWd3d"dZXddZYddZZ e:d          dd            Z[d4d5dZ\ e:d          d6d5d            Z]d!d7dZ^	 	 	 d8ddd9dZ_d:dZ`d0d;dZad0d;dZbddZcddZdddZeddZfddZgddZh	 d<d=dZid>dZj	 ddddd?dZk	 dd@dZl	 dd@dZm	 dddddddAdZndddddddddBdZoddZpdCdZqdDdZrdddEdZs eL            	 	 dFdddd:ddGdń            ZtddƄZu e:dǦ          	 	 	 	 dHddȜdId˄            Zv eL            	 	 dJdKd҄            Zw eL            dӐdӐdӐdӐdԐdԐd՜dLd            Zx	 	 ddMdZydS (N  	LazyFrameu  
    Representation of a Lazy computation graph/query against a DataFrame.

    This allows for whole-query optimisation in addition to parallelism, and
    is the preferred (and highest-performance) mode of operation for polars.

    Parameters
    ----------
    data : dict, Sequence, ndarray, Series, or pandas.DataFrame
        Two-dimensional data in various forms; dict input must contain Sequences,
        Generators, or a `range`. Sequence may contain Series or other Sequences.
    schema : Sequence of str, (str,DataType) pairs, or a {str:DataType,} dict
        The LazyFrame schema may be declared in several ways:

        * As a dict of {name:type} pairs; if type is None, it will be auto-inferred.
        * As a list of column names; in this case types are automatically inferred.
        * As a list of (name,type) pairs; this is equivalent to the dictionary form.

        If you supply a list of column names that does not match the names in the
        underlying data, the names given here will overwrite them. The number
        of names given in the schema should match the underlying data dimensions.
    schema_overrides : dict, default None
        Support type specification or override of one or more columns; note that
        any dtypes inferred from the schema param will be overridden.

        The number of entries in the schema should match the underlying data
        dimensions, unless a sequence of dictionaries is being passed, in which case
        a *partial* schema can be declared to prevent specific fields from being loaded.
    strict : bool, default True
        Throw an error if any `data` value does not exactly match the given or inferred
        data type for that column. If set to `False`, values that do not match the data
        type are cast to that data type or, if casting is not possible, set to null
        instead.
    orient : {'col', 'row'}, default None
        Whether to interpret two-dimensional data as columns or as rows. If None,
        the orientation is inferred by matching the columns and data dimensions. If
        this does not yield conclusive results, column orientation is used.
    infer_schema_length : int or None
        The maximum number of rows to scan for schema inference. If set to `None`, the
        full data may be scanned *(this can be slow)*. This parameter only applies if
        the input data is a sequence or generator of rows; other input is read as-is.
    nan_to_null : bool, default False
        If the data comes from one or more numpy arrays, can optionally convert input
        data np.nan values to null instead. This is a no-op for all other input data.

    Notes
    -----
    Initialising `LazyFrame(...)` directly is equivalent to `DataFrame(...).lazy()`.

    Examples
    --------
    Constructing a LazyFrame directly from a dictionary:

    >>> data = {"a": [1, 2], "b": [3, 4]}
    >>> lf = pl.LazyFrame(data)
    >>> lf.collect()
    shape: (2, 2)
    ┌─────┬─────┐
    │ a   ┆ b   │
    │ --- ┆ --- │
    │ i64 ┆ i64 │
    ╞═════╪═════╡
    │ 1   ┆ 3   │
    │ 2   ┆ 4   │
    └─────┴─────┘

    Notice that the dtypes are automatically inferred as Polars Int64:

    >>> lf.collect_schema().dtypes()
    [Int64, Int64]

    To specify a more detailed/specific frame schema you can supply the `schema`
    parameter with a dictionary of (name,dtype) pairs...

    >>> data = {"col1": [0, 2], "col2": [3, 7]}
    >>> lf2 = pl.LazyFrame(data, schema={"col1": pl.Float32, "col2": pl.Int64})
    >>> lf2.collect()
    shape: (2, 2)
    ┌──────┬──────┐
    │ col1 ┆ col2 │
    │ ---  ┆ ---  │
    │ f32  ┆ i64  │
    ╞══════╪══════╡
    │ 0.0  ┆ 3    │
    │ 2.0  ┆ 7    │
    └──────┴──────┘

    ...a sequence of (name,dtype) pairs...

    >>> data = {"col1": [1, 2], "col2": [3, 4]}
    >>> lf3 = pl.LazyFrame(data, schema=[("col1", pl.Float32), ("col2", pl.Int64)])
    >>> lf3.collect()
    shape: (2, 2)
    ┌──────┬──────┐
    │ col1 ┆ col2 │
    │ ---  ┆ ---  │
    │ f32  ┆ i64  │
    ╞══════╪══════╡
    │ 1.0  ┆ 3    │
    │ 2.0  ┆ 4    │
    └──────┴──────┘

    ...or a list of typed Series.

    >>> data = [
    ...     pl.Series("col1", [1, 2], dtype=pl.Float32),
    ...     pl.Series("col2", [3, 4], dtype=pl.Int64),
    ... ]
    >>> lf4 = pl.LazyFrame(data)
    >>> lf4.collect()
    shape: (2, 2)
    ┌──────┬──────┐
    │ col1 ┆ col2 │
    │ ---  ┆ ---  │
    │ f32  ┆ i64  │
    ╞══════╪══════╡
    │ 1.0  ┆ 3    │
    │ 2.0  ┆ 4    │
    └──────┴──────┘

    Constructing a LazyFrame from a numpy ndarray, specifying column names:

    >>> import numpy as np
    >>> data = np.array([(1, 2), (3, 4)], dtype=np.int64)
    >>> lf5 = pl.LazyFrame(data, schema=["a", "b"], orient="col")
    >>> lf5.collect()
    shape: (2, 2)
    ┌─────┬─────┐
    │ a   ┆ b   │
    │ --- ┆ --- │
    │ i64 ┆ i64 │
    ╞═════╪═════╡
    │ 1   ┆ 3   │
    │ 2   ┆ 4   │
    └─────┴─────┘

    Constructing a LazyFrame from a list of lists, row orientation specified:

    >>> data = [[1, 2, 3], [4, 5, 6]]
    >>> lf6 = pl.LazyFrame(data, schema=["a", "b", "c"], orient="row")
    >>> lf6.collect()
    shape: (2, 3)
    ┌─────┬─────┬─────┐
    │ a   ┆ b   ┆ c   │
    │ --- ┆ --- ┆ --- │
    │ i64 ┆ i64 ┆ i64 │
    ╞═════╪═════╪═════╡
    │ 1   ┆ 2   ┆ 3   │
    │ 4   ┆ 5   ┆ 6   │
    └─────┴─────┴─────┘
    ra   _ldfzClassVar[set[str]]
_accessorsNTF)schema_overridesstrictorientinfer_schema_lengthnan_to_nulldataFrameInitTypes | NoneschemaSchemaDefinition | Noner   SchemaDict | Noner   r   r   Orientation | Noner   
int | Noner   r   Nonec          	     n    ddl m}  ||||||||                                          j        | _        d S )Nr   )rl   )r   r   r   r   r   r   r   )polars.dataframerl   lazyr   )	selfr   r   r   r   r   r   r   rl   s	            r   __init__zLazyFrame.__init__  sZ     	/..... I!1$7'   TVV 				r   ldfc                >    |                      |           }||_        |S N)__new__r   )clsr   r   s      r   _from_pyldfzLazyFrame._from_pyldf  s    {{3	r   bytesc                *    |                                  S r   )	serializer   s    r   __getstate__zLazyFrame.__getstate__  s    ~~r   statec                ^    |                      t          |                    j        | _        d S r   )deserializer   r   )r   r   s     r   __setstate__zLazyFrame.__setstate__  s$    $$WU^^449			r   rV   validate_schema1pa.schema | SchemaDict | Callable[[], SchemaDict]scan_fnr   rV   r   c                  |                      |           }t          |t                    r=t          j        t          |                                          |||          |_        nht          rEt          |t          j
                  r+t          j        t          |          |||          |_        nt          j        |||          |_        |S )Nr   )r   )r   r   r   ra   #scan_from_python_function_pl_schemalistitemsr   rR   par^   &scan_from_python_function_arrow_schema)scan_from_python_function_schema_function)r   r   r   rV   r   r   s         r   _scan_python_functionzLazyFrame._scan_python_function  s     {{3fg&& 	#GV\\^^$$ /	  DII   	Jvry$A$A 	#JVgw  DII $M  DI r   binary)formatsourcestr | Path | IOBaser   r   c                  t          |t                    r4t          |                                                                          }n+t          |t
          t          f          rt          |          }|dk    rt          j	        }n'|dk    rt          j
        }nd|}t          |          |                      ||                    S )u  
        Read a logical plan from a file to construct a LazyFrame.

        Parameters
        ----------
        source
            Path to a file or a file-like object (by file-like object, we refer to
            objects that have a `read()` method, such as a file handler (e.g.
            via builtin `open` function) or `BytesIO`).
        format
            The format with which the LazyFrame was serialized. Options:

            - `"binary"`: Deserialize from binary format (bytes). This is the default.
            - `"json"`: Deserialize from JSON format (string).

        Warnings
        --------
        This function uses :mod:`pickle` if the logical plan contains Python UDFs,
        and as such inherits the security implications. Deserializing can execute
        arbitrary code, so it should only be attempted on trusted data.

        See Also
        --------
        LazyFrame.serialize

        Notes
        -----
        Serialization is not stable across Polars versions: a LazyFrame serialized
        in one Polars version may not be deserializable in another Polars version.

        Examples
        --------
        >>> import io
        >>> lf = pl.LazyFrame({"a": [1, 2, 3]}).sum()
        >>> bytes = lf.serialize()
        >>> pl.LazyFrame.deserialize(io.BytesIO(bytes)).collect()
        shape: (1, 1)
        ┌─────┐
        │ a   │
        │ --- │
        │ i64 │
        ╞═════╡
        │ 6   │
        └─────┘
        r   json0`format` must be one of {'binary', 'json'}, got )r   r   r   getvalueencoder   r   r1   ra   deserialize_binarydeserialize_jsonr   r   )r   r   r   deserializerr   s        r   r   zLazyFrame.deserialize  s    b fh'' 	0V__..557788FFd,, 	0'//FX&9LLv&7LLQvQQCS//!||F33444r   	list[str]c                z    t          dt                     |                                                                 S )ar  
        Get the column names.

        Returns
        -------
        list of str
            A list containing the name of each column in order.

        Warnings
        --------
        Determining the column names of a LazyFrame requires resolving its schema,
        which is a potentially expensive operation.
        Using :meth:`collect_schema` is the idiomatic way of resolving the schema.
        This property exists only for symmetry with the DataFrame class.

        See Also
        --------
        collect_schema
        Schema.names

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [6, 7, 8],
        ...         "ham": ["a", "b", "c"],
        ...     }
        ... ).select("foo", "bar")
        >>> lf.columns  # doctest: +SKIP
        ['foo', 'bar']
        zDetermining the column names of a LazyFrame requires resolving its schema, which is a potentially expensive operation. Use `LazyFrame.collect_schema().names()` to get the column names without this warning.r   )r0   rW   collect_schemanamesr   s    r   columnszLazyFrame.columns	  sF    D 	= (		
 	
 	
 	
 ""$$**,,,r   list[DataType]c                z    t          dt                     |                                                                 S )ax  
        Get the column data types.

        Returns
        -------
        list of DataType
            A list containing the data type of each column in order.

        Warnings
        --------
        Determining the data types of a LazyFrame requires resolving its schema,
        which is a potentially expensive operation.
        Using :meth:`collect_schema` is the idiomatic way to resolve the schema.
        This property exists only for symmetry with the DataFrame class.

        See Also
        --------
        collect_schema
        Schema.dtypes

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [6.0, 7.0, 8.0],
        ...         "ham": ["a", "b", "c"],
        ...     }
        ... )
        >>> lf.dtypes  # doctest: +SKIP
        [Int64, Float64, String]
        zDetermining the data types of a LazyFrame requires resolving its schema, which is a potentially expensive operation. Use `LazyFrame.collect_schema().dtypes()` to get the data types without this warning.r   )r0   rW   r   dtypesr   s    r   r  zLazyFrame.dtypes3  sF    D 	; (		
 	
 	
 	
 ""$$++---r   r^   c                V    t          dt                     |                                 S )a  
        Get an ordered mapping of column names to their data type.

        Warnings
        --------
        Resolving the schema of a LazyFrame is a potentially expensive operation.
        Using :meth:`collect_schema` is the idiomatic way to resolve the schema.
        This property exists only for symmetry with the DataFrame class.

        See Also
        --------
        collect_schema
        Schema

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [6.0, 7.0, 8.0],
        ...         "ham": ["a", "b", "c"],
        ...     }
        ... )
        >>> lf.schema  # doctest: +SKIP
        Schema({'foo': Int64, 'bar': Float64, 'ham': String})
        zResolving the schema of a LazyFrame is a potentially expensive operation. Use `LazyFrame.collect_schema()` to get the schema without this warning.r   )r0   rW   r   r   s    r   r   zLazyFrame.schema]  s8    8 	X'	
 	
 	
 	

 ""$$$r   intc                z    t          dt                     |                                                                 S )a  
        Get the number of columns.

        Returns
        -------
        int

        Warnings
        --------
        Determining the width of a LazyFrame requires resolving its schema,
        which is a potentially expensive operation.
        Using :meth:`collect_schema` is the idiomatic way to resolve the schema.
        This property exists only for symmetry with the DataFrame class.

        See Also
        --------
        collect_schema
        Schema.len

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [4, 5, 6],
        ...     }
        ... )
        >>> lf.width  # doctest: +SKIP
        2
        zdetermining the width of a LazyFrame requires resolving its schema, which is a potentially expensive operation. Use `LazyFrame.collect_schema().len()` to get the width without this warning.r   )r0   rW   r   lenr   s    r   widthzLazyFrame.width  sF    @ 	6 (		
 	
 	
 	
 ""$$((***r   r   c                $    d}t          |          )Nztthe truth value of a LazyFrame is ambiguous

LazyFrames cannot be used in boolean context with and/or/not operators.r   )r   r   s     r   __bool__zLazyFrame.__bool__  s    Z 	 nnr   operatorr   c                ,    d|d}t          |          )N"z0" comparison not supported for LazyFrame objectsr  )r   r  r   s      r   _comparison_errorzLazyFrame._comparison_error  s    N(NNNnnr   otherobjectc                0    |                      d           d S )Nz==r  r   r  s     r   __eq__zLazyFrame.__eq__      t$$$$$r   c                0    |                      d           d S )Nz!=r  r  s     r   __ne__zLazyFrame.__ne__  r  r   c                0    |                      d           d S )N>r  r  s     r   __gt__zLazyFrame.__gt__      s#####r   c                0    |                      d           d S )N<r  r  s     r   __lt__zLazyFrame.__lt__  r  r   c                0    |                      d           d S )Nz>=r  r  s     r   __ge__zLazyFrame.__ge__  r  r   c                0    |                      d           d S )Nz<=r  r  s     r   __le__zLazyFrame.__le__  r  r   keyc                .    ||                                  v S r   )r   )r   r&  s     r   __contains__zLazyFrame.__contains__  s    d))++++r   c                *    |                                  S r   cloner   s    r   __copy__zLazyFrame.__copy__      zz||r   memoc                *    |                                  S r   r*  )r   r.  s     r   __deepcopy__zLazyFrame.__deepcopy__  r-  r   itemint | range | slicec                    t          |t                    sd}t          |          t          |                               |          S )NzZLazyFrame is not subscriptable (aside from slicing)

Use `select()` or `filter()` instead.)r   slicer   r'   apply)r   r1  r   s      r   __getitem__zLazyFrame.__getitem__  sH    $&& 	!<  C.. t$$**4000r   c                4    d|                      d           S )NzOnaive plan: (run LazyFrame.explain(optimized=True) to see the optimized plan)

F	optimized)explainr   s    r   __str__zLazyFrame.__str__  s)       	r   c                D    d| j         j         dt          |           ddS )Nr   z at 0xXr  )	__class____name__idr   s    r   __repr__zLazyFrame.__repr__  s)    ?4>*??"T((?????r   c                >   	 | j                             d          }t          j        g d|                                           }d|                                 S # t          $ r3 |                     d                              dd          }d| d	cY S w xY w)
NFr8  )dotz-Nshape=boxz-Tsvg)inputz^<h4>NAIVE QUERY PLAN</h4><p>run <b>LazyFrame.show_graph()</b> to see the optimized version</p>
z<p></p>zq<i>naive plan: (run <b>LazyFrame.explain(optimized=True)</b> to see the optimized plan)</i>
    <p></p>
    <div>z</div>)	r   to_dotrT   check_outputr   decode	Exceptionr:  replace)r   rC  svginserts       r   _repr_html_zLazyFrame._repr_html_  s    	)""U"33C)///#x7H7H  C<-0ZZ\\< <  	 	 	\\E\22::4KKF      	s   AA :BB.fileLiteral['binary']c                   d S r    r   rN  r   s      r   r   zLazyFrame.serialize  s	     r   Literal['json']c                   d S r   rQ  rR  s      r   r   zLazyFrame.serialize  s    NQcr   IOBase | str | Pathc                   d S r   rQ  rR  s      r   r   zLazyFrame.serialize  s	     sr   IOBase | str | Path | Nonebytes | str | Nonec                   |dk    r| j         j        }nK|dk    r1d}t          j        |t	                                 | j         j        }nd|}t          |          t          |||          S )u(  
        Serialize the logical plan of this LazyFrame to a file or string in JSON format.

        Parameters
        ----------
        file
            File path to which the result should be written. If set to `None`
            (default), the output is returned as a string instead.
        format
            The format in which to serialize. Options:

            - `"binary"`: Serialize to binary format (bytes). This is the default.
            - `"json"`: Serialize to JSON format (string) (deprecated).

        See Also
        --------
        LazyFrame.deserialize

        Notes
        -----
        Serialization is not stable across Polars versions: a LazyFrame serialized
        in one Polars version may not be deserializable in another Polars version.

        Examples
        --------
        Serialize the logical plan into a binary representation.

        >>> lf = pl.LazyFrame({"a": [1, 2, 3]}).sum()
        >>> bytes = lf.serialize()

        The bytes can later be deserialized back into a LazyFrame.

        >>> import io
        >>> pl.LazyFrame.deserialize(io.BytesIO(bytes)).collect()
        shape: (1, 1)
        ┌─────┐
        │ a   │
        │ --- │
        │ i64 │
        ╞═════╡
        │ 6   │
        └─────┘
        r   r   z6'json' serialization format of LazyFrame is deprecated)
stacklevelr   )r   serialize_binarywarningswarnr-   serialize_jsonr   r&   )r   rN  r   
serializerr   s        r   r   zLazyFrame.serialize  s    b X3JJvJCM*,,    1JJQvQQCS//!&z4@@@r   function&Callable[Concatenate[LazyFrame, P], T]argsP.argskwargsP.kwargsr   c                     || g|R i |S )u  
        Offers a structured way to apply a sequence of user-defined functions (UDFs).

        Parameters
        ----------
        function
            Callable; will receive the frame as the first parameter,
            followed by any given args/kwargs.
        *args
            Arguments to pass to the UDF.
        **kwargs
            Keyword arguments to pass to the UDF.

        Examples
        --------
        >>> def cast_str_to_int(lf: pl.LazyFrame, col_name: str) -> pl.LazyFrame:
        ...     return lf.with_columns(pl.col(col_name).cast(pl.Int64))
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": ["10", "20", "30", "40"],
        ...     }
        ... )
        >>> lf.pipe(cast_str_to_int, col_name="b").collect()
        shape: (4, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 10  │
        │ 2   ┆ 20  │
        │ 3   ┆ 30  │
        │ 4   ┆ 40  │
        └─────┴─────┘

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "b": [1, 2],
        ...         "a": [3, 4],
        ...     }
        ... )
        >>> lf.collect()
        shape: (2, 2)
        ┌─────┬─────┐
        │ b   ┆ a   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 3   │
        │ 2   ┆ 4   │
        └─────┴─────┘
        >>> lf.pipe(lambda lf: lf.select(sorted(lf.collect_schema()))).collect()
        shape: (2, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 3   ┆ 1   │
        │ 4   ┆ 2   │
        └─────┴─────┘
        rQ  )r   r`  rb  rd  s       r   pipezLazyFrame.pipeB  s%    J x.t...v...r   g      ?g      ?g      ?nearest)interpolationpercentilesSequence[float] | float | Nonerj  r   rl   c          	     \	   ddl m} |                                 }|sd}t          |          g d}t	          |          x}r|                    d |D                        |                    d           t          dd            }t                      t                      c}	g }
t          j
        d          }|                                D ]\  }|                                }| o|                                }t          j                                                  j                            d          t          j                                                  j                            d          g}|s|s|t&          k    r&t          j                                                  n|}|r&t          j                                                  n|} ||          s&t          j                                                  n|} ||          s&t          j                                                  n|}g }|D ]}|s|r|rMt          j                                                                      ||                              |          n't          j                                      ||          }|	                               n|}|                    |                    | d                      |s$|                                s|t<          t&          fv r                               |
                    g ||                    d           |                    d           |                    d           ||                    d                       |	r|                     d |	D                       n| j         |
 !                                tE          |          fdtG          |"                                          D             }tI          tK          ||                    }|D ]fd|         D             |<    ||          }|&                    dtO          j(        d|                     |S )uh  
        Creates a summary of statistics for a LazyFrame, returning a DataFrame.

        Parameters
        ----------
        percentiles
            One or more percentiles to include in the summary statistics.
            All values must be in the range `[0, 1]`.

        interpolation : {'nearest', 'higher', 'lower', 'midpoint', 'linear', 'equiprobable'}
            Interpolation method used when calculating percentiles.

        Returns
        -------
        DataFrame

        Notes
        -----
        The median is included by default as the 50% percentile.

        Warnings
        --------
        * This method does *not* maintain the laziness of the frame, and will `collect`
          the final result. This could potentially be an expensive operation.
        * We do not guarantee the output of `describe` to be stable. It will show
          statistics that we deem informative, and may be updated in the future.
          Using `describe` programmatically (versus interactive exploration) is
          not recommended for this reason.

        Examples
        --------
        >>> from datetime import date, time
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "float": [1.0, 2.8, 3.0],
        ...         "int": [40, 50, None],
        ...         "bool": [True, False, True],
        ...         "str": ["zz", "xx", "yy"],
        ...         "date": [date(2020, 1, 1), date(2021, 7, 5), date(2022, 12, 31)],
        ...         "time": [time(10, 20, 30), time(14, 45, 50), time(23, 15, 10)],
        ...     }
        ... )

        Show default frame statistics:

        >>> lf.describe()
        shape: (9, 7)
        ┌────────────┬──────────┬──────────┬──────────┬──────┬─────────────────────┬──────────┐
        │ statistic  ┆ float    ┆ int      ┆ bool     ┆ str  ┆ date                ┆ time     │
        │ ---        ┆ ---      ┆ ---      ┆ ---      ┆ ---  ┆ ---                 ┆ ---      │
        │ str        ┆ f64      ┆ f64      ┆ f64      ┆ str  ┆ str                 ┆ str      │
        ╞════════════╪══════════╪══════════╪══════════╪══════╪═════════════════════╪══════════╡
        │ count      ┆ 3.0      ┆ 2.0      ┆ 3.0      ┆ 3    ┆ 3                   ┆ 3        │
        │ null_count ┆ 0.0      ┆ 1.0      ┆ 0.0      ┆ 0    ┆ 0                   ┆ 0        │
        │ mean       ┆ 2.266667 ┆ 45.0     ┆ 0.666667 ┆ null ┆ 2021-07-02 16:00:00 ┆ 16:07:10 │
        │ std        ┆ 1.101514 ┆ 7.071068 ┆ null     ┆ null ┆ null                ┆ null     │
        │ min        ┆ 1.0      ┆ 40.0     ┆ 0.0      ┆ xx   ┆ 2020-01-01          ┆ 10:20:30 │
        │ 25%        ┆ 2.8      ┆ 40.0     ┆ null     ┆ null ┆ 2021-07-05          ┆ 14:45:50 │
        │ 50%        ┆ 2.8      ┆ 50.0     ┆ null     ┆ null ┆ 2021-07-05          ┆ 14:45:50 │
        │ 75%        ┆ 3.0      ┆ 50.0     ┆ null     ┆ null ┆ 2022-12-31          ┆ 23:15:10 │
        │ max        ┆ 3.0      ┆ 50.0     ┆ 1.0      ┆ zz   ┆ 2022-12-31          ┆ 23:15:10 │
        └────────────┴──────────┴──────────┴──────────┴──────┴─────────────────────┴──────────┘

        Customize which percentiles are displayed, applying linear interpolation:

        >>> with pl.Config(tbl_rows=12):
        ...     lf.describe(
        ...         percentiles=[0.1, 0.3, 0.5, 0.7, 0.9],
        ...         interpolation="linear",
        ...     )
        shape: (11, 7)
        ┌────────────┬──────────┬──────────┬──────────┬──────┬─────────────────────┬──────────┐
        │ statistic  ┆ float    ┆ int      ┆ bool     ┆ str  ┆ date                ┆ time     │
        │ ---        ┆ ---      ┆ ---      ┆ ---      ┆ ---  ┆ ---                 ┆ ---      │
        │ str        ┆ f64      ┆ f64      ┆ f64      ┆ str  ┆ str                 ┆ str      │
        ╞════════════╪══════════╪══════════╪══════════╪══════╪═════════════════════╪══════════╡
        │ count      ┆ 3.0      ┆ 2.0      ┆ 3.0      ┆ 3    ┆ 3                   ┆ 3        │
        │ null_count ┆ 0.0      ┆ 1.0      ┆ 0.0      ┆ 0    ┆ 0                   ┆ 0        │
        │ mean       ┆ 2.266667 ┆ 45.0     ┆ 0.666667 ┆ null ┆ 2021-07-02 16:00:00 ┆ 16:07:10 │
        │ std        ┆ 1.101514 ┆ 7.071068 ┆ null     ┆ null ┆ null                ┆ null     │
        │ min        ┆ 1.0      ┆ 40.0     ┆ 0.0      ┆ xx   ┆ 2020-01-01          ┆ 10:20:30 │
        │ 10%        ┆ 1.36     ┆ 41.0     ┆ null     ┆ null ┆ 2020-04-20          ┆ 11:13:34 │
        │ 30%        ┆ 2.08     ┆ 43.0     ┆ null     ┆ null ┆ 2020-11-26          ┆ 12:59:42 │
        │ 50%        ┆ 2.8      ┆ 45.0     ┆ null     ┆ null ┆ 2021-07-05          ┆ 14:45:50 │
        │ 70%        ┆ 2.88     ┆ 47.0     ┆ null     ┆ null ┆ 2022-02-07          ┆ 18:09:34 │
        │ 90%        ┆ 2.96     ┆ 49.0     ┆ null     ┆ null ┆ 2022-09-13          ┆ 21:33:18 │
        │ max        ┆ 3.0      ┆ 50.0     ┆ 1.0      ┆ zz   ┆ 2022-12-31          ┆ 23:15:10 │
        └────────────┴──────────┴──────────┴──────────┴──────┴─────────────────────┴──────────┘
        r   )	from_dictz/cannot describe a LazyFrame that has no columns)count
null_countmeanstdminc              3  (   K   | ]}|d z  ddV  dS )d   g%NrQ  ).0qs     r   	<genexpr>z%LazyFrame.describe.<locals>.<genexpr>  s.      >>qa#g????>>>>>>r   maxdtr   r   r   c                n    |                                  p!| t          t          t          t          t
          fv S r   )	is_nestedr:   r>   rF   rG   rN   )r|  s    r   skip_minmaxz'LazyFrame.describe.<locals>.skip_minmax  s%    <<>>URKtVW+U%UUr   Nzcount:znull_count::zmean:zstd:zmin:zmax:c              3  b   K   | ]*}t          j        |                                          V  +d S r   )Fcolsort)rx  cs     r   rz  z%LazyFrame.describe.<locals>.<genexpr>7  s2      !E!Ea!%((--//!E!E!E!E!E!Er   c                \    g | ](}                     d           |z  |dz   z           )S )r      )row)rx  n
df_metrics	n_metricss     r   
<listcomp>z&LazyFrame.describe.<locals>.<listcomp>A  sL     
 
 
 NN1q9}Q)0CCD
 
 
r   c                    g | ]=}|t          |t                    rd n!v rt          |          nt          |          >S r   )r   dictfloatr   )rx  vr  has_numeric_results     r   r  z&LazyFrame.describe.<locals>.<listcomp>I  s`         	Z4%8%8	 D'(,>'>'>%(((SVV	  r   	statistic)r|  r   r   r   ))polars.convertrn  r   r   r2   extendappendr
   setr  litr   
is_numericis_temporalr  ro  nameprefixrp  r9   rq  rr  rs  r{  to_physicalquantilecastaddaliasr~  rF   with_columnsselectcollectr	  ranger  zipinsert_columnplSeries)r   rk  rj  rn  r   r   metrics	quantilesr  	sort_colsmetric_exprsnulldtyper  r  count_exprs	mean_exprexpr_stdmin_exprmax_expr	pct_exprsppct_exprcolumn_metricssummary
df_summaryr  r  r  r  s                             @@@@r   describezLazyFrame.describe  s   ~ 	-,,,,,$$&& 	!CCC..  @??)+6669 	?NN>>I>>>>>>u		V 	V 	V 
	V
 ),suu%I#%uT{{ 0	 0	HAu))++J(.@U->->-@-@K a  %,,X66a##%%*11-@@K ",050@0@ a  *4=quQxx||~~~H-8[-?-?IquQxx||~~~TH-8[-?-?IquQxx||~~~TH I 
= 
= $ $ 'Aa,,..77=IINNuUUUU1XX..q-@@ 
 MM!$$$$#H  1

q

!;!;<<<< *U__.. *%D'?2J2J"&&q)))  OOKAKK00 NN:!::.. NN:!::..	
  NN:!::..	 	 	 	 !!!E!E9!E!E!EEEE\# WYY 	 LL	
 
 
 
 
6::<<((
 
 
 s6>2233  	 	A     !  GAJJ Yw''
  BIk7$C$CDDDr   plainr   )r   r9  type_coercionpredicate_pushdownprojection_pushdownsimplify_expressionslice_pushdowncomm_subplan_elimcomm_subexpr_elimcluster_with_columnscollapse_joinsr   r   tree_formatoptimizationsrt   r9  r  r  r  r  r  r  r  r  r  r   r   rs   r  bool | Noner  ri   c                  |t          dd           |rd}t          |          }|dv rt          d           |r|                                }|dk    |j        _        |d	k    |j        _        | j                            |j                  }|dk    r|	                                S |
                                S |dk    r| j                                        S | j                                        S )
a  
        Create a string representation of the query plan.

        Different optimizations can be turned on or off.

        Parameters
        ----------
        format : {'plain', 'tree'}
            The format to use for displaying the logical plan.
        optimized
            Return an optimized query plan. Defaults to `True`.
            If this is set to `True` the subsequent
            optimization flags control which optimizations
            run.
        type_coercion
            Do type coercion optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        predicate_pushdown
            Do predicate pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        projection_pushdown
            Do projection pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        simplify_expression
            Run simplify expressions optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        slice_pushdown
            Slice pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        comm_subplan_elim
            Will try to cache branching subplans that occur on self-joins or unions.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        comm_subexpr_elim
            Common subexpressions will be cached and reused.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        cluster_with_columns
            Combine sequential independent calls to with_columns

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        collapse_joins
            Collapse a join and filters into a faster join

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        engine
            Select the engine used to process the query, optional.
            At the moment, if set to `"auto"` (default), the query
            is run using the polars in-memory engine. Polars will also
            attempt to use the engine set by the `POLARS_ENGINE_AFFINITY`
            environment variable. If it cannot run the query using the
            selected engine, the query is run using the polars in-memory
            engine. If set to `"gpu"`, the GPU engine is used. Fine-grained
            control over the GPU engine, for example which device to use
            on a system with multiple devices, is possible by providing a
            :class:`~.GPUEngine` object with configuration options.

            .. note::
               GPU mode is considered **unstable**. Not all queries will run
               successfully on the GPU, however, they should fall back transparently
               to the default engine if execution is not supported.

               Running with `POLARS_VERBOSE=1` will provide information if a query
               falls back (and why).

            .. note::
               The GPU engine does not support streaming, if streaming
               is enabled then GPU execution is switched off.
        optimizations
            The optimization passes done during query optimization.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        tree_format
            Format the output as a tree.

            .. deprecated:: 0.20.30
                Use `format="tree"` instead.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["a", "b", "a", "b", "b", "c"],
        ...         "b": [1, 2, 3, 4, 5, 6],
        ...         "c": [6, 5, 4, 3, 2, 1],
        ...     }
        ... )
        >>> lf.group_by("a", maintain_order=True).agg(pl.all().sum()).sort(
        ...     "a"
        ... ).explain()  # doctest: +SKIP
        Nzethe `tree_format` parameter for `LazyFrame.explain` is deprecated Use the `format` parameter instead.z0.20.30versiontreer   r   &streaming mode is considered unstable.r   r   )r"   r   r(   r,  _pyoptflagsr   old_streamingr   with_optimizationsdescribe_optimized_plan_treedescribe_optimized_plandescribe_plan_treedescribe_plan)r   r   r9  r  r  r  r  r  r  r  r  r  r   r   r  r  r   s                    r   r:  zLazyFrame.explainW  s   @ "%7!   
   ''333"#KLLL 		5)2244M28K2GM%/6<6OM%3)..}/HIIC7799922444V9//1119**,,,r   )g      0@g      (@ir)r9  showoutput_path
raw_outputfigsizer  _type_checkr  r  r  r  r  r  r  r  r   
plan_stage_check_orderr  r  r  str | Path | Noner  r  tuple[float, float]r  r  r   r  
str | Nonec                  t          |          }|dv rt          d           |                                }|dk    |j        _        |dk    |j        _        | j                            |j                  }|dk    r|                    |          }nM|dk    r2|dk    r|	                    |          }n+|                    |          }nd| d}t          |          t          |||||	          S )
a  
        Show a plot of the query plan.

        Note that Graphviz must be installed to render the visualization (if not
        already present, you can download it here: `<https://graphviz.org/download>`_).

        Parameters
        ----------
        optimized
            Optimize the query plan.
        show
            Show the figure.
        output_path
            Write the figure to disk.
        raw_output
            Return dot syntax. This cannot be combined with `show` and/or `output_path`.
        figsize
            Passed to matplotlib if `show == True`.
        type_coercion
            Do type coercion optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        predicate_pushdown
            Do predicate pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        projection_pushdown
            Do projection pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        simplify_expression
            Run simplify expressions optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        slice_pushdown
            Slice pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        comm_subplan_elim
            Will try to cache branching subplans that occur on self-joins or unions.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        comm_subexpr_elim
            Common subexpressions will be cached and reused.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        cluster_with_columns
            Combine sequential independent calls to with_columns.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        collapse_joins
            Collapse a join and filters into a faster join.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        engine
            Select the engine used to process the query, optional.
            At the moment, if set to `"auto"` (default), the query
            is run using the polars in-memory engine. Polars will also
            attempt to use the engine set by the `POLARS_ENGINE_AFFINITY`
            environment variable. If it cannot run the query using the
            selected engine, the query is run using the polars in-memory
            engine. If set to `"gpu"`, the GPU engine is used. Fine-grained
            control over the GPU engine, for example which device to use
            on a system with multiple devices, is possible by providing a
            :class:`~.GPUEngine` object with configuration options.

            .. note::
               GPU mode is considered **unstable**. Not all queries will run
               successfully on the GPU, however, they should fall back transparently
               to the default engine if execution is not supported.

               Running with `POLARS_VERBOSE=1` will provide information if a query
               falls back (and why).

            .. note::
               The GPU engine does not support streaming, if streaming
               is enabled then GPU execution is switched off.
        plan_stage : {'ir', 'physical'}
            Select the stage to display. Currently only the streaming engine has a
            separate physical stage, for the other engines both IR and physical are the
            same.


        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["a", "b", "a", "b", "b", "c"],
        ...         "b": [1, 2, 3, 4, 5, 6],
        ...         "c": [6, 5, 4, 3, 2, 1],
        ...     }
        ... )
        >>> lf.group_by("a", maintain_order=True).agg(pl.all().sum()).sort(
        ...     "a"
        ... ).show_graph()  # doctest: +SKIP
        r  r  r   r   r  physicalzinvalid plan stage '')rC  r  r  r  r  )r   r(   r,  r  r  r   r   r  rF  to_dot_streaming_physr   r+   )r   r9  r  r  r  r  r  r  r  r  r  r  r  r  r  r  r   r  r  r  r   rC  	error_msgs                          r   
show_graphzLazyFrame.show_graph  s   D  ''333"#KLLL%..0028O2K!/.4.C!+y++M,EFF++i((CC:%%$$00;;kk),,<z<<<II&&& #!
 
 
 	
r   {}fmtc                @    dfd}|                      |dd          S )a
  
        Inspect a node in the computation graph.

        Print the value that this node in the computation graph evaluates to and pass on
        the value.

        Examples
        --------
        >>> lf = pl.LazyFrame({"foo": [1, 1, -2, 3]})
        >>> (
        ...     lf.with_columns(pl.col("foo").cum_sum().alias("bar"))
        ...     .inspect()  # print the node before the filter
        ...     .filter(pl.col("bar") == pl.col("foo"))
        ... )  # doctest: +ELLIPSIS
        <LazyFrame at ...>
        srl   r   c                L    t                              |                      | S r   )printr   )r  r  s    r   inspectz"LazyFrame.inspect.<locals>.inspect  s     #**Q--   Hr   T)r  r  )r  rl   r   rl   )map_batches)r   r  r  s    ` r   r  zLazyFrame.inspect  sG    $	 	 	 	 	 	 $   
 
 	
r   )
descending
nulls_lastmaintain_ordermultithreadedbyIntoExpr | Iterable[IntoExpr]more_byrw   r  bool | Sequence[bool]r  r  r  c          	        t          |t                    r]|s[t          |t                    rFt          |t                    r1|                     | j                            |||||                    S t          |g|R  }t          |t          |          dd          }t          |t          |          dd          }|                     | j        	                    |||||                    S )u  
        Sort the LazyFrame by the given columns.

        Parameters
        ----------
        by
            Column(s) to sort by. Accepts expression input, including selectors. Strings
            are parsed as column names.
        *more_by
            Additional columns to sort by, specified as positional arguments.
        descending
            Sort in descending order. When sorting by multiple columns, can be specified
            per column by passing a sequence of booleans.
        nulls_last
            Place null values last; can specify a single boolean applying to all columns
            or a sequence of booleans for per-column control.
        maintain_order
            Whether the order should be maintained if elements are equal.
            Note that if `true` streaming is not possible and performance might be
            worse since this requires a stable search.
        multithreaded
            Sort using multiple threads.

        Examples
        --------
        Pass a single column name to sort by that column.

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, None],
        ...         "b": [6.0, 5.0, 4.0],
        ...         "c": ["a", "c", "b"],
        ...     }
        ... )
        >>> lf.sort("a").collect()
        shape: (3, 3)
        ┌──────┬─────┬─────┐
        │ a    ┆ b   ┆ c   │
        │ ---  ┆ --- ┆ --- │
        │ i64  ┆ f64 ┆ str │
        ╞══════╪═════╪═════╡
        │ null ┆ 4.0 ┆ b   │
        │ 1    ┆ 6.0 ┆ a   │
        │ 2    ┆ 5.0 ┆ c   │
        └──────┴─────┴─────┘

        Sorting by expressions is also supported.

        >>> lf.sort(pl.col("a") + pl.col("b") * 2, nulls_last=True).collect()
        shape: (3, 3)
        ┌──────┬─────┬─────┐
        │ a    ┆ b   ┆ c   │
        │ ---  ┆ --- ┆ --- │
        │ i64  ┆ f64 ┆ str │
        ╞══════╪═════╪═════╡
        │ 2    ┆ 5.0 ┆ c   │
        │ 1    ┆ 6.0 ┆ a   │
        │ null ┆ 4.0 ┆ b   │
        └──────┴─────┴─────┘

        Sort by multiple columns by passing a list of columns.

        >>> lf.sort(["c", "a"], descending=True).collect()
        shape: (3, 3)
        ┌──────┬─────┬─────┐
        │ a    ┆ b   ┆ c   │
        │ ---  ┆ --- ┆ --- │
        │ i64  ┆ f64 ┆ str │
        ╞══════╪═════╪═════╡
        │ 2    ┆ 5.0 ┆ c   │
        │ null ┆ 4.0 ┆ b   │
        │ 1    ┆ 6.0 ┆ a   │
        └──────┴─────┴─────┘

        Or use positional arguments to sort by multiple columns in the same way.

        >>> lf.sort("c", "a", descending=[False, True]).collect()
        shape: (3, 3)
        ┌──────┬─────┬─────┐
        │ a    ┆ b   ┆ c   │
        │ ---  ┆ --- ┆ --- │
        │ i64  ┆ f64 ┆ str │
        ╞══════╪═════╪═════╡
        │ 1    ┆ 6.0 ┆ a   │
        │ null ┆ 4.0 ┆ b   │
        │ 2    ┆ 5.0 ┆ c   │
        └──────┴─────┴─────┘
        r  r  r  )
r   r   r   r   r   r  r%   r,   r	  sort_by_exprs)r   r  r  r  r  r  r  s          r   r  zLazyFrame.sort  s    F r3
	
	 :t,,
	 :t,,	
	 ##	
J    ,B9999 SWWlDII
 SWWlDII
I##J
NM 
 
 	
r   r   )
table_namequeryr  c                   ddl m} t          d            |dd          5 }|r|nd}|                    ||            |                    |          cddd           S # 1 swxY w Y   dS )	u  
        Execute a SQL query against the LazyFrame.

        .. versionadded:: 0.20.23

        .. warning::
            This functionality is considered **unstable**, although it is close to
            being considered stable. It may be changed at any point without it being
            considered a breaking change.

        Parameters
        ----------
        query
            SQL query to execute.
        table_name
            Optionally provide an explicit name for the table that represents the
            calling frame (defaults to "self").

        Notes
        -----
        * The calling frame is automatically registered as a table in the SQL context
          under the name "self". If you want access to the DataFrames and LazyFrames
          found in the current globals, use the top-level :meth:`pl.sql <polars.sql>`.
        * More control over registration and execution behaviour is available by
          using the :class:`SQLContext` object.

        See Also
        --------
        SQLContext

        Examples
        --------
        >>> lf1 = pl.LazyFrame({"a": [1, 2, 3], "b": [6, 7, 8], "c": ["z", "y", "x"]})
        >>> lf2 = pl.LazyFrame({"a": [3, 2, 1], "d": [125, -654, 888]})

        Query the LazyFrame using SQL:

        >>> lf1.sql("SELECT c, b FROM self WHERE a > 1").collect()
        shape: (2, 2)
        ┌─────┬─────┐
        │ c   ┆ b   │
        │ --- ┆ --- │
        │ str ┆ i64 │
        ╞═════╪═════╡
        │ y   ┆ 7   │
        │ x   ┆ 8   │
        └─────┴─────┘

        Apply SQL transforms (aliasing "self" to "frame") then filter
        natively (you can freely mix SQL and native operations):

        >>> lf1.sql(
        ...     query='''
        ...         SELECT
        ...             a,
        ...             (a % 2 == 0) AS a_is_even,
        ...             (b::float4 / 2) AS "b/2",
        ...             CONCAT_WS(':', c, c, c) AS c_c_c
        ...         FROM frame
        ...         ORDER BY a
        ...     ''',
        ...     table_name="frame",
        ... ).filter(~pl.col("c_c_c").str.starts_with("x")).collect()
        shape: (2, 4)
        ┌─────┬───────────┬─────┬───────┐
        │ a   ┆ a_is_even ┆ b/2 ┆ c_c_c │
        │ --- ┆ ---       ┆ --- ┆ ---   │
        │ i64 ┆ bool      ┆ f32 ┆ str   │
        ╞═════╪═══════════╪═════╪═══════╡
        │ 1   ┆ false     ┆ 3.0 ┆ z:z:z │
        │ 2   ┆ true      ┆ 3.5 ┆ y:y:y │
        └─────┴───────────┴─────┴───────┘
        r   )
SQLContextzS`sql` is considered **unstable** (although it is close to being considered stable).F)register_globalseagerr   )r  frameN)
polars.sqlr  r(   registerexecute)r   r  r  r  ctxr  s         r   sqlzLazyFrame.sql&  s    T 	*)))))a	
 	
 	
 Ze<<< 	&!+7::DLLd$L///;;u%%	& 	& 	& 	& 	& 	& 	& 	& 	& 	& 	& 	& 	& 	& 	& 	& 	& 	&s   2A""A&)A&reversez1.0.0r  )r  kc                   t          |          }t          |t          |          dd          }|                     | j                            |||                    S )u'  
        Return the `k` largest rows.

        Non-null elements are always preferred over null elements, regardless of
        the value of `reverse`. The output is not guaranteed to be in any
        particular order, call :func:`sort` after this function if you wish the
        output to be sorted.

        .. versionchanged:: 1.0.0
            The `descending` parameter was renamed `reverse`.

        Parameters
        ----------
        k
            Number of rows to return.
        by
            Column(s) used to determine the top rows.
            Accepts expression input. Strings are parsed as column names.
        reverse
            Consider the `k` smallest elements of the `by` column(s) (instead of the `k`
            largest). This can be specified per column by passing a sequence of
            booleans.

        See Also
        --------
        bottom_k

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["a", "b", "a", "b", "b", "c"],
        ...         "b": [2, 1, 1, 3, 2, 1],
        ...     }
        ... )

        Get the rows which contain the 4 largest values in column b.

        >>> lf.top_k(4, by="b").collect()
        shape: (4, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ str ┆ i64 │
        ╞═════╪═════╡
        │ b   ┆ 3   │
        │ a   ┆ 2   │
        │ b   ┆ 2   │
        │ b   ┆ 1   │
        └─────┴─────┘

        Get the rows which contain the 4 largest values when sorting on column b and a.

        >>> lf.top_k(4, by=["b", "a"]).collect()
        shape: (4, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ str ┆ i64 │
        ╞═════╪═════╡
        │ b   ┆ 3   │
        │ b   ┆ 2   │
        │ a   ┆ 2   │
        │ c   ┆ 1   │
        └─────┴─────┘
        r  r  r  r  )r%   r,   r	  r   r   top_kr   r  r  r  s       r   r  zLazyFrame.top_kz  sS    T ,B//gs2ww	4@@	b' J JKKKr   c                   t          |          }t          |t          |          dd          }|                     | j                            |||                    S )u0  
        Return the `k` smallest rows.

        Non-null elements are always preferred over null elements, regardless of
        the value of `reverse`. The output is not guaranteed to be in any
        particular order, call :func:`sort` after this function if you wish the
        output to be sorted.

        .. versionchanged:: 1.0.0
            The `descending` parameter was renamed `reverse`.

        Parameters
        ----------
        k
            Number of rows to return.
        by
            Column(s) used to determine the bottom rows.
            Accepts expression input. Strings are parsed as column names.
        reverse
            Consider the `k` largest elements of the `by` column(s) (instead of the `k`
            smallest). This can be specified per column by passing a sequence of
            booleans.

        See Also
        --------
        top_k

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["a", "b", "a", "b", "b", "c"],
        ...         "b": [2, 1, 1, 3, 2, 1],
        ...     }
        ... )

        Get the rows which contain the 4 smallest values in column b.

        >>> lf.bottom_k(4, by="b").collect()
        shape: (4, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ str ┆ i64 │
        ╞═════╪═════╡
        │ b   ┆ 1   │
        │ a   ┆ 1   │
        │ c   ┆ 1   │
        │ a   ┆ 2   │
        └─────┴─────┘

        Get the rows which contain the 4 smallest values when sorting on column a and b.

        >>> lf.bottom_k(4, by=["a", "b"]).collect()
        shape: (4, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ str ┆ i64 │
        ╞═════╪═════╡
        │ a   ┆ 1   │
        │ a   ┆ 2   │
        │ b   ┆ 1   │
        │ b   ┆ 2   │
        └─────┴─────┘
        r  r  r  )r%   r,   r	  r   r   bottom_kr	  s       r   r  zLazyFrame.bottom_k  sV    T ,B//gs2ww	4@@	 2 21W 2 M MNNNr   r   )      )r  r  r  r  no_optimizationr  r  r  r  r  	show_plottruncate_nodesr  r   r  r  r  r  tuple[int, int]_kwargstuple[DataFrame, DataFrame]c               (   |D ]}|dvrd| d}t          |          t          |          }|                                }|dk    |j        _        | j                            |j                  }t          ||dk    ddd          }|                    d          |                    d          }|	                    |          \  }}t          |          t          |          }}|rt          d	d
           ddlm} |                    d|          \  }}|d         d         }|                                }|dk    r/d}|                    t#          j        ddg          dz            }n7|dk    r/d}|                    t#          j        ddg          dz            }nd}|dk    rC|                    t#          j        d          j                            d|          dz             }|d         d         }|                    |d         |d         |d         z
  |d                    |                    d           |                    d| d| |            |                    d           |                                 ||fS ) u@  
        Profile a LazyFrame.

        This will run the query and return a tuple
        containing the materialized DataFrame and a DataFrame that
        contains profiling information of each node that is executed.

        The units of the timings are microseconds.

        Parameters
        ----------
        type_coercion
            Do type coercion optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        predicate_pushdown
            Do predicate pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        projection_pushdown
            Do projection pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        simplify_expression
            Run simplify expressions optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        no_optimization
            Turn off (certain) optimizations.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        slice_pushdown
            Slice pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        comm_subplan_elim
            Will try to cache branching subplans that occur on self-joins or unions.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        comm_subexpr_elim
            Common subexpressions will be cached and reused.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        cluster_with_columns
            Combine sequential independent calls to with_columns

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        collapse_joins
            Collapse a join and filters into a faster join

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        show_plot
            Show a gantt chart of the profiling result
        truncate_nodes
            Truncate the label lengths in the gantt chart to this number of
            characters.
        figsize
            matplotlib figsize of the profiling plot
        engine
            Select the engine used to process the query, optional.
            At the moment, if set to `"auto"` (default), the query
            is run using the polars in-memory engine. Polars will also
            attempt to use the engine set by the `POLARS_ENGINE_AFFINITY`
            environment variable. If it cannot run the query using the
            selected engine, the query is run using the polars in-memory
            engine. If set to `"gpu"`, the GPU engine is used. Fine-grained
            control over the GPU engine, for example which device to use
            on a system with multiple devices, is possible by providing a
            :class:`~.GPUEngine` object with configuration options.

            .. note::
               GPU mode is considered **unstable**. Not all queries will run
               successfully on the GPU, however, they should fall back transparently
               to the default engine if execution is not supported.

               Running with `POLARS_VERBOSE=1` will provide information if a query
               falls back (and why).

            .. note::
               The GPU engine does not support streaming, if streaming
               is enabled then GPU execution is switched off.
        optimizations
            The optimization passes done during query optimization.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.


        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["a", "b", "a", "b", "b", "c"],
        ...         "b": [1, 2, 3, 4, 5, 6],
        ...         "c": [6, 5, 4, 3, 2, 1],
        ...     }
        ... )
        >>> lf.group_by("a", maintain_order=True).agg(pl.all().sum()).sort(
        ...     "a"
        ... ).profile()  # doctest: +SKIP
        (shape: (3, 3)
         ┌─────┬─────┬─────┐
         │ a   ┆ b   ┆ c   │
         │ --- ┆ --- ┆ --- │
         │ str ┆ i64 ┆ i64 │
         ╞═════╪═════╪═════╡
         │ a   ┆ 4   ┆ 10  │
         │ b   ┆ 11  ┆ 10  │
         │ c   ┆ 6   ┆ 1   │
         └─────┴─────┴─────┘,
         shape: (3, 3)
         ┌─────────────────────────┬───────┬──────┐
         │ node                    ┆ start ┆ end  │
         │ ---                     ┆ ---   ┆ ---  │
         │ str                     ┆ u64   ┆ u64  │
         ╞═════════════════════════╪═══════╪══════╡
         │ optimization            ┆ 0     ┆ 5    │
         │ group_by_partitioned(a) ┆ 5     ┆ 470  │
         │ sort(a)                 ┆ 475   ┆ 1964 │
         └─────────────────────────┴───────┴──────┘)
        )post_opt_callbackz.profile() got an unexpected keyword argument 'r  r   Fr   r   r   r   r  N
matplotlibz+should be installed to show profiling plots)
err_suffixr   r  )r  endg    eAr  starti@B g    .Amsi  usnodez...)r
  leftzProfiling resultznode duration in [z	], total nodes)r   r   r,  r  r  r   r  r   getprofiler5   rS   matplotlib.pyplotpyplotsubplotsr  r  r  r  r   r4  barhtitle
set_xlabel
set_ylabelr  )r   r  r  r  r  r  r  r  r  r  r  r  r  r  r   r  r  r  r  r   callbackdftimingsplt_figaxmax_valtimings_unitmax_in_units                                 r   r"  zLazyFrame.profile  s   r  	+ 	+A    RQQQQ		***	
  ''%..0028O2K!/i**=+DEE'/
 
 
 ;;*++7{{#677Hkk(++GWW%5%5W #	H    ,+++++||Aw|77HD"enR(G((H}}#007G1H1H91TUU3#007G1H1H41OPP!!#00E&MM%++A~>>F  #5/!,KGG uo(99g&     II()))MMQtQQkQ4QQRRRMM'"""HHJJJ7{r   )r  r  r  r  r  r  r  r  r  r  r   r  r   Literal[True]r[   c                   d S r   rQ  r   r  r  r  r  r  r  r  r  r  r  r   r   r  s                 r   r  zLazyFrame.collect  s	    " r   )r  r  r  r  r  r  r  r  r  r  r   r   r  Literal[False]c                   d S r   rQ  r6  s                 r   r  zLazyFrame.collect  s	    " Cr   DataFrame | InProcessQueryc               `   |D ]}|dvrd| d}t          |          t          |          }|                    dd          pt                      dk    }|rd}|dv rt	          d           t          ||d	k    |||j        j        
          }t          |t                    rd}| j
                            |j                  }|r0t	          d           t          |                                          S |                    d|          }t          |                    ||                    S )u  
        Materialize this LazyFrame into a DataFrame.

        By default, all query optimizations are enabled. Individual optimizations may
        be disabled by setting the corresponding parameter to `False`.

        Parameters
        ----------
        type_coercion
            Do type coercion optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        predicate_pushdown
            Do predicate pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        projection_pushdown
            Do projection pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        simplify_expression
            Run simplify expressions optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        slice_pushdown
            Slice pushdown optimization.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        comm_subplan_elim
            Will try to cache branching subplans that occur on self-joins or unions.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        comm_subexpr_elim
            Common subexpressions will be cached and reused.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        cluster_with_columns
            Combine sequential independent calls to with_columns

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        collapse_joins
            Collapse a join and filters into a faster join

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        no_optimization
            Turn off (certain) optimizations.

            .. deprecated:: 1.30.0
                Use the `optimizations` parameters.
        engine
            Select the engine used to process the query, optional.
            At the moment, if set to `"auto"` (default), the query
            is run using the polars in-memory engine. Polars will also
            attempt to use the engine set by the `POLARS_ENGINE_AFFINITY`
            environment variable. If it cannot run the query using the
            selected engine, the query is run using the polars in-memory
            engine. If set to `"gpu"`, the GPU engine is used. Fine-grained
            control over the GPU engine, for example which device to use
            on a system with multiple devices, is possible by providing a
            :class:`~.GPUEngine` object with configuration options.

            .. note::
               GPU mode is considered **unstable**. Not all queries will run
               successfully on the GPU, however, they should fall back transparently
               to the default engine if execution is not supported.

               Running with `POLARS_VERBOSE=1` will provide information if a query
               falls back (and why).

            .. note::
               The GPU engine does not support streaming, or running in the
               background. If either are enabled, then GPU execution is switched off.
        background
            Run the query in the background and get a handle to the query.
            This handle can be used to fetch the result or cancel the query.

            .. warning::
                Background mode is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        optimizations
            The optimization passes done during query optimization.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.

        Returns
        -------
        DataFrame

        See Also
        --------
        explain : Print the query plan that is evaluated with collect.
        profile : Collect the LazyFrame and time each node in the computation graph.
        polars.collect_all : Collect multiple LazyFrames at the same time.
        polars.Config.set_streaming_chunk_size : Set the size of streaming batches.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["a", "b", "a", "b", "b", "c"],
        ...         "b": [1, 2, 3, 4, 5, 6],
        ...         "c": [6, 5, 4, 3, 2, 1],
        ...     }
        ... )
        >>> lf.group_by("a").agg(pl.all().sum()).collect()  # doctest: +SKIP
        shape: (3, 3)
        ┌─────┬─────┬─────┐
        │ a   ┆ b   ┆ c   │
        │ --- ┆ --- ┆ --- │
        │ str ┆ i64 ┆ i64 │
        ╞═════╪═════╪═════╡
        │ a   ┆ 4   ┆ 10  │
        │ b   ┆ 11  ┆ 10  │
        │ c   ┆ 6   ┆ 1   │
        └─────┴─────┴─────┘

        Collect in streaming mode

        >>> lf.group_by("a").agg(pl.all().sum()).collect(
        ...     engine="streaming"
        ... )  # doctest: +SKIP
        shape: (3, 3)
        ┌─────┬─────┬─────┐
        │ a   ┆ b   ┆ c   │
        │ --- ┆ --- ┆ --- │
        │ str ┆ i64 ┆ i64 │
        ╞═════╪═════╪═════╡
        │ a   ┆ 4   ┆ 10  │
        │ b   ┆ 11  ┆ 10  │
        │ c   ┆ 6   ┆ 1   │
        └─────┴─────┴─────┘

        Collect in GPU mode

        >>> lf.group_by("a").agg(pl.all().sum()).collect(engine="gpu")  # doctest: +SKIP
        shape: (3, 3)
        ┌─────┬─────┬─────┐
        │ a   ┆ b   ┆ c   │
        │ --- ┆ --- ┆ --- │
        │ str ┆ i64 ┆ i64 │
        ╞═════╪═════╪═════╡
        │ b   ┆ 11  ┆ 10  │
        │ a   ┆ 4   ┆ 10  │
        │ c   ┆ 6   ┆ 1   │
        └─────┴─────┴─────┘

        With control over the device used

        >>> lf.group_by("a").agg(pl.all().sum()).collect(
        ...     engine=pl.GPUEngine(device=1)
        ... )  # doctest: +SKIP
        shape: (3, 3)
        ┌─────┬─────┬─────┐
        │ a   ┆ b   ┆ c   │
        │ --- ┆ --- ┆ --- │
        │ str ┆ i64 ┆ i64 │
        ╞═════╪═════╪═════╡
        │ b   ┆ 11  ┆ 10  │
        │ a   ┆ 4   ┆ 10  │
        │ c   ┆ 6   ┆ 1   │
        └─────┴─────┴─────┘
        )r   r  z.collect() got an unexpected keyword argument 'r  r   Fr   )r   r   r  r   r  r   z'background mode is considered unstable.r  )r   r   r!  rb   r(   r   r  r  r   rY   r   r  r[   collect_concurrentlyr5   r  )r   r  r  r  r  r  r  r  r  r  r  r   r   r  r  r  r  r   r*  r   s                       r   r  zLazyFrame.collect  sp   B  	+ 	+A    RQQQQ		***  '' KK//W3F3H3HK3W 	  	! F333"#KLLL'/!' ,2
 
 
 fi(( 	Fi**=+DEE 	>"#LMMM!#":":"<"<=== ;;2H==s{{6844555r   )r   r  gevent!_GeventDataFrameResult[DataFrame]c                   d S r   rQ  r   r<  r   r  s       r   collect_asynczLazyFrame.collect_async  s	     -0Cr   )r<  r   r  Awaitable[DataFrame]c                   d S r   rQ  r?  s       r   r@  zLazyFrame.collect_async	  s	      #sr   8Awaitable[DataFrame] | _GeventDataFrameResult[DataFrame]c                   t          |          }|dv rt          d           | j                            |j                  }|rt                      nt                      }|                    ||j                   |S )u~  
        Collect DataFrame asynchronously in thread pool.

        .. warning::
            This functionality is considered **unstable**. It may be changed
            at any point without it being considered a breaking change.

        Collects into a DataFrame (like :func:`collect`) but, instead of returning
        a DataFrame directly, it is scheduled to be collected inside a thread pool,
        while this method returns almost instantly.

        This can be useful if you use `gevent` or `asyncio` and want to release
        control to other greenlets/tasks while LazyFrames are being collected.

        Parameters
        ----------
        gevent
            Return wrapper to `gevent.event.AsyncResult` instead of Awaitable
        engine
            Select the engine used to process the query, optional.
            At the moment, if set to `"auto"` (default), the query
            is run using the polars in-memory engine. Polars will also
            attempt to use the engine set by the `POLARS_ENGINE_AFFINITY`
            environment variable. If it cannot run the query using the
            selected engine, the query is run using the polars in-memory
            engine.

            .. note::
               The GPU engine does not support async, or running in the
               background. If either are enabled, then GPU execution is switched off.
        optimizations
            The optimization passes done during query optimization.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.

        Returns
        -------
        If `gevent=False` (default) then returns an awaitable.

        If `gevent=True` then returns wrapper that has a
        `.get(block=True, timeout=None)` method.

        See Also
        --------
        polars.collect_all : Collect multiple LazyFrames at the same time.
        polars.collect_all_async : Collect multiple LazyFrames at the same time lazily.

        Notes
        -----
        In case of error `set_exception` is used on
        `asyncio.Future`/`gevent.event.AsyncResult` and will be reraised by them.

        Examples
        --------
        >>> import asyncio
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["a", "b", "a", "b", "b", "c"],
        ...         "b": [1, 2, 3, 4, 5, 6],
        ...         "c": [6, 5, 4, 3, 2, 1],
        ...     }
        ... )
        >>> async def main():
        ...     return await (
        ...         lf.group_by("a", maintain_order=True)
        ...         .agg(pl.all().sum())
        ...         .collect_async()
        ...     )
        >>> asyncio.run(main())
        shape: (3, 3)
        ┌─────┬─────┬─────┐
        │ a   ┆ b   ┆ c   │
        │ --- ┆ --- ┆ --- │
        │ str ┆ i64 ┆ i64 │
        ╞═════╪═════╪═════╡
        │ a   ┆ 4   ┆ 10  │
        │ b   ┆ 11  ┆ 10  │
        │ c   ┆ 6   ┆ 1   │
        └─────┴─────┴─────┘
        r  r  )	r   r(   r   r  r  r   r   collect_with_callback	_callback)r   r<  r   r  r   results         r   r@  zLazyFrame.collect_async	  s    t  ''333"#KLLLi**=+DEE )/I"$$$4G4I4I 	 	!!&&*:;;;r   c                R    t          | j                                        d          S )a  
        Resolve the schema of this LazyFrame.

        Examples
        --------
        Determine the schema.

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [6.0, 7.0, 8.0],
        ...         "ham": ["a", "b", "c"],
        ...     }
        ... )
        >>> lf.collect_schema()
        Schema({'foo': Int64, 'bar': Float64, 'ham': String})

        Access various properties of the schema.

        >>> schema = lf.collect_schema()
        >>> schema["bar"]
        Float64
        >>> schema.names()
        ['foo', 'bar', 'ham']
        >>> schema.dtypes()
        [Int64, Float64, String]
        >>> schema.len()
        3
        F)check_dtypes)r^   r   r   r   s    r   r   zLazyFrame.collect_schemaw	  s%    < di..00uEEEEr   zstd   )compressioncompression_level
statisticsrow_group_sizedata_page_sizer  storage_optionscredential_providerretriessync_on_closemkdirr   field_overwritesr   metadatar  r   +str | Path | IO[bytes] | PartitioningSchemerL  rM  rN  bool | str | dict[str, bool]rO  rP  rQ  dict[str, Any] | NonerR  3CredentialProviderFunction | Literal['auto'] | NonerS  rT  SyncOnCloseMethod | NonerU  r   rV  gParquetFieldOverwrites | Sequence[ParquetFieldOverwrites] | Mapping[str, ParquetFieldOverwrites] | NonerW  ParquetMetadata | Nonec                   d S r   rQ  r   r   rL  rM  rN  rO  rP  r  rQ  rR  rS  rT  rU  r   rV  r   rW  r  s                     r   sink_parquetzLazyFrame.sink_parquet	  s	    4 sr   )rL  rM  rN  rO  rP  r  rQ  rR  rS  rT  rU  rV  r   rW  r  c                   d S r   rQ  r`  s                     r   ra  zLazyFrame.sink_parquet	  s	    4 Cr   )rL  rM  rN  rO  rP  r  rQ  rR  rS  rT  rW  rU  r   rV  r   r  LazyFrame | Nonec                  t          |          }|d}t          |           t          |t                    r
|rddddd}n't          |t                    r|si }n|dk    rddddd}ddlm}  ||	||d	          }~	|r"t          |                                          }nd}t          |          }|pd
||d}t          |t                    r'|r"t          |                                          }n!d}nt          |          rt          |          }g }|ddl}ddlm}m}m t          ||          r |          g}n}t          ||j        j                  r |t          |                    }nJt          ||j        j                  rfd|D             }n!dt)          |           }t+          |          | j                            |||||||||
|||          }|sL|                    |j                  }t4                              |          }|                    |           dS t4                              |          S )a?  
        Evaluate the query in streaming mode and write to a Parquet file.

        This allows streaming results that are larger than RAM to be written to disk.

        Parameters
        ----------
        path
            File path to which the file should be written.
        compression : {'lz4', 'uncompressed', 'snappy', 'gzip', 'lzo', 'brotli', 'zstd'}
            Choose "zstd" for good compression performance.
            Choose "lz4" for fast compression/decompression.
            Choose "snappy" for more backwards compatibility guarantees
            when you deal with older parquet readers.
        compression_level
            The level of compression to use. Higher compression means smaller files on
            disk.

            - "gzip" : min-level: 0, max-level: 9.
            - "brotli" : min-level: 0, max-level: 11.
            - "zstd" : min-level: 1, max-level: 22.
        statistics
            Write statistics to the parquet headers. This is the default behavior.

            Possible values:

            - `True`: enable default set of statistics (default). Some
              statistics may be disabled.
            - `False`: disable all statistics
            - "full": calculate and write all available statistics. Cannot be
              combined with `use_pyarrow`.
            - `{ "statistic-key": True / False, ... }`. Cannot be combined with
              `use_pyarrow`. Available keys:

              - "min": column minimum value (default: `True`)
              - "max": column maximum value (default: `True`)
              - "distinct_count": number of unique column values (default: `False`)
              - "null_count": number of null values in column (default: `True`)
        row_group_size
            Size of the row groups in number of rows.
            If None (default), the chunks of the `DataFrame` are
            used. Writing in smaller chunks may reduce memory pressure and improve
            writing speeds.
        data_page_size
            Size limit of individual data pages.
            If not set defaults to 1024 * 1024 bytes
        maintain_order
            Maintain the order in which data is processed.
            Setting this to `False` will be slightly faster.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        storage_options
            Options that indicate how to connect to a cloud provider.

            The cloud providers currently supported are AWS, GCP, and Azure.
            See supported keys here:

            * `aws <https://docs.rs/object_store/latest/object_store/aws/enum.AmazonS3ConfigKey.html>`_
            * `gcp <https://docs.rs/object_store/latest/object_store/gcp/enum.GoogleConfigKey.html>`_
            * `azure <https://docs.rs/object_store/latest/object_store/azure/enum.AzureConfigKey.html>`_
            * Hugging Face (`hf://`): Accepts an API key under the `token` parameter:             `{'token': '...'}`, or by setting the `HF_TOKEN` environment variable.

            If `storage_options` is not provided, Polars will try to infer the
            information from environment variables.
        credential_provider
            Provide a function that can be called to provide cloud storage
            credentials. The function is expected to return a dictionary of
            credential keys along with an optional credential expiry time.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        retries
            Number of retries if accessing a cloud instance fails.
        sync_on_close: { None, 'data', 'all' }
            Sync to disk when before closing a file.

            * `None` does not sync.
            * `data` syncs the file contents.
            * `all` syncs the file contents and metadata.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        metadata
            A dictionary or callback to add key-values to the file-level Parquet
            metadata.

            .. warning::
                This functionality is considered **experimental**. It may be removed or
                changed at any point without it being considered a breaking change.
        mkdir: bool
            Recursively create all the directories in the path.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        lazy: bool
            Wait to start execution until `collect` is called.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        field_overwrites
            Property overwrites for individual Parquet fields.

            This allows more control over the writing process to the granularity of a
            Parquet field.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        engine
            Select the engine used to process the query, optional.
            At the moment, if set to `"auto"` (default), the query is run
            using the polars streaming engine. Polars will also
            attempt to use the engine set by the `POLARS_ENGINE_AFFINITY`
            environment variable. If it cannot run the query using the
            selected engine, the query is run using the polars streaming
            engine.
        optimizations
            The optimization passes done during query optimization.

            This has no effect if `lazy` is set to `True`.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.

        Returns
        -------
        DataFrame

        Examples
        --------
        >>> lf = pl.scan_csv("/path/to/my_larger_than_ram_file.csv")  # doctest: +SKIP
        >>> lf.sink_parquet("out.parquet")  # doctest: +SKIP
        Nz/`metadata` parameter is considered experimentalTF)rs  r{  distinct_countrp  fullr   !_init_credential_provider_builderra  nonerT  r  rU  )r   +_parquet_field_overwrites_dict_to_dict_list!_parquet_field_overwrites_to_dictc                &    g | ]} |          S rQ  rQ  )rx  r  rl  s     r   r  z*LazyFrame.sink_parquet.<locals>.<listcomp>
  s2     * * *=>55a88* * *r   z$field_overwrites got the wrong type )targetrL  rM  rN  rO  rP  cloud_optionsrR  rS  sink_optionsrW  rV  r   )r   r(   r   r   ,polars.io.cloud.credential_provider._builderrh  r   r   r   r  r   r#   collections"polars.io.parquet.field_overwritesr   rk  rl  abcr   re   typer   r   ra  r  r  r   r   r  )r   r   rL  rM  rN  rO  rP  r  rQ  rR  rS  rT  rW  rU  r   rV  r   r  r   rh  credential_provider_builderrn  rp  field_overwrites_dictsrr  r   rk  r   rl  s                               @r   ra  zLazyFrame.sink_parquet	  sW   N  ''CC"3'''j$'' 	J 	"'"	 JJ 
D)) 	* 	JJ6!!"&"	 J	
 	
 	
 	
 	
 	
 'H&G'
 '
#   	#"?#8#8#:#:;;OO #O &&*4f,
 
 h%% 	@   0 011  h 	@5h??H 8:'          *,BCC %556FGG*&& ,ko.EFF 
%)T)T)*** *&& ,ko.FGG %* * * *BR* * *&& VTBR=S=SUUnn$i$$#/!))) ;%3 % 
 
  	(()BCCC'',,CKKvK&&&4$$S)))r   )rL  compat_levelr  rQ  rR  rS  rT  rU  r   r   r  IpcCompression | Nonerx  CompatLevel | Nonec                   d S r   rQ  r   r   rL  rx  r  rQ  rR  rS  rT  rU  r   r   r  s                r   sink_ipczLazyFrame.sink_ipc
  s	    $ sr   )
rL  rx  r  rQ  rR  rS  rT  rU  r   r  c                   d S r   rQ  r|  s                r   r}  zLazyFrame.sink_ipc
  s	    $ Cr   uncompressedc          	         t          |          }ddlm}  ||||d          }~|r"t          |                                          }nd}t          |          }|pd||	d}|d}nt          |t                    r|j        }|d}| j	        
                    |||||||	          }|
sL|                    |j                  }t                              |          }|                    |
           dS t                              |          S )a  
        Evaluate the query in streaming mode and write to an IPC file.

        This allows streaming results that are larger than RAM to be written to disk.

        Parameters
        ----------
        path
            File path to which the file should be written.
        compression : {'uncompressed', 'lz4', 'zstd'}
            Choose "zstd" for good compression performance.
            Choose "lz4" for fast compression/decompression.
        compat_level
            Use a specific compatibility level
            when exporting Polars' internal data structures.
        maintain_order
            Maintain the order in which data is processed.
            Setting this to `False` will be slightly faster.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        storage_options
            Options that indicate how to connect to a cloud provider.

            The cloud providers currently supported are AWS, GCP, and Azure.
            See supported keys here:

            * `aws <https://docs.rs/object_store/latest/object_store/aws/enum.AmazonS3ConfigKey.html>`_
            * `gcp <https://docs.rs/object_store/latest/object_store/gcp/enum.GoogleConfigKey.html>`_
            * `azure <https://docs.rs/object_store/latest/object_store/azure/enum.AzureConfigKey.html>`_
            * Hugging Face (`hf://`): Accepts an API key under the `token` parameter:             `{'token': '...'}`, or by setting the `HF_TOKEN` environment variable.

            If `storage_options` is not provided, Polars will try to infer the
            information from environment variables.
        credential_provider
            Provide a function that can be called to provide cloud storage
            credentials. The function is expected to return a dictionary of
            credential keys along with an optional credential expiry time.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        retries
            Number of retries if accessing a cloud instance fails.
        sync_on_close: { None, 'data', 'all' }
            Sync to disk when before closing a file.

            * `None` does not sync.
            * `data` syncs the file contents.
            * `all` syncs the file contents and metadata.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        mkdir: bool
            Recursively create all the directories in the path.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        lazy: bool
            Wait to start execution until `collect` is called.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        engine
            Select the engine used to process the query, optional.
            At the moment, if set to `"auto"` (default), the query is run
            using the polars streaming engine. Polars will also
            attempt to use the engine set by the `POLARS_ENGINE_AFFINITY`
            environment variable. If it cannot run the query using the
            selected engine, the query is run using the polars streaming
            engine.

            .. note::
               The GPU engine is currently not supported.
        optimizations
            The optimization passes done during query optimization.

            This has no effect if `lazy` is set to `True`.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.

        Returns
        -------
        DataFrame

        Examples
        --------
        >>> lf = pl.scan_csv("/path/to/my_larger_than_ram_file.csv")  # doctest: +SKIP
        >>> lf.sink_ipc("out.arrow")  # doctest: +SKIP
        r   rg  r}  Nri  rj  Tr  )rn  rL  rx  ro  rR  rS  rp  r   )r   rq  rh  r   r   r   r   rX   _versionr   r}  r  r  r   r   r  )r   r   rL  rx  r  rQ  rR  rS  rT  rU  r   r   r  rh  rv  rn  rp  r   s                     r   r}  zLazyFrame.sink_ipc  sj   f  ''	
 	
 	
 	
 	
 	
 'H&G
'
 '
#   	#"?#8#8#:#:;;OO #O &&*4f,
 
 LLk22 	1'0L(Ki  #%) ;% ! 
 
  	(()BCCC'',,CKKvK&&&4$$S)))r   ,rE  r  i   )include_bominclude_header	separatorline_terminator
quote_char
batch_sizedatetime_formatdate_formattime_formatfloat_scientificfloat_precision
null_valuequote_styler  rQ  rR  rS  rT  rU  r   r   r  r   r  r  r  r  r  r  r  r  r  r  r  r  r  CsvQuoteStyle | Nonec                   d S r   rQ  r   r   r  r  r  r  r  r  r  r  r  r  r  r  r  r  rQ  rR  rS  rT  rU  r   r   r  s                           r   sink_csvzLazyFrame.sink_csv  s	    : sr   )r  r  r  r  r  r  r  r  r  r  r  r  r  r  rQ  rR  rS  rT  rU  r   r  c                   d S r   rQ  r  s                           r   r  zLazyFrame.sink_csv  s	    : Cr   c               l   ddl m}  |d|d            |d|d           |sd}t          |          }ddlm}  ||||d	          }~|r"t          |                                          }nd}t          |          }|pd
||d}| j        	                    |||t          |          |t          |          |||	|
||||||||          }|sL|                    |j                  }t                              |          }|                    |           dS t                              |          S )a  
        Evaluate the query in streaming mode and write to a CSV file.

        This allows streaming results that are larger than RAM to be written to disk.

        Parameters
        ----------
        path
            File path to which the file should be written.
        include_bom
            Whether to include UTF-8 BOM in the CSV output.
        include_header
            Whether to include header in the CSV output.
        separator
            Separate CSV fields with this symbol.
        line_terminator
            String used to end each row.
        quote_char
            Byte to use as quoting character.
        batch_size
            Number of rows that will be processed per thread.
        datetime_format
            A format string, with the specifiers defined by the
            `chrono <https://docs.rs/chrono/latest/chrono/format/strftime/index.html>`_
            Rust crate. If no format specified, the default fractional-second
            precision is inferred from the maximum timeunit found in the frame's
            Datetime cols (if any).
        date_format
            A format string, with the specifiers defined by the
            `chrono <https://docs.rs/chrono/latest/chrono/format/strftime/index.html>`_
            Rust crate.
        time_format
            A format string, with the specifiers defined by the
            `chrono <https://docs.rs/chrono/latest/chrono/format/strftime/index.html>`_
            Rust crate.
        float_scientific
            Whether to use scientific form always (true), never (false), or
            automatically (None) for `Float32` and `Float64` datatypes.
        float_precision
            Number of decimal places to write, applied to both `Float32` and
            `Float64` datatypes.
        null_value
            A string representing null values (defaulting to the empty string).
        quote_style : {'necessary', 'always', 'non_numeric', 'never'}
            Determines the quoting strategy used.

            - necessary (default): This puts quotes around fields only when necessary.
              They are necessary when fields contain a quote,
              delimiter or record terminator.
              Quotes are also necessary when writing an empty record
              (which is indistinguishable from a record with one empty field).
              This is the default.
            - always: This puts quotes around every field. Always.
            - never: This never puts quotes around fields, even if that results in
              invalid CSV data (e.g.: by not quoting strings containing the
              separator).
            - non_numeric: This puts quotes around all fields that are non-numeric.
              Namely, when writing a field that does not parse as a valid float
              or integer, then quotes will be used even if they aren`t strictly
              necessary.
        maintain_order
            Maintain the order in which data is processed.
            Setting this to `False` will be slightly faster.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        storage_options
            Options that indicate how to connect to a cloud provider.

            The cloud providers currently supported are AWS, GCP, and Azure.
            See supported keys here:

            * `aws <https://docs.rs/object_store/latest/object_store/aws/enum.AmazonS3ConfigKey.html>`_
            * `gcp <https://docs.rs/object_store/latest/object_store/gcp/enum.GoogleConfigKey.html>`_
            * `azure <https://docs.rs/object_store/latest/object_store/azure/enum.AzureConfigKey.html>`_
            * Hugging Face (`hf://`): Accepts an API key under the `token` parameter:             `{'token': '...'}`, or by setting the `HF_TOKEN` environment variable.

            If `storage_options` is not provided, Polars will try to infer the
            information from environment variables.
        credential_provider
            Provide a function that can be called to provide cloud storage
            credentials. The function is expected to return a dictionary of
            credential keys along with an optional credential expiry time.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        retries
            Number of retries if accessing a cloud instance fails.
        sync_on_close: { None, 'data', 'all' }
            Sync to disk when before closing a file.

            * `None` does not sync.
            * `data` syncs the file contents.
            * `all` syncs the file contents and metadata.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        mkdir: bool
            Recursively create all the directories in the path.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        lazy: bool
            Wait to start execution until `collect` is called.

            .. warning::
                This functionality is considered **unstable**. It may be changed at any
                point without it being considered a breaking change.
        engine
            Select the engine used to process the query, optional.
            At the moment, if set to `"auto"` (default), the query is run
            using the polars streaming engine. Polars will also
            attempt to use the engine set by the `POLARS_ENGINE_AFFINITY`
            environment variable. If it cannot run the query using the
            selected engine, the query is run using the polars streaming
            engine.
        optimizations
            The optimization passes done during query optimization.

            This has no effect if `lazy` is set to `True`.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.

        Returns
        -------
        DataFrame

        Examples
        --------
        >>> lf = pl.scan_csv("/path/to/my_larger_than_ram_file.csv")  # doctest: +SKIP
        >>> lf.sink_csv("out.csv")  # doctest: +SKIP
        r   )_check_arg_is_1byter  F)can_be_emptyr  Nrg  r  ri  rj  )rn  r  r  r  r  r  r  r  r  r  r  r  r  r  ro  rR  rS  rp  r   )polars.io.csv._utilsr  r   rq  rh  r   r   r   r   r  ordr  r  r   r   r  )r   r   r  r  r  r  r  r  r  r  r  r  r  r  r  r  rQ  rR  rS  rT  rU  r   r   r  r  rh  rv  rn  rp  r   s                                 r   r  zLazyFrame.sink_csv  s   P 	=<<<<<KGGGGL*5IIII 	J''	
 	
 	
 	
 	
 	
 'H&G
'
 '
#   	#"?#8#8#:#:;;OO #O &&*4f,
 
 i  #))nn+:!+##-+!#) ;%% ! 
 
*  	(()BCCC'',,CKKvK&&&4$$S)))r   )	r  rQ  rR  rS  rT  rU  r   r   r  c       	            d S r   rQ  r   r   r  rQ  rR  rS  rT  rU  r   r   r  s              r   sink_ndjsonzLazyFrame.sink_ndjson  s	      sr   )r  rQ  rR  rS  rT  rU  r   r  c       	            d S r   rQ  r  s              r   r  zLazyFrame.sink_ndjson  s	      Cr   c       	           t          |	          }	ddlm}  ||||d          }~|r"t          |                                          }nd}t          |          }|pd||d}| j                            |||||          }|sL|                    |
j	                  }t                              |          }|                    |	           dS t                              |          S )	aX  
        Evaluate the query in streaming mode and write to an NDJSON file.

        This allows streaming results that are larger than RAM to be written to disk.

        Parameters
        ----------
        path
            File path to which the file should be written.
        maintain_order
            Maintain the order in which data is processed.
            Setting this to `False` will be slightly faster.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        storage_options
            Options that indicate how to connect to a cloud provider.

            The cloud providers currently supported are AWS, GCP, and Azure.
            See supported keys here:

            * `aws <https://docs.rs/object_store/latest/object_store/aws/enum.AmazonS3ConfigKey.html>`_
            * `gcp <https://docs.rs/object_store/latest/object_store/gcp/enum.GoogleConfigKey.html>`_
            * `azure <https://docs.rs/object_store/latest/object_store/azure/enum.AzureConfigKey.html>`_
            * Hugging Face (`hf://`): Accepts an API key under the `token` parameter:             `{'token': '...'}`, or by setting the `HF_TOKEN` environment variable.

            If `storage_options` is not provided, Polars will try to infer the
            information from environment variables.
        credential_provider
            Provide a function that can be called to provide cloud storage
            credentials. The function is expected to return a dictionary of
            credential keys along with an optional credential expiry time.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        retries
            Number of retries if accessing a cloud instance fails.
        sync_on_close: { None, 'data', 'all' }
            Sync to disk when before closing a file.

            * `None` does not sync.
            * `data` syncs the file contents.
            * `all` syncs the file contents and metadata.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        mkdir: bool
            Recursively create all the directories in the path.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        lazy: bool
            Wait to start execution until `collect` is called.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.
        engine
            Select the engine used to process the query, optional.
            At the moment, if set to `"auto"` (default), the query is run
            using the polars streaming engine. Polars will also
            attempt to use the engine set by the `POLARS_ENGINE_AFFINITY`
            environment variable. If it cannot run the query using the
            selected engine, the query is run using the polars streaming
            engine.
        optimizations
            The optimization passes done during query optimization.

            This has no effect if `lazy` is set to `True`.

            .. warning::
                This functionality is considered **unstable**. It may be changed
                at any point without it being considered a breaking change.

        Returns
        -------
        DataFrame

        Examples
        --------
        >>> lf = pl.scan_csv("/path/to/my_larger_than_ram_file.csv")  # doctest: +SKIP
        >>> lf.sink_ndjson("out.ndjson")  # doctest: +SKIP
        r   rg  r  Nri  rj  )rn  ro  rR  rS  rp  r   )r   rq  rh  r   r   r   r   	sink_jsonr  r  r   r   r  )r   r   r  rQ  rR  rS  rT  rU  r   r   r  rh  rv  rn  rp  r   s                   r   r  zLazyFrame.sink_ndjson  s2   P  ''	
 	
 	
 	
 	
 	
 'H&G'
 '
#   	#"?#8#8#:#:;;OO #O &&*4f,
 
 i!!) ;% " 
 
  	(()BCCC'',,CKKvK&&&4$$S)))r   zg`LazyFrame.fetch` is deprecated; use `LazyFrame.collect` instead, in conjunction with a call to `head`.  )r  r  r  r  r  r  r  r  r  r  r  n_rowsc               D    |                      |||||||||	|
||          S )a  
        Collect a small number of rows for debugging purposes.

        .. deprecated:: 1.0
            Use :meth:`collect` instead, in conjunction with a call to :meth:`head`.`

        Notes
        -----
        This is similar to a :func:`collect` operation, but it overwrites the number of
        rows read by *every* scan operation. Be aware that `fetch` does not guarantee
        the final number of rows in the DataFrame. Filters, join operations and fewer
        rows being available in the scanned data will all influence the final number
        of rows (joins are especially susceptible to this, and may return no data
        at all if `n_rows` is too small as the join keys may not be present).

        Warnings
        --------
        This is strictly a utility function that can help to debug queries using a
        smaller number of rows, and should *not* be used in production code.
        )r  r  r  r  r  r  r  r  r  r  r  r  )_fetch)r   r  r  r  r  r  r  r  r  r  r  r  r  s                r   fetchzLazyFrame.fetch{  sD    P {{'#1 3 3+)//!5)  
 
 	
r   )r  r  r  r  r  r  r  r  r  r  r  r  c                   |rd}d}d}d}	d}
d}d}|}| j                             |||||||	|
||dd|d          }t          |                    |                    S )uM
  
        Collect a small number of rows for debugging purposes.

        Do not confuse with `collect`; this function will frequently return
        incorrect data (see the warning for additional details).

        Parameters
        ----------
        n_rows
            Collect n_rows from the data sources.
        type_coercion
            Run type coercion optimization.
        predicate_pushdown
            Run predicate pushdown optimization.
        projection_pushdown
            Run projection pushdown optimization.
        simplify_expression
            Run simplify expressions optimization.
        no_optimization
            Turn off optimizations.
        slice_pushdown
            Slice pushdown optimization
        comm_subplan_elim
            Will try to cache branching subplans that occur on self-joins or unions.
        comm_subexpr_elim
            Common subexpressions will be cached and reused.
        cluster_with_columns
            Combine sequential independent calls to with_columns
        collapse_joins
            Collapse a join and filters into a faster join

        Notes
        -----
        This is similar to a :func:`collect` operation, but it overwrites the number of
        rows read by *every* scan operation. Be aware that `fetch` does not guarantee
        the final number of rows in the DataFrame. Filters, join operations and fewer
        rows being available in the scanned data will all influence the final number
        of rows (joins are especially susceptible to this, and may return no data
        at all if `n_rows` is too small as the join keys may not be present).

        Warnings
        --------
        This is strictly a utility function that can help to debug queries using a
        smaller number of rows, and should *not* be used in production code.

        Returns
        -------
        DataFrame

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["a", "b", "a", "b", "b", "c"],
        ...         "b": [1, 2, 3, 4, 5, 6],
        ...         "c": [6, 5, 4, 3, 2, 1],
        ...     }
        ... )
        >>> lf.group_by("a", maintain_order=True).agg(pl.all().sum())._fetch(2)
        shape: (2, 3)
        ┌─────┬─────┬─────┐
        │ a   ┆ b   ┆ c   │
        │ --- ┆ --- ┆ --- │
        │ str ┆ i64 ┆ i64 │
        ╞═════╪═════╪═════╡
        │ a   ┆ 1   ┆ 6   │
        │ b   ┆ 2   ┆ 5   │
        └─────┴─────┴─────┘
        F)r  
type_checkr  r  r  r  r  r  r  r  r   r   r  r   )r   optimization_toggler5   r  )r   r  r  r  r  r  r  r  r  r  r  r  r  r  r  lfs                   r   r  zLazyFrame._fetch  s    l  	#!&"'"N % %#( "N 
Y**'!1 3 3)//!5)% + 
 
  rxx''(((r   c                    | S )aY  
        Return lazy representation, i.e. itself.

        Useful for writing code that expects either a :class:`DataFrame` or
        :class:`LazyFrame`. On LazyFrame this is a no-op, and returns the same object.

        Returns
        -------
        LazyFrame

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [None, 2, 3, 4],
        ...         "b": [0.5, None, 2.5, 13],
        ...         "c": [True, True, False, None],
        ...     }
        ... )
        >>> lf.lazy()  # doctest: +ELLIPSIS
        <LazyFrame at ...>
        rQ  r   s    r   r   zLazyFrame.lazy$  s	    . r   c                Z    |                      | j                                                  S )z
        Cache the result once the execution of the physical plan hits this node.

        It is not recommended using this as the optimizer likely can do a better job.
        )r   r   cacher   s    r   r  zLazyFrame.cache=  s$     	 1 1222r   r   r  `Mapping[ColumnNameOrSelector | PolarsDataType, PolarsDataType | PythonDataType] | PolarsDataTypec          	        t          |t                    s=t          |          }|                     | j                            ||                    S i }|                                D ]\  }}t          |          sCt          |t                    s.t          |t                    r(t          d |D                       rt          |          }t          |          }|                    t          |t                    r||in(t                              t!          | |          |                     |                     | j                            ||                    S )uS  
        Cast LazyFrame column(s) to the specified dtype(s).

        Parameters
        ----------
        dtypes
            Mapping of column names (or selector) to dtypes, or a single dtype
            to which all columns will be cast.
        strict
            Throw an error if a cast could not be done (for instance, due to an
            overflow).

        Examples
        --------
        >>> from datetime import date
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [6.0, 7.0, 8.0],
        ...         "ham": [date(2020, 1, 2), date(2021, 3, 4), date(2022, 5, 6)],
        ...     }
        ... )

        Cast specific frame columns to the specified dtypes:

        >>> lf.cast({"foo": pl.Float32, "bar": pl.UInt8}).collect()
        shape: (3, 3)
        ┌─────┬─────┬────────────┐
        │ foo ┆ bar ┆ ham        │
        │ --- ┆ --- ┆ ---        │
        │ f32 ┆ u8  ┆ date       │
        ╞═════╪═════╪════════════╡
        │ 1.0 ┆ 6   ┆ 2020-01-02 │
        │ 2.0 ┆ 7   ┆ 2021-03-04 │
        │ 3.0 ┆ 8   ┆ 2022-05-06 │
        └─────┴─────┴────────────┘

        Cast all frame columns matching one dtype (or dtype group) to another dtype:

        >>> lf.cast({pl.Date: pl.Datetime}).collect()
        shape: (3, 3)
        ┌─────┬─────┬─────────────────────┐
        │ foo ┆ bar ┆ ham                 │
        │ --- ┆ --- ┆ ---                 │
        │ i64 ┆ f64 ┆ datetime[μs]        │
        ╞═════╪═════╪═════════════════════╡
        │ 1   ┆ 6.0 ┆ 2020-01-02 00:00:00 │
        │ 2   ┆ 7.0 ┆ 2021-03-04 00:00:00 │
        │ 3   ┆ 8.0 ┆ 2022-05-06 00:00:00 │
        └─────┴─────┴─────────────────────┘

        Use selectors to define the columns being cast:

        >>> import polars.selectors as cs
        >>> lf.cast({cs.numeric(): pl.UInt32, cs.temporal(): pl.String}).collect()
        shape: (3, 3)
        ┌─────┬─────┬────────────┐
        │ foo ┆ bar ┆ ham        │
        │ --- ┆ --- ┆ ---        │
        │ u32 ┆ u32 ┆ str        │
        ╞═════╪═════╪════════════╡
        │ 1   ┆ 6   ┆ 2020-01-02 │
        │ 2   ┆ 7   ┆ 2021-03-04 │
        │ 3   ┆ 8   ┆ 2022-05-06 │
        └─────┴─────┴────────────┘

        Cast all frame columns to the specified dtype:

        >>> lf.cast(pl.String).collect().to_dict(as_series=False)
        {'foo': ['1', '2', '3'],
         'bar': ['6.0', '7.0', '8.0'],
         'ham': ['2020-01-02', '2021-03-04', '2022-05-06']}
        c              3  4   K   | ]}t          |          V  d S r   )rO   rx  xs     r   rz  z!LazyFrame.cast.<locals>.<genexpr>  s*      1P1P/!2D2D1P1P1P1P1P1Pr   )r   r   rP   r   r   cast_allr   rO   rQ   r   allr_   updater   r  fromkeysr`   r  )r   r  r   cast_mapr  r  s         r   r  zLazyFrame.castE  sN   h &'** 	H%f--F##DI$6$6vv$F$FGGG 	 	HAu""  jM&B&B  1j)) .11P1Pa1P1P1P.P.P  QKK$U++EOOa%%DE

]]?4#;#;UCC    	x @ @AAAr   r  c                    t          j        |                                                               |                                          S )u  
        Create an empty copy of the current LazyFrame, with zero to 'n' rows.

        Returns a copy with an identical schema but no data.

        Parameters
        ----------
        n
            Number of (empty) rows to return in the cleared frame.

        See Also
        --------
        clone : Cheap deepcopy/clone.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [None, 2, 3, 4],
        ...         "b": [0.5, None, 2.5, 13],
        ...         "c": [True, True, False, None],
        ...     }
        ... )
        >>> lf.clear().collect()
        shape: (0, 3)
        ┌─────┬─────┬──────┐
        │ a   ┆ b   ┆ c    │
        │ --- ┆ --- ┆ ---  │
        │ i64 ┆ f64 ┆ bool │
        ╞═════╪═════╪══════╡
        └─────┴─────┴──────┘

        >>> lf.clear(2).collect()
        shape: (2, 3)
        ┌──────┬──────┬──────┐
        │ a    ┆ b    ┆ c    │
        │ ---  ┆ ---  ┆ ---  │
        │ i64  ┆ f64  ┆ bool │
        ╞══════╪══════╪══════╡
        │ null ┆ null ┆ null │
        │ null ┆ null ┆ null │
        └──────┴──────┴──────┘
        )r   )r  rl   r   clearr   r   r  s     r   r  zLazyFrame.clear  s>    X |4#6#6#8#8999??BBGGIIIr   c                Z    |                      | j                                                  S )aH  
        Create a copy of this LazyFrame.

        This is a cheap operation that does not copy data.

        See Also
        --------
        clear : Create an empty copy of the current LazyFrame, with identical
            schema but no data.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [None, 2, 3, 4],
        ...         "b": [0.5, None, 2.5, 13],
        ...         "c": [True, True, False, None],
        ...     }
        ... )
        >>> lf.clone()  # doctest: +ELLIPSIS
        <LazyFrame at ...>
        )r   r   r+  r   s    r   r+  zLazyFrame.clone  s$    . 	 1 1222r   )invert
predicates`tuple[IntoExprColumn | Iterable[IntoExprColumn] | bool | list[bool] | np.ndarray[Any, Any], ...]constraintsdict[str, Any]r  c                  g }g }|D ]u}|du r|s|du r|s|du r|s|du r|s|                                  c S t          |          rt          |          }t          |d          r/|                    t          j        |t                               t          |          x}rt          d |D                       sG|st          |t
          j                  sst          |t                    r||                                 v sHt          |t
          j                  rd|j         dnt          |          }d| }	t!          |	          |                    d	 t%          |          D                        w|                    d
 |                                D                        |s|sd}	t!          |	          |r)t)          |          dk    rt+          j        | n	|d         nd}
|r0t+          j        t1          t2          |                    }|
|n||
z  }
|
|                     | j                  S |r| j        j        n| j        j        }|                      ||
j                            S )z"Common code for filter/remove ops.FT)include_series)r  c              3  L   K   | ]}t          |t          j                   V   d S r   )r   r  rn   r  s     r   rz  z$LazyFrame._filter.<locals>.<genexpr>  s1      >>qJq"'222>>>>>>r   u   Series(…, dtype=)z invalid predicate for `filter`: c              3  4   K   | ]}t          |          V  d S r   )r6   r  s     r   rz  z$LazyFrame._filter.<locals>.<genexpr>#  s9       & &%&IaLL& & & & & &r   c              3  j   K   | ].\  }}t          j        |                              |          V  /d S r   )r  r  eq)rx  r  values      r   rz  z$LazyFrame._filter.<locals>.<genexpr>(  sK       
 
&1dEAE$KKNN5!!
 
 
 
 
 
r   z5at least one predicate or constraint must be providedr  r   N)r  r*   tupler.   r  r  r  r9   r/   anyr   rn   r   r   r  reprr   r  r%   r   r	  r  all_horizontalr  r   r   r   r   removefilter_pyexpr)r   r  r  r  all_predicatesboolean_masksr  is_seqerrr   combined_predicate	mask_exprfilter_methods                r   _filterzLazyFrame._filter  s    )+ 	 	AU

v
199V9T		f	!u**V*zz||###Q !HH  $777 $$RYq%@%@%@AAAA&q>>)>>A>>>>> 	
 #1bg.. $As++ 12T5H5H5J5J0J0J "!RY//!33333a 
 ?>>nn$%% & &*H*K*K& & &    
 	 
 
5@5F5F5H5H
 
 
 	
 	
 	
  	!- 	!ICC..  ~&&**  .11#A&&  	  	fT=99::I &- 	!33  %##DI...,2H	((	8H.@.H I IJJJr   TIntoExprColumn | Iterable[IntoExprColumn] | bool | list[bool] | np.ndarray[Any, Any]c                    |sd|rt          |          dk    r|d         du r|                                 S t          |          dk    r|d         du r|                                 S |                     ||d          S )u.  
        Filter rows in the LazyFrame based on a predicate expression.

        The original order of the remaining rows is preserved.

        Rows where the filter predicate does not evaluate to True are discarded
        (this includes rows where the predicate evaluates as `null`).

        Parameters
        ----------
        predicates
            Expression that evaluates to a boolean Series.
        constraints
            Column filters; use `name = value` to filter columns using the supplied
            value. Each constraint behaves the same as `pl.col(name).eq(value)`,
            and is implicitly joined with the other filter conditions using `&`.

        Notes
        -----
        If you are transitioning from Pandas, and performing filter operations based on
        the comparison of two or more columns, please note that in Polars any comparison
        involving `null` values will result in a `null` result, *not* boolean True or
        False. As a result, these rows will not be retained. Ensure that null values
        are handled appropriately to avoid unexpected behaviour (see examples below).

        See Also
        --------
        remove

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3, None, 4, None, 0],
        ...         "bar": [6, 7, 8, None, None, 9, 0],
        ...         "ham": ["a", "b", "c", None, "d", "e", "f"],
        ...     }
        ... )

        Filter on one condition:

        >>> lf.filter(pl.col("foo") > 1).collect()
        shape: (3, 3)
        ┌─────┬──────┬─────┐
        │ foo ┆ bar  ┆ ham │
        │ --- ┆ ---  ┆ --- │
        │ i64 ┆ i64  ┆ str │
        ╞═════╪══════╪═════╡
        │ 2   ┆ 7    ┆ b   │
        │ 3   ┆ 8    ┆ c   │
        │ 4   ┆ null ┆ d   │
        └─────┴──────┴─────┘

        Filter on multiple conditions:

        >>> lf.filter((pl.col("foo") < 3) & (pl.col("ham") == "a")).collect()
        shape: (1, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ i64 ┆ str │
        ╞═════╪═════╪═════╡
        │ 1   ┆ 6   ┆ a   │
        └─────┴─────┴─────┘

        Provide multiple filters using `*args` syntax:

        >>> lf.filter(
        ...     pl.col("foo") == 1,
        ...     pl.col("ham") == "a",
        ... ).collect()
        shape: (1, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ i64 ┆ str │
        ╞═════╪═════╪═════╡
        │ 1   ┆ 6   ┆ a   │
        └─────┴─────┴─────┘

        Provide multiple filters using `**kwargs` syntax:

        >>> lf.filter(foo=1, ham="a").collect()
        shape: (1, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ i64 ┆ str │
        ╞═════╪═════╪═════╡
        │ 1   ┆ 6   ┆ a   │
        └─────┴─────┴─────┘

        Filter on an OR condition:

        >>> lf.filter(
        ...     (pl.col("foo") == 1) | (pl.col("ham") == "c"),
        ... ).collect()
        shape: (2, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ i64 ┆ str │
        ╞═════╪═════╪═════╡
        │ 1   ┆ 6   ┆ a   │
        │ 3   ┆ 8   ┆ c   │
        └─────┴─────┴─────┘

        Filter by comparing two columns against each other

        >>> lf.filter(
        ...     pl.col("foo") == pl.col("bar"),
        ... ).collect()
        shape: (1, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ i64 ┆ str │
        ╞═════╪═════╪═════╡
        │ 0   ┆ 0   ┆ f   │
        └─────┴─────┴─────┘

        >>> lf.filter(
        ...     pl.col("foo") != pl.col("bar"),
        ... ).collect()
        shape: (3, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ i64 ┆ str │
        ╞═════╪═════╪═════╡
        │ 1   ┆ 6   ┆ a   │
        │ 2   ┆ 7   ┆ b   │
        │ 3   ┆ 8   ┆ c   │
        └─────┴─────┴─────┘

        Notice how the row with `None` values is filtered out; using `ne_missing`
        ensures that null values compare equal, and we get similar behaviour to Pandas:

        >>> lf.filter(
        ...     pl.col("foo").ne_missing(pl.col("bar")),
        ... ).collect()
        shape: (5, 3)
        ┌──────┬──────┬─────┐
        │ foo  ┆ bar  ┆ ham │
        │ ---  ┆ ---  ┆ --- │
        │ i64  ┆ i64  ┆ str │
        ╞══════╪══════╪═════╡
        │ 1    ┆ 6    ┆ a   │
        │ 2    ┆ 7    ┆ b   │
        │ 3    ┆ 8    ┆ c   │
        │ 4    ┆ null ┆ d   │
        │ null ┆ 9    ┆ e   │
        └──────┴──────┴─────┘
        r  r   TFr  r  r  )r	  r+  r  r  r   r  r  s      r   r  zLazyFrame.filterI  s    J  	$ $#j//Q"6"6:a=D;P;Pzz||#:!##
1(>(>zz||#||!#  
 
 	
r   c                    |sd|rt          |          dk    r|d         du r|                                 S t          |          dk    r|d         du r|                                 S |                     ||d          S )us  
        Remove rows, dropping those that match the given predicate expression(s).

        The original order of the remaining rows is preserved.

        Rows where the filter predicate does not evaluate to True are retained
        (this includes rows where the predicate evaluates as `null`).

        Parameters
        ----------
        predicates
            Expression that evaluates to a boolean Series.
        constraints
            Column filters; use `name = value` to filter columns using the supplied
            value. Each constraint behaves the same as `pl.col(name).eq(value)`,
            and is implicitly joined with the other filter conditions using `&`.

        Notes
        -----
        If you are transitioning from Pandas, and performing filter operations based on
        the comparison of two or more columns, please note that in Polars any comparison
        involving `null` values will result in a `null` result, *not* boolean True or
        False. As a result, these rows will not be removed. Ensure that null values
        are handled appropriately to avoid unexpected behaviour (see examples below).

        See Also
        --------
        filter

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [2, 3, None, 4, 0],
        ...         "bar": [5, 6, None, None, 0],
        ...         "ham": ["a", "b", None, "c", "d"],
        ...     }
        ... )

        Remove rows matching a condition:

        >>> lf.remove(
        ...     pl.col("bar") >= 5,
        ... ).collect()
        shape: (3, 3)
        ┌──────┬──────┬──────┐
        │ foo  ┆ bar  ┆ ham  │
        │ ---  ┆ ---  ┆ ---  │
        │ i64  ┆ i64  ┆ str  │
        ╞══════╪══════╪══════╡
        │ null ┆ null ┆ null │
        │ 4    ┆ null ┆ c    │
        │ 0    ┆ 0    ┆ d    │
        └──────┴──────┴──────┘

        Discard rows based on multiple conditions, combined with and/or operators:

        >>> lf.remove(
        ...     (pl.col("foo") >= 0) & (pl.col("bar") >= 0),
        ... ).collect()
        shape: (2, 3)
        ┌──────┬──────┬──────┐
        │ foo  ┆ bar  ┆ ham  │
        │ ---  ┆ ---  ┆ ---  │
        │ i64  ┆ i64  ┆ str  │
        ╞══════╪══════╪══════╡
        │ null ┆ null ┆ null │
        │ 4    ┆ null ┆ c    │
        └──────┴──────┴──────┘

        >>> lf.remove(
        ...     (pl.col("foo") >= 0) | (pl.col("bar") >= 0),
        ... ).collect()
        shape: (1, 3)
        ┌──────┬──────┬──────┐
        │ foo  ┆ bar  ┆ ham  │
        │ ---  ┆ ---  ┆ ---  │
        │ i64  ┆ i64  ┆ str  │
        ╞══════╪══════╪══════╡
        │ null ┆ null ┆ null │
        └──────┴──────┴──────┘

        Provide multiple constraints using `*args` syntax:

        >>> lf.remove(
        ...     pl.col("ham").is_not_null(),
        ...     pl.col("bar") >= 0,
        ... ).collect()
        shape: (2, 3)
        ┌──────┬──────┬──────┐
        │ foo  ┆ bar  ┆ ham  │
        │ ---  ┆ ---  ┆ ---  │
        │ i64  ┆ i64  ┆ str  │
        ╞══════╪══════╪══════╡
        │ null ┆ null ┆ null │
        │ 4    ┆ null ┆ c    │
        └──────┴──────┴──────┘

        Provide constraints(s) using `**kwargs` syntax:

        >>> lf.remove(foo=0, bar=0).collect()
        shape: (4, 3)
        ┌──────┬──────┬──────┐
        │ foo  ┆ bar  ┆ ham  │
        │ ---  ┆ ---  ┆ ---  │
        │ i64  ┆ i64  ┆ str  │
        ╞══════╪══════╪══════╡
        │ 2    ┆ 5    ┆ a    │
        │ 3    ┆ 6    ┆ b    │
        │ null ┆ null ┆ null │
        │ 4    ┆ null ┆ c    │
        └──────┴──────┴──────┘

        Remove rows by comparing two columns against each other; in this case, we
        remove rows where the two columns are not equal (using `ne_missing` to
        ensure that null values compare equal):

        >>> lf.remove(
        ...     pl.col("foo").ne_missing(pl.col("bar")),
        ... ).collect()
        shape: (2, 3)
        ┌──────┬──────┬──────┐
        │ foo  ┆ bar  ┆ ham  │
        │ ---  ┆ ---  ┆ ---  │
        │ i64  ┆ i64  ┆ str  │
        ╞══════╪══════╪══════╡
        │ null ┆ null ┆ null │
        │ 0    ┆ 0    ┆ d    │
        └──────┴──────┴──────┘
        r  r   TFr  )r	  r  r+  r  r  s      r   r  zLazyFrame.remove  s    Z  	$ $#j//Q"6"6:a=D;P;Pzz||#:!##
1(>(>zz||#||!#  
 
 	
r   exprsnamed_exprsc                    t          t          t          j                            dd                              }t          |i |d|i}|                     | j                            |                    S )u  
        Select columns from this LazyFrame.

        Parameters
        ----------
        *exprs
            Column(s) to select, specified as positional arguments.
            Accepts expression input. Strings are parsed as column names,
            other non-expression inputs are parsed as literals.
        **named_exprs
            Additional columns to select, specified as keyword arguments.
            The columns will be renamed to the keyword used.

        Examples
        --------
        Pass the name of a column to select that column.

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [6, 7, 8],
        ...         "ham": ["a", "b", "c"],
        ...     }
        ... )
        >>> lf.select("foo").collect()
        shape: (3, 1)
        ┌─────┐
        │ foo │
        │ --- │
        │ i64 │
        ╞═════╡
        │ 1   │
        │ 2   │
        │ 3   │
        └─────┘

        Multiple columns can be selected by passing a list of column names.

        >>> lf.select(["foo", "bar"]).collect()
        shape: (3, 2)
        ┌─────┬─────┐
        │ foo ┆ bar │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 6   │
        │ 2   ┆ 7   │
        │ 3   ┆ 8   │
        └─────┴─────┘

        Multiple columns can also be selected using positional arguments instead of a
        list. Expressions are also accepted.

        >>> lf.select(pl.col("foo"), pl.col("bar") + 1).collect()
        shape: (3, 2)
        ┌─────┬─────┐
        │ foo ┆ bar │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 7   │
        │ 2   ┆ 8   │
        │ 3   ┆ 9   │
        └─────┴─────┘

        Use keyword arguments to easily name your expression inputs.

        >>> lf.select(
        ...     threshold=pl.when(pl.col("foo") > 2).then(10).otherwise(0)
        ... ).collect()
        shape: (3, 1)
        ┌───────────┐
        │ threshold │
        │ ---       │
        │ i32       │
        ╞═══════════╡
        │ 0         │
        │ 0         │
        │ 10        │
        └───────────┘

        Expressions with multiple outputs can be automatically instantiated as Structs
        by enabling the setting `Config.set_auto_structify(True)`:

        >>> with pl.Config(auto_structify=True):
        ...     lf.select(
        ...         is_odd=(pl.col(pl.Int64) % 2 == 1).name.suffix("_is_odd"),
        ...     ).collect()
        shape: (3, 1)
        ┌──────────────┐
        │ is_odd       │
        │ ---          │
        │ struct[2]    │
        ╞══════════════╡
        │ {true,false} │
        │ {false,true} │
        │ {true,false} │
        └──────────────┘
        POLARS_AUTO_STRUCTIFYr   __structify)	r   r  osenvironr!  r%   r   r   r  r   r  r  	structifypyexprss        r   r  zLazyFrame.select  s}    L RZ^^,CQGGHHII	0
!
 
/8
 
 
 	 0 0 9 9:::r   c                    t          t          t          j                            dd                              }t          |i |d|i}|                     | j                            |                    S )a  
        Select columns from this LazyFrame.

        This will run all expression sequentially instead of in parallel.
        Use this when the work per expression is cheap.

        Parameters
        ----------
        *exprs
            Column(s) to select, specified as positional arguments.
            Accepts expression input. Strings are parsed as column names,
            other non-expression inputs are parsed as literals.
        **named_exprs
            Additional columns to select, specified as keyword arguments.
            The columns will be renamed to the keyword used.

        See Also
        --------
        select
        r  r   r  )	r   r  r  r  r!  r%   r   r   
select_seqr  s        r   r  zLazyFrame.select_seq  s|    . RZ^^,CQGGHHII	0
!
 
/8
 
 
 	 4 4W = =>>>r   )r  named_byrZ   c               D   |                                 D ]V}t          |t          t          j        t          j        f          s(dt          |           d|d|d}t          |          Wt          |i |}| j	        
                    ||          }t          |          S )u  
        Start a group by operation.

        Parameters
        ----------
        *by
            Column(s) to group by. Accepts expression input. Strings are parsed as
            column names.
        maintain_order
            Ensure that the order of the groups is consistent with the input data.
            This is slower than a default group by.
            Setting this to `True` blocks the possibility
            to run on the streaming engine.
        **named_by
            Additional columns to group by, specified as keyword arguments.
            The columns will be renamed to the keyword used.

        Examples
        --------
        Group by one column and call `agg` to compute the grouped sum of another
        column.

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["a", "b", "a", "b", "c"],
        ...         "b": [1, 2, 1, 3, 3],
        ...         "c": [5, 4, 3, 2, 1],
        ...     }
        ... )
        >>> lf.group_by("a").agg(pl.col("b").sum()).collect()  # doctest: +IGNORE_RESULT
        shape: (3, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ str ┆ i64 │
        ╞═════╪═════╡
        │ a   ┆ 2   │
        │ b   ┆ 5   │
        │ c   ┆ 3   │
        └─────┴─────┘

        Set `maintain_order=True` to ensure the order of the groups is consistent with
        the input.

        >>> lf.group_by("a", maintain_order=True).agg(pl.col("c")).collect()
        shape: (3, 2)
        ┌─────┬───────────┐
        │ a   ┆ c         │
        │ --- ┆ ---       │
        │ str ┆ list[i64] │
        ╞═════╪═══════════╡
        │ a   ┆ [5, 3]    │
        │ b   ┆ [4, 2]    │
        │ c   ┆ [1]       │
        └─────┴───────────┘

        Group by multiple columns by passing a list of column names.

        >>> lf.group_by(["a", "b"]).agg(pl.max("c")).collect()  # doctest: +SKIP
        shape: (4, 3)
        ┌─────┬─────┬─────┐
        │ a   ┆ b   ┆ c   │
        │ --- ┆ --- ┆ --- │
        │ str ┆ i64 ┆ i64 │
        ╞═════╪═════╪═════╡
        │ a   ┆ 1   ┆ 5   │
        │ b   ┆ 2   ┆ 4   │
        │ b   ┆ 3   ┆ 2   │
        │ c   ┆ 3   ┆ 1   │
        └─────┴─────┴─────┘

        Or use positional arguments to group by multiple columns in the same way.
        Expressions are also accepted.

        >>> lf.group_by("a", pl.col("b") // 2).agg(
        ...     pl.col("c").mean()
        ... ).collect()  # doctest: +SKIP
        shape: (3, 3)
        ┌─────┬─────┬─────┐
        │ a   ┆ b   ┆ c   │
        │ --- ┆ --- ┆ --- │
        │ str ┆ i64 ┆ f64 │
        ╞═════╪═════╪═════╡
        │ a   ┆ 0   ┆ 4.0 │
        │ b   ┆ 1   ┆ 3.0 │
        │ c   ┆ 1   ┆ 1.0 │
        └─────┴─────┴─────┘
        z=Expected Polars expression or object convertible to one, got z&.

Hint: if you tried
    group_by(by=z;)
then you probably want to use this instead:
    group_by(r  )valuesr   r   r  rn   r  ru  r   r%   r   group_byrZ   )r   r  r  r  r  r   r  lgbs           r   r  zLazyFrame.group_by   s    | __&& 		% 		%Eec27BI%>?? %/TXY^T_T_ / /',/ / %*	/ / /   nn$% /?h??i  773r   r  z0.20.14right)offsetclosedr  index_columnperiodstr | timedeltar  str | timedelta | Noner  rp   $IntoExpr | Iterable[IntoExpr] | Nonec                  t          |          }|t          t          |                    }|t          |          ng }t          |          }t          |          }| j                            |||||          }t          |          S )u  
        Create rolling groups based on a temporal or integer column.

        Different from a `group_by_dynamic` the windows are now determined by the
        individual values and are not of constant intervals. For constant intervals
        use :func:`LazyFrame.group_by_dynamic`.

        If you have a time series `<t_0, t_1, ..., t_n>`, then by default the
        windows created will be

            * (t_0 - period, t_0]
            * (t_1 - period, t_1]
            * ...
            * (t_n - period, t_n]

        whereas if you pass a non-default `offset`, then the windows will be

            * (t_0 + offset, t_0 + offset + period]
            * (t_1 + offset, t_1 + offset + period]
            * ...
            * (t_n + offset, t_n + offset + period]

        The `period` and `offset` arguments are created either from a timedelta, or
        by using the following string language:

        - 1ns   (1 nanosecond)
        - 1us   (1 microsecond)
        - 1ms   (1 millisecond)
        - 1s    (1 second)
        - 1m    (1 minute)
        - 1h    (1 hour)
        - 1d    (1 calendar day)
        - 1w    (1 calendar week)
        - 1mo   (1 calendar month)
        - 1q    (1 calendar quarter)
        - 1y    (1 calendar year)
        - 1i    (1 index count)

        Or combine them:
        "3d12h4m25s" # 3 days, 12 hours, 4 minutes, and 25 seconds

        By "calendar day", we mean the corresponding time on the next day (which may
        not be 24 hours, due to daylight savings). Similarly for "calendar week",
        "calendar month", "calendar quarter", and "calendar year".

        .. versionchanged:: 0.20.14
            The `by` parameter was renamed `group_by`.

        Parameters
        ----------
        index_column
            Column used to group based on the time window.
            Often of type Date/Datetime.
            This column must be sorted in ascending order (or, if `group_by` is
            specified, then it must be sorted in ascending order within each group).

            In case of a rolling group by on indices, dtype needs to be one of
            {UInt32, UInt64, Int32, Int64}. Note that the first three get temporarily
            cast to Int64, so if performance matters use an Int64 column.
        period
            Length of the window - must be non-negative.
        offset
            Offset of the window. Default is `-period`.
        closed : {'right', 'left', 'both', 'none'}
            Define which sides of the temporal interval are closed (inclusive).
        group_by
            Also group by this column/these columns

        Returns
        -------
        LazyGroupBy
            Object you can call `.agg` on to aggregate by groups, the result
            of which will be sorted by `index_column` (but note that if `group_by`
            columns are passed, it will only be sorted within each group).

        See Also
        --------
        group_by_dynamic

        Examples
        --------
        >>> dates = [
        ...     "2020-01-01 13:45:48",
        ...     "2020-01-01 16:42:13",
        ...     "2020-01-01 16:45:09",
        ...     "2020-01-02 18:12:48",
        ...     "2020-01-03 19:45:32",
        ...     "2020-01-08 23:16:43",
        ... ]
        >>> df = pl.LazyFrame({"dt": dates, "a": [3, 7, 5, 9, 2, 1]}).with_columns(
        ...     pl.col("dt").str.strptime(pl.Datetime).set_sorted()
        ... )
        >>> out = (
        ...     df.rolling(index_column="dt", period="2d")
        ...     .agg(
        ...         pl.sum("a").alias("sum_a"),
        ...         pl.min("a").alias("min_a"),
        ...         pl.max("a").alias("max_a"),
        ...     )
        ...     .collect()
        ... )
        >>> out
        shape: (6, 4)
        ┌─────────────────────┬───────┬───────┬───────┐
        │ dt                  ┆ sum_a ┆ min_a ┆ max_a │
        │ ---                 ┆ ---   ┆ ---   ┆ ---   │
        │ datetime[μs]        ┆ i64   ┆ i64   ┆ i64   │
        ╞═════════════════════╪═══════╪═══════╪═══════╡
        │ 2020-01-01 13:45:48 ┆ 3     ┆ 3     ┆ 3     │
        │ 2020-01-01 16:42:13 ┆ 10    ┆ 3     ┆ 7     │
        │ 2020-01-01 16:45:09 ┆ 15    ┆ 3     ┆ 7     │
        │ 2020-01-02 18:12:48 ┆ 24    ┆ 3     ┆ 9     │
        │ 2020-01-03 19:45:32 ┆ 11    ┆ 2     ┆ 9     │
        │ 2020-01-08 23:16:43 ┆ 1     ┆ 1     ┆ 1     │
        └─────────────────────┴───────┴───────┴───────┘
        )r$   r   r   r%   r   rollingrZ   )r   r  r  r  r  r  
pyexprs_byr  s           r   r  zLazyFrame.rolling  s    | -\::>+,DV,L,LMMF 9A8L*8444RT 	 *&11)&11ifffjQQ3r   r  window)r  r  include_boundariesr  labelr  start_byeveryr  r  r|   r  r   c                  t          |          }|d}||}t          |          }t          |          }t          |          }|t          |          ng }
| j                            ||||||||
|		  	        }t          |          S )u=  
        Group based on a time value (or index value of type Int32, Int64).

        Time windows are calculated and rows are assigned to windows. Different from a
        normal group by is that a row can be member of multiple groups.
        By default, the windows look like:

        - [start, start + period)
        - [start + every, start + every + period)
        - [start + 2*every, start + 2*every + period)
        - ...

        where `start` is determined by `start_by`, `offset`, `every`, and the earliest
        datapoint. See the `start_by` argument description for details.

        .. warning::
            The index column must be sorted in ascending order. If `group_by` is passed, then
            the index column must be sorted in ascending order within each group.

        .. versionchanged:: 0.20.14
            The `by` parameter was renamed `group_by`.

        Parameters
        ----------
        index_column
            Column used to group based on the time window.
            Often of type Date/Datetime.
            This column must be sorted in ascending order (or, if `group_by` is specified,
            then it must be sorted in ascending order within each group).

            In case of a dynamic group by on indices, dtype needs to be one of
            {Int32, Int64}. Note that Int32 gets temporarily cast to Int64, so if
            performance matters use an Int64 column.
        every
            interval of the window
        period
            length of the window, if None it will equal 'every'
        offset
            offset of the window, does not take effect if `start_by` is 'datapoint'.
            Defaults to zero.
        include_boundaries
            Add the lower and upper bound of the window to the "_lower_boundary" and
            "_upper_boundary" columns. This will impact performance because it's harder to
            parallelize
        closed : {'left', 'right', 'both', 'none'}
            Define which sides of the temporal interval are closed (inclusive).
        label : {'left', 'right', 'datapoint'}
            Define which label to use for the window:

            - 'left': lower boundary of the window
            - 'right': upper boundary of the window
            - 'datapoint': the first value of the index column in the given window.
              If you don't need the label to be at one of the boundaries, choose this
              option for maximum performance
        group_by
            Also group by this column/these columns
        start_by : {'window', 'datapoint', 'monday', 'tuesday', 'wednesday', 'thursday', 'friday', 'saturday', 'sunday'}
            The strategy to determine the start of the first window by.

            * 'window': Start by taking the earliest timestamp, truncating it with
              `every`, and then adding `offset`.
              Note that weekly windows start on Monday.
            * 'datapoint': Start from the first encountered data point.
            * a day of the week (only takes effect if `every` contains `'w'`):

              * 'monday': Start the window on the Monday before the first data point.
              * 'tuesday': Start the window on the Tuesday before the first data point.
              * ...
              * 'sunday': Start the window on the Sunday before the first data point.

              The resulting window is then shifted back until the earliest datapoint
              is in or in front of it.

        Returns
        -------
        LazyGroupBy
            Object you can call `.agg` on to aggregate by groups, the result
            of which will be sorted by `index_column` (but note that if `group_by` columns are
            passed, it will only be sorted within each group).

        See Also
        --------
        rolling

        Notes
        -----
        1) If you're coming from pandas, then

           .. code-block:: python

               # polars
               df.group_by_dynamic("ts", every="1d").agg(pl.col("value").sum())

           is equivalent to

           .. code-block:: python

               # pandas
               df.set_index("ts").resample("D")["value"].sum().reset_index()

           though note that, unlike pandas, polars doesn't add extra rows for empty
           windows. If you need `index_column` to be evenly spaced, then please combine
           with :func:`DataFrame.upsample`.

        2) The `every`, `period` and `offset` arguments are created with
           the following string language:

           - 1ns   (1 nanosecond)
           - 1us   (1 microsecond)
           - 1ms   (1 millisecond)
           - 1s    (1 second)
           - 1m    (1 minute)
           - 1h    (1 hour)
           - 1d    (1 calendar day)
           - 1w    (1 calendar week)
           - 1mo   (1 calendar month)
           - 1q    (1 calendar quarter)
           - 1y    (1 calendar year)
           - 1i    (1 index count)

           Or combine them:
           "3d12h4m25s" # 3 days, 12 hours, 4 minutes, and 25 seconds

           By "calendar day", we mean the corresponding time on the next day (which may
           not be 24 hours, due to daylight savings). Similarly for "calendar week",
           "calendar month", "calendar quarter", and "calendar year".

           In case of a group_by_dynamic on an integer column, the windows are defined by:

           - "1i"      # length 1
           - "10i"     # length 10

        Examples
        --------
        >>> from datetime import datetime
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "time": pl.datetime_range(
        ...             start=datetime(2021, 12, 16),
        ...             end=datetime(2021, 12, 16, 3),
        ...             interval="30m",
        ...             eager=True,
        ...         ),
        ...         "n": range(7),
        ...     }
        ... )
        >>> lf.collect()
        shape: (7, 2)
        ┌─────────────────────┬─────┐
        │ time                ┆ n   │
        │ ---                 ┆ --- │
        │ datetime[μs]        ┆ i64 │
        ╞═════════════════════╪═════╡
        │ 2021-12-16 00:00:00 ┆ 0   │
        │ 2021-12-16 00:30:00 ┆ 1   │
        │ 2021-12-16 01:00:00 ┆ 2   │
        │ 2021-12-16 01:30:00 ┆ 3   │
        │ 2021-12-16 02:00:00 ┆ 4   │
        │ 2021-12-16 02:30:00 ┆ 5   │
        │ 2021-12-16 03:00:00 ┆ 6   │
        └─────────────────────┴─────┘

        Group by windows of 1 hour.

        >>> lf.group_by_dynamic("time", every="1h", closed="right").agg(
        ...     pl.col("n")
        ... ).collect()
        shape: (4, 2)
        ┌─────────────────────┬───────────┐
        │ time                ┆ n         │
        │ ---                 ┆ ---       │
        │ datetime[μs]        ┆ list[i64] │
        ╞═════════════════════╪═══════════╡
        │ 2021-12-15 23:00:00 ┆ [0]       │
        │ 2021-12-16 00:00:00 ┆ [1, 2]    │
        │ 2021-12-16 01:00:00 ┆ [3, 4]    │
        │ 2021-12-16 02:00:00 ┆ [5, 6]    │
        └─────────────────────┴───────────┘

        The window boundaries can also be added to the aggregation result

        >>> lf.group_by_dynamic(
        ...     "time", every="1h", include_boundaries=True, closed="right"
        ... ).agg(pl.col("n").mean()).collect()
        shape: (4, 4)
        ┌─────────────────────┬─────────────────────┬─────────────────────┬─────┐
        │ _lower_boundary     ┆ _upper_boundary     ┆ time                ┆ n   │
        │ ---                 ┆ ---                 ┆ ---                 ┆ --- │
        │ datetime[μs]        ┆ datetime[μs]        ┆ datetime[μs]        ┆ f64 │
        ╞═════════════════════╪═════════════════════╪═════════════════════╪═════╡
        │ 2021-12-15 23:00:00 ┆ 2021-12-16 00:00:00 ┆ 2021-12-15 23:00:00 ┆ 0.0 │
        │ 2021-12-16 00:00:00 ┆ 2021-12-16 01:00:00 ┆ 2021-12-16 00:00:00 ┆ 1.5 │
        │ 2021-12-16 01:00:00 ┆ 2021-12-16 02:00:00 ┆ 2021-12-16 01:00:00 ┆ 3.5 │
        │ 2021-12-16 02:00:00 ┆ 2021-12-16 03:00:00 ┆ 2021-12-16 02:00:00 ┆ 5.5 │
        └─────────────────────┴─────────────────────┴─────────────────────┴─────┘

        When closed="left", the window excludes the right end of interval:
        [lower_bound, upper_bound)

        >>> lf.group_by_dynamic("time", every="1h", closed="left").agg(
        ...     pl.col("n")
        ... ).collect()
        shape: (4, 2)
        ┌─────────────────────┬───────────┐
        │ time                ┆ n         │
        │ ---                 ┆ ---       │
        │ datetime[μs]        ┆ list[i64] │
        ╞═════════════════════╪═══════════╡
        │ 2021-12-16 00:00:00 ┆ [0, 1]    │
        │ 2021-12-16 01:00:00 ┆ [2, 3]    │
        │ 2021-12-16 02:00:00 ┆ [4, 5]    │
        │ 2021-12-16 03:00:00 ┆ [6]       │
        └─────────────────────┴───────────┘

        When closed="both" the time values at the window boundaries belong to 2 groups.

        >>> lf.group_by_dynamic("time", every="1h", closed="both").agg(
        ...     pl.col("n")
        ... ).collect()
        shape: (4, 2)
        ┌─────────────────────┬───────────┐
        │ time                ┆ n         │
        │ ---                 ┆ ---       │
        │ datetime[μs]        ┆ list[i64] │
        ╞═════════════════════╪═══════════╡
        │ 2021-12-16 00:00:00 ┆ [0, 1, 2] │
        │ 2021-12-16 01:00:00 ┆ [2, 3, 4] │
        │ 2021-12-16 02:00:00 ┆ [4, 5, 6] │
        │ 2021-12-16 03:00:00 ┆ [6]       │
        └─────────────────────┴───────────┘

        Dynamic group bys can also be combined with grouping on normal keys

        >>> lf = lf.with_columns(groups=pl.Series(["a", "a", "a", "b", "b", "a", "a"]))
        >>> lf.collect()
        shape: (7, 3)
        ┌─────────────────────┬─────┬────────┐
        │ time                ┆ n   ┆ groups │
        │ ---                 ┆ --- ┆ ---    │
        │ datetime[μs]        ┆ i64 ┆ str    │
        ╞═════════════════════╪═════╪════════╡
        │ 2021-12-16 00:00:00 ┆ 0   ┆ a      │
        │ 2021-12-16 00:30:00 ┆ 1   ┆ a      │
        │ 2021-12-16 01:00:00 ┆ 2   ┆ a      │
        │ 2021-12-16 01:30:00 ┆ 3   ┆ b      │
        │ 2021-12-16 02:00:00 ┆ 4   ┆ b      │
        │ 2021-12-16 02:30:00 ┆ 5   ┆ a      │
        │ 2021-12-16 03:00:00 ┆ 6   ┆ a      │
        └─────────────────────┴─────┴────────┘
        >>> lf.group_by_dynamic(
        ...     "time",
        ...     every="1h",
        ...     closed="both",
        ...     group_by="groups",
        ...     include_boundaries=True,
        ... ).agg(pl.col("n")).collect()
        shape: (6, 5)
        ┌────────┬─────────────────────┬─────────────────────┬─────────────────────┬───────────┐
        │ groups ┆ _lower_boundary     ┆ _upper_boundary     ┆ time                ┆ n         │
        │ ---    ┆ ---                 ┆ ---                 ┆ ---                 ┆ ---       │
        │ str    ┆ datetime[μs]        ┆ datetime[μs]        ┆ datetime[μs]        ┆ list[i64] │
        ╞════════╪═════════════════════╪═════════════════════╪═════════════════════╪═══════════╡
        │ a      ┆ 2021-12-16 00:00:00 ┆ 2021-12-16 01:00:00 ┆ 2021-12-16 00:00:00 ┆ [0, 1, 2] │
        │ a      ┆ 2021-12-16 01:00:00 ┆ 2021-12-16 02:00:00 ┆ 2021-12-16 01:00:00 ┆ [2]       │
        │ a      ┆ 2021-12-16 02:00:00 ┆ 2021-12-16 03:00:00 ┆ 2021-12-16 02:00:00 ┆ [5, 6]    │
        │ a      ┆ 2021-12-16 03:00:00 ┆ 2021-12-16 04:00:00 ┆ 2021-12-16 03:00:00 ┆ [6]       │
        │ b      ┆ 2021-12-16 01:00:00 ┆ 2021-12-16 02:00:00 ┆ 2021-12-16 01:00:00 ┆ [3, 4]    │
        │ b      ┆ 2021-12-16 02:00:00 ┆ 2021-12-16 03:00:00 ┆ 2021-12-16 02:00:00 ┆ [4]       │
        └────────┴─────────────────────┴─────────────────────┴─────────────────────┴───────────┘

        Dynamic group by on an index column

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "idx": pl.int_range(0, 6, eager=True),
        ...         "A": ["A", "A", "B", "B", "B", "C"],
        ...     }
        ... )
        >>> lf.group_by_dynamic(
        ...     "idx",
        ...     every="2i",
        ...     period="3i",
        ...     include_boundaries=True,
        ...     closed="right",
        ... ).agg(pl.col("A").alias("A_agg_list")).collect()
        shape: (4, 4)
        ┌─────────────────┬─────────────────┬─────┬─────────────────┐
        │ _lower_boundary ┆ _upper_boundary ┆ idx ┆ A_agg_list      │
        │ ---             ┆ ---             ┆ --- ┆ ---             │
        │ i64             ┆ i64             ┆ i64 ┆ list[str]       │
        ╞═════════════════╪═════════════════╪═════╪═════════════════╡
        │ -2              ┆ 1               ┆ -2  ┆ ["A", "A"]      │
        │ 0               ┆ 3               ┆ 0   ┆ ["A", "B", "B"] │
        │ 2               ┆ 5               ┆ 2   ┆ ["B", "B", "C"] │
        │ 4               ┆ 7               ┆ 4   ┆ ["C"]           │
        └─────────────────┴─────────────────┴─────┴─────────────────┘
        N0ns)r$   r   r%   r   group_by_dynamicrZ   )r   r  r  r  r  r  r  r  r  r  r  r  s               r   r  zLazyFrame.group_by_dynamic  s    n	 -\::>F>F)&11)&11(// 9A8L*8444RT 	 i((

 

 3r   backward_right)left_onright_ononby_leftby_rightr  strategysuffix	toleranceallow_parallelforce_parallelcoalesceallow_exact_matchescheck_sortednessr  str | None | Exprr  r  r  str | Sequence[str] | Noner  r  ro   r  r	  $str | int | float | timedelta | Noner
  r  r  r  r  c                   t          | |           t          |t          t          j        f          r|}|}||d}t          |          |t          |t                    r|gn|}|}n=||5t          |t                    r|gn|}t          |t                    r|gn|}nd}d}d}d}t          |
t                    r|
}n't          |
t                    rt          |
          }n|
}t          |t          j                  st          j	        |          }t          |t          j                  st          j	        |          }| 
                    | j                            |j        |j        |j        |||||	||||||                    S )u/9  
        Perform an asof join.

        This is similar to a left-join except that we match on nearest key rather than
        equal keys.

        Both DataFrames must be sorted by the `on` key (within each `by` group, if
        specified).

        For each row in the left DataFrame:

          - A "backward" search selects the last row in the right DataFrame whose
            'on' key is less than or equal to the left's key.

          - A "forward" search selects the first row in the right DataFrame whose
            'on' key is greater than or equal to the left's key.

            A "nearest" search selects the last row in the right DataFrame whose value
            is nearest to the left's key. String keys are not currently supported for a
            nearest search.

        The default is "backward".

        Parameters
        ----------
        other
            Lazy DataFrame to join with.
        left_on
            Join column of the left DataFrame.
        right_on
            Join column of the right DataFrame.
        on
            Join column of both DataFrames. If set, `left_on` and `right_on` should be
            None.
        by
            Join on these columns before doing asof join.
        by_left
            Join on these columns before doing asof join.
        by_right
            Join on these columns before doing asof join.
        strategy : {'backward', 'forward', 'nearest'}
            Join strategy.
        suffix
            Suffix to append to columns with a duplicate name.
        tolerance
            Numeric tolerance. By setting this the join will only be done if the near
            keys are within this distance. If an asof join is done on columns of dtype
            "Date", "Datetime", "Duration" or "Time", use either a datetime.timedelta
            object or the following string language:

                - 1ns   (1 nanosecond)
                - 1us   (1 microsecond)
                - 1ms   (1 millisecond)
                - 1s    (1 second)
                - 1m    (1 minute)
                - 1h    (1 hour)
                - 1d    (1 calendar day)
                - 1w    (1 calendar week)
                - 1mo   (1 calendar month)
                - 1q    (1 calendar quarter)
                - 1y    (1 calendar year)

                Or combine them:
                "3d12h4m25s" # 3 days, 12 hours, 4 minutes, and 25 seconds

                By "calendar day", we mean the corresponding time on the next day
                (which may not be 24 hours, due to daylight savings). Similarly for
                "calendar week", "calendar month", "calendar quarter", and
                "calendar year".

        allow_parallel
            Allow the physical plan to optionally evaluate the computation of both
            DataFrames up to the join in parallel.
        force_parallel
            Force the physical plan to evaluate the computation of both DataFrames up to
            the join in parallel.
        coalesce
            Coalescing behavior (merging of `on` / `left_on` / `right_on` columns):

            - True: -> Always coalesce join columns.
            - False: -> Never coalesce join columns.

            Note that joining on any other expressions than `col`
            will turn off coalescing.
        allow_exact_matches
            Whether exact matches are valid join predicates.

            - If True, allow matching with the same ``on`` value
                (i.e. less-than-or-equal-to / greater-than-or-equal-to)
            - If False, don't match the same ``on`` value
                (i.e., strictly less-than / strictly greater-than).
        check_sortedness
            Check the sortedness of the asof keys. If the keys are not sorted Polars
            will error. Currently, sortedness cannot be checked if 'by' groups are
            provided.


        Examples
        --------
        >>> from datetime import date
        >>> gdp = pl.LazyFrame(
        ...     {
        ...         "date": pl.date_range(
        ...             date(2016, 1, 1),
        ...             date(2020, 1, 1),
        ...             "1y",
        ...             eager=True,
        ...         ),
        ...         "gdp": [4164, 4411, 4566, 4696, 4827],
        ...     }
        ... )
        >>> gdp.collect()
        shape: (5, 2)
        ┌────────────┬──────┐
        │ date       ┆ gdp  │
        │ ---        ┆ ---  │
        │ date       ┆ i64  │
        ╞════════════╪══════╡
        │ 2016-01-01 ┆ 4164 │
        │ 2017-01-01 ┆ 4411 │
        │ 2018-01-01 ┆ 4566 │
        │ 2019-01-01 ┆ 4696 │
        │ 2020-01-01 ┆ 4827 │
        └────────────┴──────┘

        >>> population = pl.LazyFrame(
        ...     {
        ...         "date": [date(2016, 3, 1), date(2018, 8, 1), date(2019, 1, 1)],
        ...         "population": [82.19, 82.66, 83.12],
        ...     }
        ... ).sort("date")
        >>> population.collect()
        shape: (3, 2)
        ┌────────────┬────────────┐
        │ date       ┆ population │
        │ ---        ┆ ---        │
        │ date       ┆ f64        │
        ╞════════════╪════════════╡
        │ 2016-03-01 ┆ 82.19      │
        │ 2018-08-01 ┆ 82.66      │
        │ 2019-01-01 ┆ 83.12      │
        └────────────┴────────────┘

        Note how the dates don't quite match. If we join them using `join_asof` and
        `strategy='backward'`, then each date from `population` which doesn't have an
        exact match is matched with the closest earlier date from `gdp`:

        >>> population.join_asof(gdp, on="date", strategy="backward").collect()
        shape: (3, 3)
        ┌────────────┬────────────┬──────┐
        │ date       ┆ population ┆ gdp  │
        │ ---        ┆ ---        ┆ ---  │
        │ date       ┆ f64        ┆ i64  │
        ╞════════════╪════════════╪══════╡
        │ 2016-03-01 ┆ 82.19      ┆ 4164 │
        │ 2018-08-01 ┆ 82.66      ┆ 4566 │
        │ 2019-01-01 ┆ 83.12      ┆ 4696 │
        └────────────┴────────────┴──────┘

        Note how:

        - date `2016-03-01` from `population` is matched with `2016-01-01` from `gdp`;
        - date `2018-08-01` from `population` is matched with `2018-01-01` from `gdp`.

        You can verify this by passing `coalesce=False`:

        >>> population.join_asof(
        ...     gdp, on="date", strategy="backward", coalesce=False
        ... ).collect()
        shape: (3, 4)
        ┌────────────┬────────────┬────────────┬──────┐
        │ date       ┆ population ┆ date_right ┆ gdp  │
        │ ---        ┆ ---        ┆ ---        ┆ ---  │
        │ date       ┆ f64        ┆ date       ┆ i64  │
        ╞════════════╪════════════╪════════════╪══════╡
        │ 2016-03-01 ┆ 82.19      ┆ 2016-01-01 ┆ 4164 │
        │ 2018-08-01 ┆ 82.66      ┆ 2018-01-01 ┆ 4566 │
        │ 2019-01-01 ┆ 83.12      ┆ 2019-01-01 ┆ 4696 │
        └────────────┴────────────┴────────────┴──────┘

        If we instead use `strategy='forward'`, then each date from `population` which
        doesn't have an exact match is matched with the closest later date from `gdp`:

        >>> population.join_asof(gdp, on="date", strategy="forward").collect()
        shape: (3, 3)
        ┌────────────┬────────────┬──────┐
        │ date       ┆ population ┆ gdp  │
        │ ---        ┆ ---        ┆ ---  │
        │ date       ┆ f64        ┆ i64  │
        ╞════════════╪════════════╪══════╡
        │ 2016-03-01 ┆ 82.19      ┆ 4411 │
        │ 2018-08-01 ┆ 82.66      ┆ 4696 │
        │ 2019-01-01 ┆ 83.12      ┆ 4696 │
        └────────────┴────────────┴──────┘

        Note how:

        - date `2016-03-01` from `population` is matched with `2017-01-01` from `gdp`;
        - date `2018-08-01` from `population` is matched with `2019-01-01` from `gdp`.

        Finally, `strategy='nearest'` gives us a mix of the two results above, as each
        date from `population` which doesn't have an exact match is matched with the
        closest date from `gdp`, regardless of whether it's earlier or later:

        >>> population.join_asof(gdp, on="date", strategy="nearest").collect()
        shape: (3, 3)
        ┌────────────┬────────────┬──────┐
        │ date       ┆ population ┆ gdp  │
        │ ---        ┆ ---        ┆ ---  │
        │ date       ┆ f64        ┆ i64  │
        ╞════════════╪════════════╪══════╡
        │ 2016-03-01 ┆ 82.19      ┆ 4164 │
        │ 2018-08-01 ┆ 82.66      ┆ 4696 │
        │ 2019-01-01 ┆ 83.12      ┆ 4696 │
        └────────────┴────────────┴──────┘

        Note how:

        - date `2016-03-01` from `population` is matched with `2016-01-01` from `gdp`;
        - date `2018-08-01` from `population` is matched with `2019-01-01` from `gdp`.

        They `by` argument allows joining on another column first, before the asof join.
        In this example we join by `country` first, then asof join by date, as above.

        >>> gdp_dates = pl.date_range(  # fmt: skip
        ...     date(2016, 1, 1), date(2020, 1, 1), "1y", eager=True
        ... )
        >>> gdp2 = pl.LazyFrame(
        ...     {
        ...         "country": ["Germany"] * 5 + ["Netherlands"] * 5,
        ...         "date": pl.concat([gdp_dates, gdp_dates]),
        ...         "gdp": [4164, 4411, 4566, 4696, 4827, 784, 833, 914, 910, 909],
        ...     }
        ... ).sort("country", "date")
        >>>
        >>> gdp2.collect()
        shape: (10, 3)
        ┌─────────────┬────────────┬──────┐
        │ country     ┆ date       ┆ gdp  │
        │ ---         ┆ ---        ┆ ---  │
        │ str         ┆ date       ┆ i64  │
        ╞═════════════╪════════════╪══════╡
        │ Germany     ┆ 2016-01-01 ┆ 4164 │
        │ Germany     ┆ 2017-01-01 ┆ 4411 │
        │ Germany     ┆ 2018-01-01 ┆ 4566 │
        │ Germany     ┆ 2019-01-01 ┆ 4696 │
        │ Germany     ┆ 2020-01-01 ┆ 4827 │
        │ Netherlands ┆ 2016-01-01 ┆ 784  │
        │ Netherlands ┆ 2017-01-01 ┆ 833  │
        │ Netherlands ┆ 2018-01-01 ┆ 914  │
        │ Netherlands ┆ 2019-01-01 ┆ 910  │
        │ Netherlands ┆ 2020-01-01 ┆ 909  │
        └─────────────┴────────────┴──────┘
        >>> pop2 = pl.LazyFrame(
        ...     {
        ...         "country": ["Germany"] * 3 + ["Netherlands"] * 3,
        ...         "date": [
        ...             date(2016, 3, 1),
        ...             date(2018, 8, 1),
        ...             date(2019, 1, 1),
        ...             date(2016, 3, 1),
        ...             date(2018, 8, 1),
        ...             date(2019, 1, 1),
        ...         ],
        ...         "population": [82.19, 82.66, 83.12, 17.11, 17.32, 17.40],
        ...     }
        ... ).sort("country", "date")
        >>>
        >>> pop2.collect()
        shape: (6, 3)
        ┌─────────────┬────────────┬────────────┐
        │ country     ┆ date       ┆ population │
        │ ---         ┆ ---        ┆ ---        │
        │ str         ┆ date       ┆ f64        │
        ╞═════════════╪════════════╪════════════╡
        │ Germany     ┆ 2016-03-01 ┆ 82.19      │
        │ Germany     ┆ 2018-08-01 ┆ 82.66      │
        │ Germany     ┆ 2019-01-01 ┆ 83.12      │
        │ Netherlands ┆ 2016-03-01 ┆ 17.11      │
        │ Netherlands ┆ 2018-08-01 ┆ 17.32      │
        │ Netherlands ┆ 2019-01-01 ┆ 17.4       │
        └─────────────┴────────────┴────────────┘
        >>> pop2.join_asof(gdp2, by="country", on="date", strategy="nearest").collect()
        shape: (6, 4)
        ┌─────────────┬────────────┬────────────┬──────┐
        │ country     ┆ date       ┆ population ┆ gdp  │
        │ ---         ┆ ---        ┆ ---        ┆ ---  │
        │ str         ┆ date       ┆ f64        ┆ i64  │
        ╞═════════════╪════════════╪════════════╪══════╡
        │ Germany     ┆ 2016-03-01 ┆ 82.19      ┆ 4164 │
        │ Germany     ┆ 2018-08-01 ┆ 82.66      ┆ 4696 │
        │ Germany     ┆ 2019-01-01 ┆ 83.12      ┆ 4696 │
        │ Netherlands ┆ 2016-03-01 ┆ 17.11      ┆ 784  │
        │ Netherlands ┆ 2018-08-01 ┆ 17.32      ┆ 910  │
        │ Netherlands ┆ 2019-01-01 ┆ 17.4       ┆ 910  │
        └─────────────┴────────────┴────────────┴──────┘
        Nz4you should pass the column to join on as an argument)r  allow_eqr  )r4   r   r   r  rn   r   r	   r   r  r  r   r   	join_asofr  )r   r  r  r  r  r  r  r  r  r  r	  r
  r  r  r  r  r   by_left_	by_right_tolerance_strtolerance_nums                        r   r  zLazyFrame.join_asofi  s   x	 	$&&&b3.)) 	GH?h.HCS//!>)"c22:ttH II!x';$.w$<$<Iyy'H&03&?&?M

XII HI$(,0i%% 	&%MM	9-- 	&4Y??MM%M'27++ 	%eGnnG(BG,, 	'uXHI
 !,!1    
 
 	
r   
join_nullsnulls_equalz1.24innerzm:m)	r  r  r  validater  r  r  r
  r  (str | Expr | Sequence[str | Expr] | Nonehowrz   r  r{   MaintainOrderJoin | Nonec       	           t          | |           |
d}
|du}|du}|du}|p|}|r|rd}t          |          ||k    rd}t          |          |dk    rd}t          dd	           nr|d
k    rd}	d}t          dd	           nV|dk    rP|s|rd}t          |          |                     | j                            |j        g g |||||||

  
                  S |rt          |          }|}|}n2|rt          |          }t          |          }nd}t          |          |                     | j                            |j        |||||||||
|	                    S )u"  
        Add a join operation to the Logical Plan.

        .. versionchanged:: 1.24
            The `join_nulls` parameter was renamed `nulls_equal`.

        Parameters
        ----------
        other
            Lazy DataFrame to join with.
        on
            Name(s) of the join columns in both DataFrames. If set, `left_on` and
            `right_on` should be None. This should not be specified if `how='cross'`.
        how : {'inner','left', 'right', 'full', 'semi', 'anti', 'cross'}
            Join strategy.

            .. list-table ::
               :header-rows: 0

               * - **inner**
                 - *(Default)* Returns rows that have matching values in both tables.
               * - **left**
                 - Returns all rows from the left table, and the matched rows from
                   the right table.
               * - **full**
                 - Returns all rows when there is a match in either left or right.
               * - **cross**
                 - Returns the Cartesian product of rows from both tables
               * - **semi**
                 - Returns rows from the left table that have a match in the right
                   table.
               * - **anti**
                 - Returns rows from the left table that have no match in the right
                   table.

        left_on
            Join column of the left DataFrame.
        right_on
            Join column of the right DataFrame.
        suffix
            Suffix to append to columns with a duplicate name.
        validate: {'m:m', 'm:1', '1:m', '1:1'}
            Checks if join is of specified type.

            .. list-table ::
               :header-rows: 0

               * - **m:m**
                 - *(Default)* Many-to-many. Does not result in checks.
               * - **1:1**
                 - One-to-one. Checks if join keys are unique in both left and
                   right datasets.
               * - **1:m**
                 - One-to-many. Checks if join keys are unique in left dataset.
               * - **m:1**
                 - Many-to-one. Check if join keys are unique in right dataset.

            .. note::
                This is currently not supported by the streaming engine.
        nulls_equal
            Join on null values. By default null values will never produce matches.
        coalesce
            Coalescing behavior (merging of join columns).

            .. list-table ::
               :header-rows: 0

               * - **None**
                 - *(Default)* Coalesce unless `how='full'` is specified.
               * - **True**
                 - Always coalesce join columns.
               * - **False**
                 - Never coalesce join columns.

            .. note::
                Joining on any other expressions than `col`
                will turn off coalescing.
        maintain_order : {'none', 'left', 'right', 'left_right', 'right_left'}
            Which DataFrame row order to preserve, if any.
            Do not rely on any observed ordering without explicitly setting this
            parameter, as your code may break in a future release.
            Not specifying any ordering can improve performance.
            Supported for inner, left, right and full joins

            .. list-table ::
               :header-rows: 0

               * - **none**
                 - *(Default)* No specific ordering is desired. The ordering might
                   differ across Polars versions or even between different runs.
               * - **left**
                 - Preserves the order of the left DataFrame.
               * - **right**
                 - Preserves the order of the right DataFrame.
               * - **left_right**
                 - First preserves the order of the left DataFrame, then the right.
               * - **right_left**
                 - First preserves the order of the right DataFrame, then the left.

        allow_parallel
            Allow the physical plan to optionally evaluate the computation of both
            DataFrames up to the join in parallel.
        force_parallel
            Force the physical plan to evaluate the computation of both DataFrames up to
            the join in parallel.

        See Also
        --------
        join_asof

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [6.0, 7.0, 8.0],
        ...         "ham": ["a", "b", "c"],
        ...     }
        ... )
        >>> other_lf = pl.LazyFrame(
        ...     {
        ...         "apple": ["x", "y", "z"],
        ...         "ham": ["a", "b", "d"],
        ...     }
        ... )
        >>> lf.join(other_lf, on="ham").collect()
        shape: (2, 4)
        ┌─────┬─────┬─────┬───────┐
        │ foo ┆ bar ┆ ham ┆ apple │
        │ --- ┆ --- ┆ --- ┆ ---   │
        │ i64 ┆ f64 ┆ str ┆ str   │
        ╞═════╪═════╪═════╪═══════╡
        │ 1   ┆ 6.0 ┆ a   ┆ x     │
        │ 2   ┆ 7.0 ┆ b   ┆ y     │
        └─────┴─────┴─────┴───────┘
        >>> lf.join(other_lf, on="ham", how="full").collect()
        shape: (4, 5)
        ┌──────┬──────┬──────┬───────┬───────────┐
        │ foo  ┆ bar  ┆ ham  ┆ apple ┆ ham_right │
        │ ---  ┆ ---  ┆ ---  ┆ ---   ┆ ---       │
        │ i64  ┆ f64  ┆ str  ┆ str   ┆ str       │
        ╞══════╪══════╪══════╪═══════╪═══════════╡
        │ 1    ┆ 6.0  ┆ a    ┆ x     ┆ a         │
        │ 2    ┆ 7.0  ┆ b    ┆ y     ┆ b         │
        │ null ┆ null ┆ null ┆ z     ┆ d         │
        │ 3    ┆ 8.0  ┆ c    ┆ null  ┆ null      │
        └──────┴──────┴──────┴───────┴───────────┘
        >>> lf.join(other_lf, on="ham", how="left", coalesce=True).collect()
        shape: (3, 4)
        ┌─────┬─────┬─────┬───────┐
        │ foo ┆ bar ┆ ham ┆ apple │
        │ --- ┆ --- ┆ --- ┆ ---   │
        │ i64 ┆ f64 ┆ str ┆ str   │
        ╞═════╪═════╪═════╪═══════╡
        │ 1   ┆ 6.0 ┆ a   ┆ x     │
        │ 2   ┆ 7.0 ┆ b   ┆ y     │
        │ 3   ┆ 8.0 ┆ c   ┆ null  │
        └─────┴─────┴─────┴───────┘
        >>> lf.join(other_lf, on="ham", how="semi").collect()
        shape: (2, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ f64 ┆ str │
        ╞═════╪═════╪═════╡
        │ 1   ┆ 6.0 ┆ a   │
        │ 2   ┆ 7.0 ┆ b   │
        └─────┴─────┴─────┘
        >>> lf.join(other_lf, on="ham", how="anti").collect()
        shape: (1, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ f64 ┆ str │
        ╞═════╪═════╪═════╡
        │ 3   ┆ 8.0 ┆ c   │
        └─────┴─────┴─────┘

        >>> lf.join(other_lf, how="cross").collect()
        shape: (9, 5)
        ┌─────┬─────┬─────┬───────┬───────────┐
        │ foo ┆ bar ┆ ham ┆ apple ┆ ham_right │
        │ --- ┆ --- ┆ --- ┆ ---   ┆ ---       │
        │ i64 ┆ f64 ┆ str ┆ str   ┆ str       │
        ╞═════╪═════╪═════╪═══════╪═══════════╡
        │ 1   ┆ 6.0 ┆ a   ┆ x     ┆ a         │
        │ 1   ┆ 6.0 ┆ a   ┆ y     ┆ b         │
        │ 1   ┆ 6.0 ┆ a   ┆ z     ┆ d         │
        │ 2   ┆ 7.0 ┆ b   ┆ x     ┆ a         │
        │ 2   ┆ 7.0 ┆ b   ┆ y     ┆ b         │
        │ 2   ┆ 7.0 ┆ b   ┆ z     ┆ d         │
        │ 3   ┆ 8.0 ┆ c   ┆ x     ┆ a         │
        │ 3   ┆ 8.0 ┆ c   ┆ y     ┆ b         │
        │ 3   ┆ 8.0 ┆ c   ┆ z     ┆ d         │
        └─────┴─────┴─────┴───────┴───────────┘
        Nri  z;cannot use 'on' in conjunction with 'left_on' or 'right_on'z+'left_on' requires corresponding 'right_on'outerrf  :use of `how='outer'` should be replaced with `how='full'`.0.20.29r  outer_coalesceTzRuse of `how='outer_coalesce'` should be replaced with `how='full', coalesce=True`.crossz$cross join should not pass join keysz-must specify `on` OR `left_on` and `right_on`)r4   r   r"   r   r   joinr%   )r   r  r  r  r  r  r  r  r  r  r  r
  r  uses_onuses_left_onuses_right_on
uses_lr_onr   r  pyexprs_leftpyexprs_rights                        r   r&  zLazyFrame.join  s	   j 	$&&&!#ND.d* ,!2]
 	"z 	"OCS//!]**?CS//!'>>C%L!     $$$HC%d!     G^^ &* &< oo%##	J"""     		"4R88G"L#MM 	"9'BBL:8DDMMACS//!INN
 
 
 	
r   )r  Expr | Iterable[Expr]c                   t          | |           t          | }|                     | j                            |j        ||                    S )u  
        Perform a join based on one or multiple (in)equality predicates.

        This performs an inner join, so only rows where all predicates are true
        are included in the result, and a row from either DataFrame may be included
        multiple times in the result.

        .. note::
            The row order of the input DataFrames is not preserved.

        .. warning::
            This functionality is experimental. It may be
            changed at any point without it being considered a breaking change.

        Parameters
        ----------
        other
            DataFrame to join with.
        *predicates
            (In)Equality condition to join the two tables on.
            When a column name occurs in both tables, the proper suffix must
            be applied in the predicate.
        suffix
            Suffix to append to columns with a duplicate name.

        Examples
        --------
        >>> east = pl.LazyFrame(
        ...     {
        ...         "id": [100, 101, 102],
        ...         "dur": [120, 140, 160],
        ...         "rev": [12, 14, 16],
        ...         "cores": [2, 8, 4],
        ...     }
        ... )
        >>> west = pl.LazyFrame(
        ...     {
        ...         "t_id": [404, 498, 676, 742],
        ...         "time": [90, 130, 150, 170],
        ...         "cost": [9, 13, 15, 16],
        ...         "cores": [4, 2, 1, 4],
        ...     }
        ... )
        >>> east.join_where(
        ...     west,
        ...     pl.col("dur") < pl.col("time"),
        ...     pl.col("rev") < pl.col("cost"),
        ... ).collect()
        shape: (5, 8)
        ┌─────┬─────┬─────┬───────┬──────┬──────┬──────┬─────────────┐
        │ id  ┆ dur ┆ rev ┆ cores ┆ t_id ┆ time ┆ cost ┆ cores_right │
        │ --- ┆ --- ┆ --- ┆ ---   ┆ ---  ┆ ---  ┆ ---  ┆ ---         │
        │ i64 ┆ i64 ┆ i64 ┆ i64   ┆ i64  ┆ i64  ┆ i64  ┆ i64         │
        ╞═════╪═════╪═════╪═══════╪══════╪══════╪══════╪═════════════╡
        │ 100 ┆ 120 ┆ 12  ┆ 2     ┆ 498  ┆ 130  ┆ 13   ┆ 2           │
        │ 100 ┆ 120 ┆ 12  ┆ 2     ┆ 676  ┆ 150  ┆ 15   ┆ 1           │
        │ 100 ┆ 120 ┆ 12  ┆ 2     ┆ 742  ┆ 170  ┆ 16   ┆ 4           │
        │ 101 ┆ 140 ┆ 14  ┆ 8     ┆ 676  ┆ 150  ┆ 15   ┆ 1           │
        │ 101 ┆ 140 ┆ 14  ┆ 8     ┆ 742  ┆ 170  ┆ 16   ┆ 4           │
        └─────┴─────┴─────┴───────┴──────┴──────┴──────┴─────────────┘
        )r4   r%   r   r   
join_where)r   r  r  r  r  s        r   r/  zLazyFrame.join_where  sW    H 	$&&&0*=I  
 
 
 	
r   c                    t          t          t          j                            dd                              }t          |i |d|i}|                     | j                            |                    S )u  
        Add columns to this LazyFrame.

        Added columns will replace existing columns with the same name.

        Parameters
        ----------
        *exprs
            Column(s) to add, specified as positional arguments.
            Accepts expression input. Strings are parsed as column names, other
            non-expression inputs are parsed as literals.
        **named_exprs
            Additional columns to add, specified as keyword arguments.
            The columns will be renamed to the keyword used.

        Returns
        -------
        LazyFrame
            A new LazyFrame with the columns added.

        Notes
        -----
        Creating a new LazyFrame using this method does not create a new copy of
        existing data.

        Examples
        --------
        Pass an expression to add it as a new column.

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [0.5, 4, 10, 13],
        ...         "c": [True, True, False, True],
        ...     }
        ... )
        >>> lf.with_columns((pl.col("a") ** 2).alias("a^2")).collect()
        shape: (4, 4)
        ┌─────┬──────┬───────┬─────┐
        │ a   ┆ b    ┆ c     ┆ a^2 │
        │ --- ┆ ---  ┆ ---   ┆ --- │
        │ i64 ┆ f64  ┆ bool  ┆ i64 │
        ╞═════╪══════╪═══════╪═════╡
        │ 1   ┆ 0.5  ┆ true  ┆ 1   │
        │ 2   ┆ 4.0  ┆ true  ┆ 4   │
        │ 3   ┆ 10.0 ┆ false ┆ 9   │
        │ 4   ┆ 13.0 ┆ true  ┆ 16  │
        └─────┴──────┴───────┴─────┘

        Added columns will replace existing columns with the same name.

        >>> lf.with_columns(pl.col("a").cast(pl.Float64)).collect()
        shape: (4, 3)
        ┌─────┬──────┬───────┐
        │ a   ┆ b    ┆ c     │
        │ --- ┆ ---  ┆ ---   │
        │ f64 ┆ f64  ┆ bool  │
        ╞═════╪══════╪═══════╡
        │ 1.0 ┆ 0.5  ┆ true  │
        │ 2.0 ┆ 4.0  ┆ true  │
        │ 3.0 ┆ 10.0 ┆ false │
        │ 4.0 ┆ 13.0 ┆ true  │
        └─────┴──────┴───────┘

        Multiple columns can be added using positional arguments.

        >>> lf.with_columns(
        ...     (pl.col("a") ** 2).alias("a^2"),
        ...     (pl.col("b") / 2).alias("b/2"),
        ...     (pl.col("c").not_()).alias("not c"),
        ... ).collect()
        shape: (4, 6)
        ┌─────┬──────┬───────┬─────┬──────┬───────┐
        │ a   ┆ b    ┆ c     ┆ a^2 ┆ b/2  ┆ not c │
        │ --- ┆ ---  ┆ ---   ┆ --- ┆ ---  ┆ ---   │
        │ i64 ┆ f64  ┆ bool  ┆ i64 ┆ f64  ┆ bool  │
        ╞═════╪══════╪═══════╪═════╪══════╪═══════╡
        │ 1   ┆ 0.5  ┆ true  ┆ 1   ┆ 0.25 ┆ false │
        │ 2   ┆ 4.0  ┆ true  ┆ 4   ┆ 2.0  ┆ false │
        │ 3   ┆ 10.0 ┆ false ┆ 9   ┆ 5.0  ┆ true  │
        │ 4   ┆ 13.0 ┆ true  ┆ 16  ┆ 6.5  ┆ false │
        └─────┴──────┴───────┴─────┴──────┴───────┘

        Multiple columns can also be added by passing a list of expressions.

        >>> lf.with_columns(
        ...     [
        ...         (pl.col("a") ** 2).alias("a^2"),
        ...         (pl.col("b") / 2).alias("b/2"),
        ...         (pl.col("c").not_()).alias("not c"),
        ...     ]
        ... ).collect()
        shape: (4, 6)
        ┌─────┬──────┬───────┬─────┬──────┬───────┐
        │ a   ┆ b    ┆ c     ┆ a^2 ┆ b/2  ┆ not c │
        │ --- ┆ ---  ┆ ---   ┆ --- ┆ ---  ┆ ---   │
        │ i64 ┆ f64  ┆ bool  ┆ i64 ┆ f64  ┆ bool  │
        ╞═════╪══════╪═══════╪═════╪══════╪═══════╡
        │ 1   ┆ 0.5  ┆ true  ┆ 1   ┆ 0.25 ┆ false │
        │ 2   ┆ 4.0  ┆ true  ┆ 4   ┆ 2.0  ┆ false │
        │ 3   ┆ 10.0 ┆ false ┆ 9   ┆ 5.0  ┆ true  │
        │ 4   ┆ 13.0 ┆ true  ┆ 16  ┆ 6.5  ┆ false │
        └─────┴──────┴───────┴─────┴──────┴───────┘

        Use keyword arguments to easily name your expression inputs.

        >>> lf.with_columns(
        ...     ab=pl.col("a") * pl.col("b"),
        ...     not_c=pl.col("c").not_(),
        ... ).collect()
        shape: (4, 5)
        ┌─────┬──────┬───────┬──────┬───────┐
        │ a   ┆ b    ┆ c     ┆ ab   ┆ not_c │
        │ --- ┆ ---  ┆ ---   ┆ ---  ┆ ---   │
        │ i64 ┆ f64  ┆ bool  ┆ f64  ┆ bool  │
        ╞═════╪══════╪═══════╪══════╪═══════╡
        │ 1   ┆ 0.5  ┆ true  ┆ 0.5  ┆ false │
        │ 2   ┆ 4.0  ┆ true  ┆ 8.0  ┆ false │
        │ 3   ┆ 10.0 ┆ false ┆ 30.0 ┆ true  │
        │ 4   ┆ 13.0 ┆ true  ┆ 52.0 ┆ false │
        └─────┴──────┴───────┴──────┴───────┘

        Expressions with multiple outputs can automatically be instantiated as Structs
        by enabling the experimental setting `Config.set_auto_structify(True)`:

        >>> with pl.Config(auto_structify=True):
        ...     lf.drop("c").with_columns(
        ...         diffs=pl.col(["a", "b"]).diff().name.suffix("_diff"),
        ...     ).collect()
        shape: (4, 3)
        ┌─────┬──────┬─────────────┐
        │ a   ┆ b    ┆ diffs       │
        │ --- ┆ ---  ┆ ---         │
        │ i64 ┆ f64  ┆ struct[2]   │
        ╞═════╪══════╪═════════════╡
        │ 1   ┆ 0.5  ┆ {null,null} │
        │ 2   ┆ 4.0  ┆ {1,3.5}     │
        │ 3   ┆ 10.0 ┆ {1,6.0}     │
        │ 4   ┆ 13.0 ┆ {1,3.0}     │
        └─────┴──────┴─────────────┘
        r  r   r  )	r   r  r  r  r!  r%   r   r   r  r  s        r   r  zLazyFrame.with_columnsL  s}    d RZ^^,CQGGHHII	0
!
 
/8
 
 
 	 6 6w ? ?@@@r   c                    t          t          t          j                            dd                              }t          |i |d|i}|                     | j                            |                    S )a6  
        Add columns to this LazyFrame.

        Added columns will replace existing columns with the same name.

        This will run all expression sequentially instead of in parallel.
        Use this when the work per expression is cheap.

        Parameters
        ----------
        *exprs
            Column(s) to add, specified as positional arguments.
            Accepts expression input. Strings are parsed as column names, other
            non-expression inputs are parsed as literals.
        **named_exprs
            Additional columns to add, specified as keyword arguments.
            The columns will be renamed to the keyword used.

        Returns
        -------
        LazyFrame
            A new LazyFrame with the columns added.

        See Also
        --------
        with_columns
        r  r   r  )	r   r  r  r  r!  r%   r   r   with_columns_seqr  s        r   r2  zLazyFrame.with_columns_seq  s}    @ RZ^^,CQGGHHII	0
!
 
/8
 
 
 	 : :7 C CDDDr   zW`LazyFrame.with_context` is deprecated; use `pl.concat(..., how='horizontal')` instead.Self | list[Self]c                    t          |t                    s|g}|                     | j                            d |D                                 S )u  
        Add an external context to the computation graph.

        .. deprecated:: 1.0.0
            Use :func:`concat` instead, with `how='horizontal'`

        This allows expressions to also access columns from DataFrames
        that are not part of this one.

        Parameters
        ----------
        other
            Lazy DataFrame to join with.

        Examples
        --------
        >>> lf = pl.LazyFrame({"a": [1, 2, 3], "b": ["a", "c", None]})
        >>> lf_other = pl.LazyFrame({"c": ["foo", "ham"]})
        >>> lf.with_context(lf_other).select(  # doctest: +SKIP
        ...     pl.col("b") + pl.col("c").first()
        ... ).collect()
        shape: (3, 1)
        ┌──────┐
        │ b    │
        │ ---  │
        │ str  │
        ╞══════╡
        │ afoo │
        │ cfoo │
        │ null │
        └──────┘

        Fill nulls with the median from another DataFrame:

        >>> train_lf = pl.LazyFrame(
        ...     {"feature_0": [-1.0, 0, 1], "feature_1": [-1.0, 0, 1]}
        ... )
        >>> test_lf = pl.LazyFrame(
        ...     {"feature_0": [-1.0, None, 1], "feature_1": [-1.0, 0, 1]}
        ... )
        >>> test_lf.with_context(  # doctest: +SKIP
        ...     train_lf.select(pl.all().name.suffix("_train"))
        ... ).select(
        ...     pl.col("feature_0").fill_null(pl.col("feature_0_train").median())
        ... ).collect()
        shape: (3, 1)
        ┌───────────┐
        │ feature_0 │
        │ ---       │
        │ f64       │
        ╞═══════════╡
        │ -1.0      │
        │ 0.0       │
        │ 1.0       │
        └───────────┘
        c                    g | ]	}|j         
S rQ  )r   )rx  r  s     r   r  z*LazyFrame.with_context.<locals>.<listcomp>L  s    7P7P7PB7P7P7Pr   )r   r   r   r   with_contextr  s     r   r6  zLazyFrame.with_context  sQ    z %&& 	GE	 6 67P7P%7P7P7P Q QRRRr   r  5ColumnNameOrSelector | Iterable[ColumnNameOrSelector]c               r    t          | }|                     | j                            ||                    S )u  
        Remove columns from the DataFrame.

        Parameters
        ----------
        *columns
            Names of the columns that should be removed from the dataframe.
            Accepts column selector input.
        strict
            Validate that all column names exist in the current schema,
            and throw an exception if any do not.

        Examples
        --------
        Drop a single column by passing the name of that column.

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [6.0, 7.0, 8.0],
        ...         "ham": ["a", "b", "c"],
        ...     }
        ... )
        >>> lf.drop("ham").collect()
        shape: (3, 2)
        ┌─────┬─────┐
        │ foo ┆ bar │
        │ --- ┆ --- │
        │ i64 ┆ f64 │
        ╞═════╪═════╡
        │ 1   ┆ 6.0 │
        │ 2   ┆ 7.0 │
        │ 3   ┆ 8.0 │
        └─────┴─────┘

        Drop multiple columns by passing a selector.

        >>> import polars.selectors as cs
        >>> lf.drop(cs.numeric()).collect()
        shape: (3, 1)
        ┌─────┐
        │ ham │
        │ --- │
        │ str │
        ╞═════╡
        │ a   │
        │ b   │
        │ c   │
        └─────┘

        Use positional arguments to drop multiple columns.

        >>> lf.drop("foo", "ham").collect()
        shape: (3, 1)
        ┌─────┐
        │ bar │
        │ --- │
        │ f64 │
        ╞═════╡
        │ 6.0 │
        │ 7.0 │
        │ 8.0 │
        └─────┘
        r  )r%   r   r   drop)r   r   r  	drop_colss       r   r9  zLazyFrame.dropN  s5    J 3G<		y H HIIIr   mapping(Mapping[str, str] | Callable[[str], str]c               ~   t          |          r>|                     t          j                    j                            |                    S t          |                                          }t          |                                          }| 	                    | j
                            |||                    S )u  
        Rename column names.

        Parameters
        ----------
        mapping
            Key value pairs that map from old name to new name, or a function
            that takes the old name as input and returns the new name.
        strict
            Validate that all column names exist in the current schema,
            and throw an exception if any do not. (Note that this parameter
            is a no-op when passing a function to `mapping`).

        Notes
        -----
        If existing names are swapped (e.g. 'A' points to 'B' and 'B' points to 'A'),
        polars will block projection and predicate pushdowns at this node.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [6, 7, 8],
        ...         "ham": ["a", "b", "c"],
        ...     }
        ... )
        >>> lf.rename({"foo": "apple"}).collect()
        shape: (3, 3)
        ┌───────┬─────┬─────┐
        │ apple ┆ bar ┆ ham │
        │ ---   ┆ --- ┆ --- │
        │ i64   ┆ i64 ┆ str │
        ╞═══════╪═════╪═════╡
        │ 1     ┆ 6   ┆ a   │
        │ 2     ┆ 7   ┆ b   │
        │ 3     ┆ 8   ┆ c   │
        └───────┴─────┴─────┘
        >>> lf.rename(lambda column_name: "c" + column_name[1:]).collect()
        shape: (3, 3)
        ┌─────┬─────┬─────┐
        │ coo ┆ car ┆ cam │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ i64 ┆ str │
        ╞═════╪═════╪═════╡
        │ 1   ┆ 6   ┆ a   │
        │ 2   ┆ 7   ┆ b   │
        │ 3   ┆ 8   ┆ c   │
        └─────┴─────┴─────┘
        )r   r  r  r  r  mapr   keysr  r   r   rename)r   r;  r   existingnews        r   r@  zLazyFrame.rename  s    j G 	M;;quww|//88999GLLNN++Hw~~''((C##DI$4$4XsF$K$KLLLr   c                Z    |                      | j                                                  S )u_  
        Reverse the DataFrame.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "key": ["a", "b", "c"],
        ...         "val": [1, 2, 3],
        ...     }
        ... )
        >>> lf.reverse().collect()
        shape: (3, 2)
        ┌─────┬─────┐
        │ key ┆ val │
        │ --- ┆ --- │
        │ str ┆ i64 │
        ╞═════╪═════╡
        │ c   ┆ 3   │
        │ b   ┆ 2   │
        │ a   ┆ 1   │
        └─────┴─────┘
        )r   r   r  r   s    r   r  zLazyFrame.reverse  s&    0 	 1 1 3 3444r   r  )
fill_valueint | IntoExprColumnrD  IntoExpr | Nonec                   |t          |d          }t          |          }|                     | j                            ||                    S )u  
        Shift values by the given number of indices.

        Parameters
        ----------
        n
            Number of indices to shift forward. If a negative value is passed, values
            are shifted in the opposite direction instead.
        fill_value
            Fill the resulting null values with this value. Accepts scalar expression
            input. Non-expression inputs are parsed as literals.

        Notes
        -----
        This method is similar to the `LAG` operation in SQL when the value for `n`
        is positive. With a negative value for `n`, it is similar to `LEAD`.

        Examples
        --------
        By default, values are shifted forward by one index.

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [5, 6, 7, 8],
        ...     }
        ... )
        >>> lf.shift().collect()
        shape: (4, 2)
        ┌──────┬──────┐
        │ a    ┆ b    │
        │ ---  ┆ ---  │
        │ i64  ┆ i64  │
        ╞══════╪══════╡
        │ null ┆ null │
        │ 1    ┆ 5    │
        │ 2    ┆ 6    │
        │ 3    ┆ 7    │
        └──────┴──────┘

        Pass a negative value to shift in the opposite direction instead.

        >>> lf.shift(-2).collect()
        shape: (4, 2)
        ┌──────┬──────┐
        │ a    ┆ b    │
        │ ---  ┆ ---  │
        │ i64  ┆ i64  │
        ╞══════╪══════╡
        │ 3    ┆ 7    │
        │ 4    ┆ 8    │
        │ null ┆ null │
        │ null ┆ null │
        └──────┴──────┘

        Specify `fill_value` to fill the resulting null values.

        >>> lf.shift(-2, fill_value=100).collect()
        shape: (4, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 3   ┆ 7   │
        │ 4   ┆ 8   │
        │ 100 ┆ 100 │
        │ 100 ┆ 100 │
        └─────┴─────┘
        NT)
str_as_lit)r$   r   r   shift)r   r  rD  s      r   rI  zLazyFrame.shift  sN    R !.zdKKKJ!!$$	: > >???r   lengthc                    |r|dk     rd|d}t          |          |                     | j                            ||                    S )u  
        Get a slice of this DataFrame.

        Parameters
        ----------
        offset
            Start index. Negative indexing is supported.
        length
            Length of the slice. If set to `None`, all rows starting at the offset
            will be selected.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["x", "y", "z"],
        ...         "b": [1, 3, 5],
        ...         "c": [2, 4, 6],
        ...     }
        ... )
        >>> lf.slice(1, 2).collect()
        shape: (2, 3)
        ┌─────┬─────┬─────┐
        │ a   ┆ b   ┆ c   │
        │ --- ┆ --- ┆ --- │
        │ str ┆ i64 ┆ i64 │
        ╞═════╪═════╪═════╡
        │ y   ┆ 3   ┆ 4   │
        │ z   ┆ 5   ┆ 6   │
        └─────┴─────┴─────┘
        r   znegative slice lengths (z) are invalid for LazyFrame)r   r   r   r4  )r   r  rJ  r   s       r   r4  zLazyFrame.slice:  sU    @  	"fqjjRVRRRCS//!	 ? ?@@@r      c                ,    |                      |          S )uw  
        Get the first `n` rows.

        Alias for :func:`LazyFrame.head`.

        Parameters
        ----------
        n
            Number of rows to return.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4, 5, 6],
        ...         "b": [7, 8, 9, 10, 11, 12],
        ...     }
        ... )
        >>> lf.limit().collect()
        shape: (5, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 7   │
        │ 2   ┆ 8   │
        │ 3   ┆ 9   │
        │ 4   ┆ 10  │
        │ 5   ┆ 11  │
        └─────┴─────┘
        >>> lf.limit(2).collect()
        shape: (2, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 7   │
        │ 2   ┆ 8   │
        └─────┴─────┘
        )headr  s     r   limitzLazyFrame.limit_  s    V yy||r   c                .    |                      d|          S )uJ  
        Get the first `n` rows.

        Parameters
        ----------
        n
            Number of rows to return.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4, 5, 6],
        ...         "b": [7, 8, 9, 10, 11, 12],
        ...     }
        ... )
        >>> lf.head().collect()
        shape: (5, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 7   │
        │ 2   ┆ 8   │
        │ 3   ┆ 9   │
        │ 4   ┆ 10  │
        │ 5   ┆ 11  │
        └─────┴─────┘
        >>> lf.head(2).collect()
        shape: (2, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 7   │
        │ 2   ┆ 8   │
        └─────┴─────┘
        r   r4  r  s     r   rN  zLazyFrame.head  s    R zz!Qr   c                \    |                      | j                            |                    S )uI  
        Get the last `n` rows.

        Parameters
        ----------
        n
            Number of rows to return.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4, 5, 6],
        ...         "b": [7, 8, 9, 10, 11, 12],
        ...     }
        ... )
        >>> lf.tail().collect()
        shape: (5, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 2   ┆ 8   │
        │ 3   ┆ 9   │
        │ 4   ┆ 10  │
        │ 5   ┆ 11  │
        │ 6   ┆ 12  │
        └─────┴─────┘
        >>> lf.tail(2).collect()
        shape: (2, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 5   ┆ 11  │
        │ 6   ┆ 12  │
        └─────┴─────┘
        )r   r   tailr  s     r   rS  zLazyFrame.tail  s'    R 	q 1 1222r   c                ,    |                      d          S )u&  
        Get the last row of the DataFrame.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 5, 3],
        ...         "b": [2, 4, 6],
        ...     }
        ... )
        >>> lf.last().collect()
        shape: (1, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 3   ┆ 6   │
        └─────┴─────┘
        r  )rS  r   s    r   lastzLazyFrame.last  s    , yy||r   c                .    |                      dd          S )u(  
        Get the first row of the DataFrame.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 3, 5],
        ...         "b": [2, 4, 6],
        ...     }
        ... )
        >>> lf.first().collect()
        shape: (1, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 2   │
        └─────┴─────┘
        r   r  rQ  r   s    r   firstzLazyFrame.first  s    , zz!Qr   z\`LazyFrame.approx_n_unique` is deprecated; use `select(pl.all().approx_n_unique())` instead.c                r    |                      t          j                                                              S )u  
        Approximate count of unique values.

        .. deprecated:: 0.20.11
            Use `select(pl.all().approx_n_unique())` instead.

        This is done using the HyperLogLog++ algorithm for cardinality estimation.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [1, 2, 1, 1],
        ...     }
        ... )
        >>> lf.approx_n_unique().collect()  # doctest: +SKIP
        shape: (1, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ u32 ┆ u32 │
        ╞═════╪═════╡
        │ 4   ┆ 2   │
        └─────┴─────┘
        )r  r  r  approx_n_uniquer   s    r   rY  zLazyFrame.approx_n_unique  s(    > {{15772244555r   indexr  c                    	 |                      | j                            ||                    S # t          $ r# |dk     rdnd}d| d| }t	          |          dw xY w)u	  
        Add a row index as the first column in the LazyFrame.

        Parameters
        ----------
        name
            Name of the index column.
        offset
            Start the index at this offset. Cannot be negative.

        Warnings
        --------
        Using this function can have a negative effect on query performance.
        This may, for instance, block predicate pushdown optimization.

        Notes
        -----
        The resulting column does not have any special properties. It is a regular
        column of type `UInt32` (or `UInt64` in `polars-u64-idx`).

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 3, 5],
        ...         "b": [2, 4, 6],
        ...     }
        ... )
        >>> lf.with_row_index().collect()
        shape: (3, 3)
        ┌───────┬─────┬─────┐
        │ index ┆ a   ┆ b   │
        │ ---   ┆ --- ┆ --- │
        │ u32   ┆ i64 ┆ i64 │
        ╞═══════╪═════╪═════╡
        │ 0     ┆ 1   ┆ 2   │
        │ 1     ┆ 3   ┆ 4   │
        │ 2     ┆ 5   ┆ 6   │
        └───────┴─────┴─────┘
        >>> lf.with_row_index("id", offset=1000).collect()
        shape: (3, 3)
        ┌──────┬─────┬─────┐
        │ id   ┆ a   ┆ b   │
        │ ---  ┆ --- ┆ --- │
        │ u32  ┆ i64 ┆ i64 │
        ╞══════╪═════╪═════╡
        │ 1000 ┆ 1   ┆ 2   │
        │ 1001 ┆ 3   ┆ 4   │
        │ 1002 ┆ 5   ┆ 6   │
        └──────┴─────┴─────┘

        An index column can also be created using the expressions :func:`int_range`
        and :func:`len`.

        >>> lf.select(
        ...     pl.int_range(pl.len(), dtype=pl.UInt32).alias("index"),
        ...     pl.all(),
        ... ).collect()
        shape: (3, 3)
        ┌───────┬─────┬─────┐
        │ index ┆ a   ┆ b   │
        │ ---   ┆ --- ┆ --- │
        │ u32   ┆ i64 ┆ i64 │
        ╞═══════╪═════╪═════╡
        │ 0     ┆ 1   ┆ 2   │
        │ 1     ┆ 3   ┆ 4   │
        │ 2     ┆ 5   ┆ 6   │
        └───────┴─────┴─────┘
        r   negativez$greater than the maximum index valuez.`offset` input for `with_row_index` cannot be z, got N)r   r   with_row_indexOverflowErrorr   )r   r  r  issuer   s        r   r]  zLazyFrame.with_row_index3  s    L	,##DI$<$<T6$J$JKKK 	, 	, 	,"(1**JJ2XEX5XXPVXXCS//t+	,s	   -0 -Az`LazyFrame.with_row_count` is deprecated; use `LazyFrame.with_row_index` instead. Note that the default column name has changed from 'row_nr' to 'index'.row_nrc                .    |                      ||          S )u	  
        Add a column at index 0 that counts the rows.

        .. deprecated:: 0.20.4
            Use the :meth:`with_row_index` method instead.
            Note that the default column name has changed from 'row_nr' to 'index'.

        Parameters
        ----------
        name
            Name of the column to add.
        offset
            Start the row count at this offset.

        Warnings
        --------
        This can have a negative effect on query performance.
        This may, for instance, block predicate pushdown optimization.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 3, 5],
        ...         "b": [2, 4, 6],
        ...     }
        ... )
        >>> lf.with_row_count().collect()  # doctest: +SKIP
        shape: (3, 3)
        ┌────────┬─────┬─────┐
        │ row_nr ┆ a   ┆ b   │
        │ ---    ┆ --- ┆ --- │
        │ u32    ┆ i64 ┆ i64 │
        ╞════════╪═════╪═════╡
        │ 0      ┆ 1   ┆ 2   │
        │ 1      ┆ 3   ┆ 4   │
        │ 2      ┆ 5   ┆ 6   │
        └────────┴─────┴─────┘
        )r]  )r   r  r  s      r   with_row_countzLazyFrame.with_row_count  s    X ""4000r   c                x    |                      t          j        d                              ||                    S )uW  
        Take every nth row in the LazyFrame and return as a new LazyFrame.

        Parameters
        ----------
        n
            Gather every *n*-th row.
        offset
            Starting index.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [5, 6, 7, 8],
        ...     }
        ... )
        >>> lf.gather_every(2).collect()
        shape: (2, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 5   │
        │ 3   ┆ 7   │
        └─────┴─────┘
        >>> lf.gather_every(2, offset=1).collect()
        shape: (2, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 2   ┆ 6   │
        │ 4   ┆ 8   │
        └─────┴─────┘
        *)r  r  r  gather_every)r   r  r  s      r   re  zLazyFrame.gather_every  s/    P {{15::221f==>>>r   )matches_supertyper  Any | Expr | NoneFillNullStrategy | NonerO  rf  c               D   ddl m} |t          |t          j                  rd}nt          |t
                    r
t          g}nb|rbt          |t          t          f          rFt          t          t          t          t          t          t          t           t"          t$          t&          |g}nt          |t                    r	t          g}nt          |t                    r	t&          g}nt          |t(                    rt*          gd t,          D             z   }nt          |t.                    rt0          gd t,          D             z   }nbt          |t2                    r	t4          g}nDt          |t6                    r	t8          g}n&t          |t:                    rt<          t>          g}nd}|r<|                      tC          j"        |          #                    |||                    S | $                    tC          j%                    #                    |||                    S )uB
  
        Fill null values using the specified value or strategy.

        Parameters
        ----------
        value
            Value used to fill null values.
        strategy : {None, 'forward', 'backward', 'min', 'max', 'mean', 'zero', 'one'}
            Strategy used to fill null values.
        limit
            Number of consecutive null values to fill when using the 'forward' or
            'backward' strategy.
        matches_supertype
            Fill all matching supertypes of the fill `value` literal.

        See Also
        --------
        fill_nan

        Notes
        -----
        A null value is not the same as a NaN value.
        To fill NaN values, use :func:`fill_nan`.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, None, 4],
        ...         "b": [0.5, 4, None, 13],
        ...     }
        ... )
        >>> lf.fill_null(99).collect()
        shape: (4, 2)
        ┌─────┬──────┐
        │ a   ┆ b    │
        │ --- ┆ ---  │
        │ i64 ┆ f64  │
        ╞═════╪══════╡
        │ 1   ┆ 0.5  │
        │ 2   ┆ 4.0  │
        │ 99  ┆ 99.0 │
        │ 4   ┆ 13.0 │
        └─────┴──────┘
        >>> lf.fill_null(strategy="forward").collect()
        shape: (4, 2)
        ┌─────┬──────┐
        │ a   ┆ b    │
        │ --- ┆ ---  │
        │ i64 ┆ f64  │
        ╞═════╪══════╡
        │ 1   ┆ 0.5  │
        │ 2   ┆ 4.0  │
        │ 2   ┆ 4.0  │
        │ 4   ┆ 13.0 │
        └─────┴──────┘

        >>> lf.fill_null(strategy="max").collect()
        shape: (4, 2)
        ┌─────┬──────┐
        │ a   ┆ b    │
        │ --- ┆ ---  │
        │ i64 ┆ f64  │
        ╞═════╪══════╡
        │ 1   ┆ 0.5  │
        │ 2   ┆ 4.0  │
        │ 4   ┆ 13.0 │
        │ 4   ┆ 13.0 │
        └─────┴──────┘

        >>> lf.fill_null(strategy="zero").collect()
        shape: (4, 2)
        ┌─────┬──────┐
        │ a   ┆ b    │
        │ --- ┆ ---  │
        │ i64 ┆ f64  │
        ╞═════╪══════╡
        │ 1   ┆ 0.5  │
        │ 2   ┆ 4.0  │
        │ 0   ┆ 0.0  │
        │ 4   ┆ 13.0 │
        └─────┴──────┘
        r   )DecimalNc                ,    g | ]}t          |          S rQ  )r<   rx  us     r   r  z'LazyFrame.fill_null.<locals>.<listcomp>P      &Q&Q&Qqx{{&Q&Q&Qr   c                ,    g | ]}t          |          S rQ  )r=   rl  s     r   r  z'LazyFrame.fill_null.<locals>.<listcomp>R  rn  r   )&polarsrj  r   r  rn   r   r9   r  r  rA   rB   rC   rD   rE   rJ   rK   rL   rM   r?   r@   r   r<   r7   r	   r=   r   r;   r   rI   r   rH   r:   r  r  r  	fill_nullr  r  )r   r  r  rO  rf  rj  r  s          r   rq  zLazyFrame.fill_null  s   v 	#""""" %)) #E4(( !!" z%#u'F'F  E3'' E5)) !E8,, "&Q&Q<P&Q&Q&QQE9-- 
"&Q&Q<P&Q&Q&QQE4(( E4(( E3''  +.  ((E&MM++E8UCC   {{1577,,UHeDDEEEr   int | float | Expr | Nonec                    t          |t          j                  st          j        |          }|                     | j                            |j                            S )u  
        Fill floating point NaN values.

        Parameters
        ----------
        value
            Value used to fill NaN values.

        See Also
        --------
        fill_null

        Notes
        -----
        A NaN value is not the same as a null value.
        To fill null values, use :func:`fill_null`.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1.5, 2, float("nan"), 4],
        ...         "b": [0.5, 4, float("nan"), 13],
        ...     }
        ... )
        >>> lf.fill_nan(99).collect()
        shape: (4, 2)
        ┌──────┬──────┐
        │ a    ┆ b    │
        │ ---  ┆ ---  │
        │ f64  ┆ f64  │
        ╞══════╪══════╡
        │ 1.5  ┆ 0.5  │
        │ 2.0  ┆ 4.0  │
        │ 99.0 ┆ 99.0 │
        │ 4.0  ┆ 13.0 │
        └──────┴──────┘
        )	r   r  rn   r  r  r   r   fill_nanr  )r   r  s     r   rt  zLazyFrame.fill_nand  sL    N %)) 	!E%LLE	 2 25= A ABBBr   ddofc                \    |                      | j                            |                    S )u:  
        Aggregate the columns in the LazyFrame to their standard deviation value.

        Parameters
        ----------
        ddof
            “Delta Degrees of Freedom”: the divisor used in the calculation is N - ddof,
            where N represents the number of elements.
            By default ddof is 1.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [1, 2, 1, 1],
        ...     }
        ... )
        >>> lf.std().collect()
        shape: (1, 2)
        ┌──────────┬─────┐
        │ a        ┆ b   │
        │ ---      ┆ --- │
        │ f64      ┆ f64 │
        ╞══════════╪═════╡
        │ 1.290994 ┆ 0.5 │
        └──────────┴─────┘
        >>> lf.std(ddof=0).collect()
        shape: (1, 2)
        ┌──────────┬──────────┐
        │ a        ┆ b        │
        │ ---      ┆ ---      │
        │ f64      ┆ f64      │
        ╞══════════╪══════════╡
        │ 1.118034 ┆ 0.433013 │
        └──────────┴──────────┘
        )r   r   rr  r   ru  s     r   rr  zLazyFrame.std  '    L 	d 3 3444r   c                \    |                      | j                            |                    S )u  
        Aggregate the columns in the LazyFrame to their variance value.

        Parameters
        ----------
        ddof
            “Delta Degrees of Freedom”: the divisor used in the calculation is N - ddof,
            where N represents the number of elements.
            By default ddof is 1.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [1, 2, 1, 1],
        ...     }
        ... )
        >>> lf.var().collect()
        shape: (1, 2)
        ┌──────────┬──────┐
        │ a        ┆ b    │
        │ ---      ┆ ---  │
        │ f64      ┆ f64  │
        ╞══════════╪══════╡
        │ 1.666667 ┆ 0.25 │
        └──────────┴──────┘
        >>> lf.var(ddof=0).collect()
        shape: (1, 2)
        ┌──────┬────────┐
        │ a    ┆ b      │
        │ ---  ┆ ---    │
        │ f64  ┆ f64    │
        ╞══════╪════════╡
        │ 1.25 ┆ 0.1875 │
        └──────┴────────┘
        )r   r   varrw  s     r   rz  zLazyFrame.var  rx  r   c                Z    |                      | j                                                  S )uG  
        Aggregate the columns in the LazyFrame to their maximum value.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [1, 2, 1, 1],
        ...     }
        ... )
        >>> lf.max().collect()
        shape: (1, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 4   ┆ 2   │
        └─────┴─────┘
        )r   r   r{  r   s    r   r{  zLazyFrame.max  "    , 	000r   c                Z    |                      | j                                                  S )uG  
        Aggregate the columns in the LazyFrame to their minimum value.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [1, 2, 1, 1],
        ...     }
        ... )
        >>> lf.min().collect()
        shape: (1, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 1   │
        └─────┴─────┘
        )r   r   rs  r   s    r   rs  zLazyFrame.min  r|  r   c                Z    |                      | j                                                  S )uC  
        Aggregate the columns in the LazyFrame to their sum value.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [1, 2, 1, 1],
        ...     }
        ... )
        >>> lf.sum().collect()
        shape: (1, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 10  ┆ 5   │
        └─────┴─────┘
        )r   r   sumr   s    r   r  zLazyFrame.sum  r|  r   c                Z    |                      | j                                                  S )uR  
        Aggregate the columns in the LazyFrame to their mean value.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [1, 2, 1, 1],
        ...     }
        ... )
        >>> lf.mean().collect()
        shape: (1, 2)
        ┌─────┬──────┐
        │ a   ┆ b    │
        │ --- ┆ ---  │
        │ f64 ┆ f64  │
        ╞═════╪══════╡
        │ 2.5 ┆ 1.25 │
        └─────┴──────┘
        )r   r   rq  r   s    r   rq  zLazyFrame.mean'  s$    , 	 0 0111r   c                Z    |                      | j                                                  S )uI  
        Aggregate the columns in the LazyFrame to their median value.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [1, 2, 1, 1],
        ...     }
        ... )
        >>> lf.median().collect()
        shape: (1, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ f64 ┆ f64 │
        ╞═════╪═════╡
        │ 2.5 ┆ 1.0 │
        └─────┴─────┘
        )r   r   medianr   s    r   r  zLazyFrame.median?  s&    , 	 0 0 2 2333r   c                Z    |                      | j                                                  S )u  
        Aggregate the columns in the LazyFrame as the sum of their null value count.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, None, 3],
        ...         "bar": [6, 7, None],
        ...         "ham": ["a", "b", "c"],
        ...     }
        ... )
        >>> lf.null_count().collect()
        shape: (1, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ u32 ┆ u32 ┆ u32 │
        ╞═════╪═════╪═════╡
        │ 1   ┆ 1   ┆ 0   │
        └─────┴─────┴─────┘
        )r   r   rp  r   s    r   rp  zLazyFrame.null_countW  s&    . 	 4 4 6 6777r   r  float | Exprc                |    t          |          }|                     | j                            ||                    S )u1  
        Aggregate the columns in the LazyFrame to their quantile value.

        Parameters
        ----------
        quantile
            Quantile between 0.0 and 1.0.
        interpolation : {'nearest', 'higher', 'lower', 'midpoint', 'linear', 'equiprobable'}
            Interpolation method.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [1, 2, 3, 4],
        ...         "b": [1, 2, 1, 1],
        ...     }
        ... )
        >>> lf.quantile(0.7).collect()
        shape: (1, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ f64 ┆ f64 │
        ╞═════╪═════╡
        │ 3.0 ┆ 1.0 │
        └─────┴─────┘
        )r$   r   r   r  )r   r  rj  s      r   r  zLazyFrame.quantilep  s8    B )22	 2 28] K KLLLr   !str | Expr | Sequence[str | Expr]more_columns
str | Exprc                v    t          |g|R  }|                     | j                            |                    S )u,  
        Explode the DataFrame to long format by exploding the given columns.

        Parameters
        ----------
        columns
            Column names, expressions, or a selector defining them. The underlying
            columns being exploded must be of the `List` or `Array` data type.
        *more_columns
            Additional names of columns to explode, specified as positional arguments.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "letters": ["a", "a", "b", "c"],
        ...         "numbers": [[1], [2, 3], [4, 5], [6, 7, 8]],
        ...     }
        ... )
        >>> lf.explode("numbers").collect()
        shape: (8, 2)
        ┌─────────┬─────────┐
        │ letters ┆ numbers │
        │ ---     ┆ ---     │
        │ str     ┆ i64     │
        ╞═════════╪═════════╡
        │ a       ┆ 1       │
        │ a       ┆ 2       │
        │ a       ┆ 3       │
        │ b       ┆ 4       │
        │ b       ┆ 5       │
        │ c       ┆ 6       │
        │ c       ┆ 7       │
        │ c       ┆ 8       │
        └─────────┴─────────┘
        )r%   r   r   exploder   r  r  s      r   r  zLazyFrame.explode  s>    R 1H<HHH	 1 1' : :;;;r   r  )keepr  subset>ColumnNameOrSelector | Collection[ColumnNameOrSelector] | Noner  r   c                   |t          |          }|                     | j                            |||                    S )uN  
        Drop duplicate rows from this DataFrame.

        Parameters
        ----------
        subset
            Column name(s) or selector(s), to consider when identifying
            duplicate rows. If set to `None` (default), use all columns.
        keep : {'first', 'last', 'any', 'none'}
            Which of the duplicate rows to keep.

            * 'any': Does not give any guarantee of which row is kept.
                     This allows more optimizations.
            * 'none': Don't keep duplicate rows.
            * 'first': Keep first unique row.
            * 'last': Keep last unique row.
        maintain_order
            Keep the same order as the original DataFrame. This is more expensive to
            compute.
            Settings this to `True` blocks the possibility
            to run on the streaming engine.

        Returns
        -------
        LazyFrame
            LazyFrame with unique rows.

        Warnings
        --------
        This method will fail if there is a column of type `List` in the DataFrame or
        subset.

        Notes
        -----
        If you're coming from pandas, this is similar to
        `pandas.DataFrame.drop_duplicates`.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3, 1],
        ...         "bar": ["a", "a", "a", "a"],
        ...         "ham": ["b", "b", "b", "b"],
        ...     }
        ... )
        >>> lf.unique(maintain_order=True).collect()
        shape: (3, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ str ┆ str │
        ╞═════╪═════╪═════╡
        │ 1   ┆ a   ┆ b   │
        │ 2   ┆ a   ┆ b   │
        │ 3   ┆ a   ┆ b   │
        └─────┴─────┴─────┘
        >>> lf.unique(subset=["bar", "ham"], maintain_order=True).collect()
        shape: (1, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ str ┆ str │
        ╞═════╪═════╪═════╡
        │ 1   ┆ a   ┆ b   │
        └─────┴─────┴─────┘
        >>> lf.unique(keep="last", maintain_order=True).collect()
        shape: (3, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ str ┆ str │
        ╞═════╪═════╪═════╡
        │ 2   ┆ a   ┆ b   │
        │ 3   ┆ a   ┆ b   │
        │ 1   ┆ a   ┆ b   │
        └─────┴─────┴─────┘
        )r%   r   r   unique)r   r  r  r  s       r   r  zLazyFrame.unique  s@    j 3F;;F	 0 0 N NOOOr   c                ~    |t          |          }|                     | j                            |                    S )u  
        Drop all rows that contain one or more NaN values.

        The original order of the remaining rows is preserved.

        Parameters
        ----------
        subset
            Column name(s) for which NaN values are considered; if set to `None`
            (default), use all columns (note that only floating-point columns
            can contain NaNs).

        See Also
        --------
        drop_nulls

        Notes
        -----
        A NaN value is not the same as a null value.
        To drop null values, use :func:`drop_nulls`.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [-20.5, float("nan"), 80.0],
        ...         "bar": [float("nan"), 110.0, 25.5],
        ...         "ham": ["xxx", "yyy", None],
        ...     }
        ... )

        The default behavior of this method is to drop rows where any single
        value in the row is NaN:

        >>> lf.drop_nans().collect()
        shape: (1, 3)
        ┌──────┬──────┬──────┐
        │ foo  ┆ bar  ┆ ham  │
        │ ---  ┆ ---  ┆ ---  │
        │ f64  ┆ f64  ┆ str  │
        ╞══════╪══════╪══════╡
        │ 80.0 ┆ 25.5 ┆ null │
        └──────┴──────┴──────┘

        This behaviour can be constrained to consider only a subset of columns, as
        defined by name, or with a selector. For example, dropping rows only if
        there is a NaN in the "bar" column:

        >>> lf.drop_nans(subset=["bar"]).collect()
        shape: (2, 3)
        ┌──────┬───────┬──────┐
        │ foo  ┆ bar   ┆ ham  │
        │ ---  ┆ ---   ┆ ---  │
        │ f64  ┆ f64   ┆ str  │
        ╞══════╪═══════╪══════╡
        │ NaN  ┆ 110.0 ┆ yyy  │
        │ 80.0 ┆ 25.5  ┆ null │
        └──────┴───────┴──────┘

        Dropping a row only if *all* values are NaN requires a different formulation:

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [float("nan"), float("nan"), float("nan"), float("nan")],
        ...         "b": [10.0, 2.5, float("nan"), 5.25],
        ...         "c": [65.75, float("nan"), float("nan"), 10.5],
        ...     }
        ... )
        >>> lf.filter(~pl.all_horizontal(pl.all().is_nan())).collect()
        shape: (3, 3)
        ┌─────┬──────┬───────┐
        │ a   ┆ b    ┆ c     │
        │ --- ┆ ---  ┆ ---   │
        │ f64 ┆ f64  ┆ f64   │
        ╞═════╪══════╪═══════╡
        │ NaN ┆ 10.0 ┆ 65.75 │
        │ NaN ┆ 2.5  ┆ NaN   │
        │ NaN ┆ 5.25 ┆ 10.5  │
        └─────┴──────┴───────┘
        )r%   r   r   	drop_nansr   r  s     r   r  zLazyFrame.drop_nans  s<    h 3F;;F	 3 3F ; ;<<<r   c                ~    |t          |          }|                     | j                            |                    S )uX
  
        Drop all rows that contain one or more null values.

        The original order of the remaining rows is preserved.

        See Also
        --------
        drop_nans

        Notes
        -----
        A null value is not the same as a NaN value.
        To drop NaN values, use :func:`drop_nans`.


        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, 2, 3],
        ...         "bar": [6, None, 8],
        ...         "ham": ["a", "b", None],
        ...     }
        ... )

        The default behavior of this method is to drop rows where any single
        value in the row is null:

        >>> lf.drop_nulls().collect()
        shape: (1, 3)
        ┌─────┬─────┬─────┐
        │ foo ┆ bar ┆ ham │
        │ --- ┆ --- ┆ --- │
        │ i64 ┆ i64 ┆ str │
        ╞═════╪═════╪═════╡
        │ 1   ┆ 6   ┆ a   │
        └─────┴─────┴─────┘

        This behaviour can be constrained to consider only a subset of columns, as
        defined by name or with a selector. For example, dropping rows if there is
        a null in any of the integer columns:

        >>> import polars.selectors as cs
        >>> lf.drop_nulls(subset=cs.integer()).collect()
        shape: (2, 3)
        ┌─────┬─────┬──────┐
        │ foo ┆ bar ┆ ham  │
        │ --- ┆ --- ┆ ---  │
        │ i64 ┆ i64 ┆ str  │
        ╞═════╪═════╪══════╡
        │ 1   ┆ 6   ┆ a    │
        │ 3   ┆ 8   ┆ null │
        └─────┴─────┴──────┘

        Dropping a row only if *all* values are null requires a different formulation:

        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": [None, None, None, None],
        ...         "b": [1, 2, None, 1],
        ...         "c": [1, None, None, 1],
        ...     }
        ... )
        >>> lf.filter(~pl.all_horizontal(pl.all().is_null())).collect()
        shape: (3, 3)
        ┌──────┬─────┬──────┐
        │ a    ┆ b   ┆ c    │
        │ ---  ┆ --- ┆ ---  │
        │ null ┆ i64 ┆ i64  │
        ╞══════╪═════╪══════╡
        │ null ┆ 1   ┆ 1    │
        │ null ┆ 2   ┆ null │
        │ null ┆ 1   ┆ 1    │
        └──────┴─────┴──────┘
        )r%   r   r   
drop_nullsr  s     r   r  zLazyFrame.drop_nullsq  s<    ^ 3F;;F	 4 4V < <===r   )rZ  variable_name
value_name
streamable<ColumnNameOrSelector | Sequence[ColumnNameOrSelector] | Noner  r  r  c                   |st          dd           |g nt          |          }|g nt          |          }|                     | j                            ||||                    S )u  
        Unpivot a DataFrame from wide to long format.

        Optionally leaves identifiers set.

        This function is useful to massage a DataFrame into a format where one or more
        columns are identifier variables (index) while all other columns, considered
        measured variables (on), are "unpivoted" to the row axis leaving just
        two non-identifier columns, 'variable' and 'value'.

        Parameters
        ----------
        on
            Column(s) or selector(s) to use as values variables; if `on`
            is empty all columns that are not in `index` will be used.
        index
            Column(s) or selector(s) to use as identifier variables.
        variable_name
            Name to give to the `variable` column. Defaults to "variable"
        value_name
            Name to give to the `value` column. Defaults to "value"
        streamable
            deprecated

        Notes
        -----
        If you're coming from pandas, this is similar to `pandas.DataFrame.melt`,
        but with `index` replacing `id_vars` and `on` replacing `value_vars`.
        In other frameworks, you might know this operation as `pivot_longer`.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "a": ["x", "y", "z"],
        ...         "b": [1, 3, 5],
        ...         "c": [2, 4, 6],
        ...     }
        ... )
        >>> import polars.selectors as cs
        >>> lf.unpivot(cs.numeric(), index="a").collect()
        shape: (6, 3)
        ┌─────┬──────────┬───────┐
        │ a   ┆ variable ┆ value │
        │ --- ┆ ---      ┆ ---   │
        │ str ┆ str      ┆ i64   │
        ╞═════╪══════════╪═══════╡
        │ x   ┆ b        ┆ 1     │
        │ y   ┆ b        ┆ 3     │
        │ z   ┆ b        ┆ 5     │
        │ x   ┆ c        ┆ 2     │
        │ y   ┆ c        ┆ 4     │
        │ z   ┆ c        ┆ 6     │
        └─────┴──────────┴───────┘
        z\the `streamable` parameter for `LazyFrame.unpivot` is deprecatedThis parameter has no effectz1.5.0r  )r"   r%   r   r   unpivot)r   r  rZ  r  r  r  s         r   r  zLazyFrame.unpivot  s    @  	%/    :RR#A"#E#Em)G)N)N	 1 1"eZ W WXXXr   )r  r  r  no_optimizationsr   validate_output_schemar   Callable[[DataFrame], DataFrame]r  None | SchemaDictr  c               z    |rd}d}d}|                      | j                            |||||||                    S )u/  
        Apply a custom function.

        It is important that the function returns a Polars DataFrame.

        Parameters
        ----------
        function
            Lambda/ function to apply.
        predicate_pushdown
            Allow predicate pushdown optimization to pass this node.
        projection_pushdown
            Allow projection pushdown optimization to pass this node.
        slice_pushdown
            Allow slice pushdown optimization to pass this node.
        no_optimizations
            Turn off all optimizations past this point.
        schema
            Output schema of the function, if set to `None` we assume that the schema
            will remain unchanged by the applied function.
        validate_output_schema
            It is paramount that polars' schema is correct. This flag will ensure that
            the output schema of this function will be checked with the expected schema.
            Setting this to `False` will not do this check, but may lead to hard to
            debug bugs.
        streamable
            Whether the function that is given is eligible to be running with the
            streaming engine. That means that the function must produce the same result
            when it is executed in batches or when it is be executed on the full
            dataset.

        Warnings
        --------
        The `schema` of a `LazyFrame` must always be correct. It is up to the caller
        of this function to ensure that this invariant is upheld.

        It is important that the optimization flags are correct. If the custom function
        for instance does an aggregation of a column, `predicate_pushdown` should not
        be allowed, as this prunes rows and will influence your aggregation results.

        Examples
        --------
        >>> lf = (  # doctest: +SKIP
        ...     pl.LazyFrame(
        ...         {
        ...             "a": pl.int_range(-100_000, 0, eager=True),
        ...             "b": pl.int_range(0, 100_000, eager=True),
        ...         }
        ...     )
        ...     .map_batches(lambda x: 2 * x, streamable=True)
        ...     .collect(engine="streaming")
        ... )
        shape: (100_000, 2)
        ┌─────────┬────────┐
        │ a       ┆ b      │
        │ ---     ┆ ---    │
        │ i64     ┆ i64    │
        ╞═════════╪════════╡
        │ -200000 ┆ 0      │
        │ -199998 ┆ 2      │
        │ -199996 ┆ 4      │
        │ -199994 ┆ 6      │
        │ …       ┆ …      │
        │ -8      ┆ 199992 │
        │ -6      ┆ 199994 │
        │ -4      ┆ 199996 │
        │ -2      ┆ 199998 │
        └─────────┴────────┘
        F)r  r   validate_output)r   r   r  )	r   r`  r  r  r  r  r   r  r  s	            r   r  zLazyFrame.map_batches  se    b  	#!&"'"NI!!"#% 6 "  

 

 
	
r   c                t    |                      t          j        d                                                    S )u  
        Interpolate intermediate values. The interpolation method is linear.

        Nulls at the beginning and end of the series remain null.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "foo": [1, None, 9, 10],
        ...         "bar": [6, 7, 9, None],
        ...         "baz": [1, None, None, 9],
        ...     }
        ... )
        >>> lf.interpolate().collect()
        shape: (4, 3)
        ┌──────┬──────┬──────────┐
        │ foo  ┆ bar  ┆ baz      │
        │ ---  ┆ ---  ┆ ---      │
        │ f64  ┆ f64  ┆ f64      │
        ╞══════╪══════╪══════════╡
        │ 1.0  ┆ 6.0  ┆ 1.0      │
        │ 5.0  ┆ 7.0  ┆ 3.666667 │
        │ 9.0  ┆ 9.0  ┆ 6.333333 │
        │ 10.0 ┆ null ┆ 9.0      │
        └──────┴──────┴──────────┘
        rd  )r  r  r  interpolater   s    r   r  zLazyFrame.interpolater  s*    8 {{15::1133444r   7ColumnNameOrSelector | Collection[ColumnNameOrSelector]rq   c                v    t          |g|R  }|                     | j                            |                    S )u	  
        Decompose struct columns into separate columns for each of their fields.

        The new columns will be inserted into the DataFrame at the location of the
        struct column.

        Parameters
        ----------
        columns
            Name of the struct column(s) that should be unnested.
        *more_columns
            Additional columns to unnest, specified as positional arguments.

        Examples
        --------
        >>> df = pl.LazyFrame(
        ...     {
        ...         "before": ["foo", "bar"],
        ...         "t_a": [1, 2],
        ...         "t_b": ["a", "b"],
        ...         "t_c": [True, None],
        ...         "t_d": [[1, 2], [3]],
        ...         "after": ["baz", "womp"],
        ...     }
        ... ).select("before", pl.struct(pl.col("^t_.$")).alias("t_struct"), "after")
        >>> df.collect()
        shape: (2, 3)
        ┌────────┬─────────────────────┬───────┐
        │ before ┆ t_struct            ┆ after │
        │ ---    ┆ ---                 ┆ ---   │
        │ str    ┆ struct[4]           ┆ str   │
        ╞════════╪═════════════════════╪═══════╡
        │ foo    ┆ {1,"a",true,[1, 2]} ┆ baz   │
        │ bar    ┆ {2,"b",null,[3]}    ┆ womp  │
        └────────┴─────────────────────┴───────┘
        >>> df.unnest("t_struct").collect()
        shape: (2, 6)
        ┌────────┬─────┬─────┬──────┬───────────┬───────┐
        │ before ┆ t_a ┆ t_b ┆ t_c  ┆ t_d       ┆ after │
        │ ---    ┆ --- ┆ --- ┆ ---  ┆ ---       ┆ ---   │
        │ str    ┆ i64 ┆ str ┆ bool ┆ list[i64] ┆ str   │
        ╞════════╪═════╪═════╪══════╪═══════════╪═══════╡
        │ foo    ┆ 1   ┆ a   ┆ true ┆ [1, 2]    ┆ baz   │
        │ bar    ┆ 2   ┆ b   ┆ null ┆ [3]       ┆ womp  │
        └────────┴─────┴─────┴──────┴───────────┴───────┘
        )r%   r   r   unnestr  s      r   r  zLazyFrame.unnest  s>    f 1H<HHH	 0 0 9 9:::r   c                    t          | |           |                     | j                            |j        |                    S )uR	  
        Take two sorted DataFrames and merge them by the sorted key.

        The output of this operation will also be sorted.
        It is the callers responsibility that the frames
        are sorted in ascending order by that key otherwise
        the output will not make sense.

        The schemas of both LazyFrames must be equal.

        Parameters
        ----------
        other
            Other DataFrame that must be merged
        key
            Key that is sorted.

        Examples
        --------
        >>> df0 = pl.LazyFrame(
        ...     {"name": ["steve", "elise", "bob"], "age": [42, 44, 18]}
        ... ).sort("age")
        >>> df0.collect()
        shape: (3, 2)
        ┌───────┬─────┐
        │ name  ┆ age │
        │ ---   ┆ --- │
        │ str   ┆ i64 │
        ╞═══════╪═════╡
        │ bob   ┆ 18  │
        │ steve ┆ 42  │
        │ elise ┆ 44  │
        └───────┴─────┘
        >>> df1 = pl.LazyFrame(
        ...     {"name": ["anna", "megan", "steve", "thomas"], "age": [21, 33, 42, 20]}
        ... ).sort("age")
        >>> df1.collect()
        shape: (4, 2)
        ┌────────┬─────┐
        │ name   ┆ age │
        │ ---    ┆ --- │
        │ str    ┆ i64 │
        ╞════════╪═════╡
        │ thomas ┆ 20  │
        │ anna   ┆ 21  │
        │ megan  ┆ 33  │
        │ steve  ┆ 42  │
        └────────┴─────┘
        >>> df0.merge_sorted(df1, key="age").collect()
        shape: (7, 2)
        ┌────────┬─────┐
        │ name   ┆ age │
        │ ---    ┆ --- │
        │ str    ┆ i64 │
        ╞════════╪═════╡
        │ bob    ┆ 18  │
        │ thomas ┆ 20  │
        │ anna   ┆ 21  │
        │ megan  ┆ 33  │
        │ steve  ┆ 42  │
        │ steve  ┆ 42  │
        │ elise  ┆ 44  │
        └────────┴─────┘

        Notes
        -----
        No guarantee is given over the output row order when the key is equal
        between the both dataframes.

        The key must be sorted in ascending order.
        )r4   r   r   merge_sorted)r   r  r&  s      r   r  zLazyFrame.merge_sorted  s=    P 	$&&&	 6 6uz3 G GHHHr   r  columnc                   t          |t                    sd}t          |          |                     t	          j        |                              |                    S )a  
        Flag a column as sorted.

        This can speed up future operations.

        Parameters
        ----------
        column
            Column that is sorted
        descending
            Whether the column is sorted in descending order.

        Warnings
        --------
        This can lead to incorrect results if the data is NOT sorted!!
        Use with care!

        z6expected a 'str' for argument 'column' in 'set_sorted'r  )r   r   r   r  r  r  
set_sorted)r   r  r  r   s       r   r  zLazyFrame.set_sorted  sT    4 &#&& 	!JCC..   v!9!9Z!9!P!PQQQr   )r  r  include_nullsr   Literal['left', 'inner', 'full']r  c          	     4   t          | |           |dv rd}t          dd           |dvrd|}t          |          d}	|_|6|4d
}	d}
|                     |
          } |                    |
          }|
gx}}n+|d}t          |          |d}t          |          n|x}}t	          |t
                    r|g}t	          |t
                    r|g}|                                 }|D ]}||vrd|d}t          |          |                                }|D ]}||vrd|d}t          |          |dk    r9t          |          t          |          k    r|	r|                     |
          S | S t          |          
                    |          t          |          z
  }rCd|                    t          j        d
                              d                             }nddg fd|D             }|                      |j        g ||R  |||d
|                              fd|D                                           |          }|	r|                    |
          }|                     |j                  S )u  
        Update the values in this `LazyFrame` with the values in `other`.

        .. warning::
            This functionality is considered **unstable**. It may be changed
            at any point without it being considered a breaking change.

        Parameters
        ----------
        other
            LazyFrame that will be used to update the values
        on
            Column names that will be joined on. If set to `None` (default),
            the implicit row index of each frame is used as a join key.
        how : {'left', 'inner', 'full'}
            * 'left' will keep all rows from the left table; rows may be duplicated
              if multiple rows in the right frame match the left row's key.
            * 'inner' keeps only those rows where the key exists in both frames.
            * 'full' will update existing rows where the key matches while also
              adding any new rows contained in the given frame.
        left_on
           Join column(s) of the left DataFrame.
        right_on
           Join column(s) of the right DataFrame.
        include_nulls
            Overwrite values in the left frame with null values from the right frame.
            If set to `False` (default), null values in the right frame are ignored.
        maintain_order : {'none', 'left', 'right', 'left_right', 'right_left'}
            Which order of rows from the inputs to preserve. See :func:`~LazyFrame.join`
            for details. Unlike `join` this function preserves the left order by
            default.

        Notes
        -----
        This is syntactic sugar for a left/inner join that preserves the order
        of the left `DataFrame` by default, with an optional coalesce when
        `include_nulls = False`.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {
        ...         "A": [1, 2, 3, 4],
        ...         "B": [400, 500, 600, 700],
        ...     }
        ... )
        >>> lf.collect()
        shape: (4, 2)
        ┌─────┬─────┐
        │ A   ┆ B   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ 400 │
        │ 2   ┆ 500 │
        │ 3   ┆ 600 │
        │ 4   ┆ 700 │
        └─────┴─────┘
        >>> new_lf = pl.LazyFrame(
        ...     {
        ...         "B": [-66, None, -99],
        ...         "C": [5, 3, 1],
        ...     }
        ... )

        Update `df` values with the non-null values in `new_df`, by row index:

        >>> lf.update(new_lf).collect()
        shape: (4, 2)
        ┌─────┬─────┐
        │ A   ┆ B   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ -66 │
        │ 2   ┆ 500 │
        │ 3   ┆ -99 │
        │ 4   ┆ 700 │
        └─────┴─────┘

        Update `df` values with the non-null values in `new_df`, by row index,
        but only keeping those rows that are common to both frames:

        >>> lf.update(new_lf, how="inner").collect()
        shape: (3, 2)
        ┌─────┬─────┐
        │ A   ┆ B   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ -66 │
        │ 2   ┆ 500 │
        │ 3   ┆ -99 │
        └─────┴─────┘

        Update `df` values with the non-null values in `new_df`, using a full
        outer join strategy that defines explicit join columns in each frame:

        >>> lf.update(new_lf, left_on=["A"], right_on=["C"], how="full").collect()
        shape: (5, 2)
        ┌─────┬─────┐
        │ A   ┆ B   │
        │ --- ┆ --- │
        │ i64 ┆ i64 │
        ╞═════╪═════╡
        │ 1   ┆ -99 │
        │ 2   ┆ 500 │
        │ 3   ┆ 600 │
        │ 4   ┆ 700 │
        │ 5   ┆ -66 │
        └─────┴─────┘

        Update `df` values including null values in `new_df`, using a full
        outer join strategy that defines explicit join columns in each frame:

        >>> lf.update(
        ...     new_lf, left_on="A", right_on="C", how="full", include_nulls=True
        ... ).collect()
        shape: (5, 2)
        ┌─────┬──────┐
        │ A   ┆ B    │
        │ --- ┆ ---  │
        │ i64 ┆ i64  │
        ╞═════╪══════╡
        │ 1   ┆ -99  │
        │ 2   ┆ 500  │
        │ 3   ┆ null │
        │ 4   ┆ 700  │
        │ 5   ┆ -66  │
        └─────┴──────┘
        )r!  r$  rf  r"  r#  r  )r  r  rf  z6`how` must be one of {'left', 'inner', 'full'}; found FNT__POLARS_ROW_INDEXz#missing join columns for left framez$missing join columns for right framezleft join column z
 not foundzright join column )__POLARS_VALIDITYr   rQ  __POLARS_RIGHTc              3  $   K   | ]
}|  V  d S r   rQ  )rx  r  tmp_names     r   rz  z#LazyFrame.update.<locals>.<genexpr>  s.      FF$T-8--FFFFFFr   )r  r  r  r  r  r  c              3    K   | ]}rt          j        t          j                                                                                t          j        |                                        t          j        |                      n+t          j        |  t          j        |          g                              |          V  d S r   )r  whenr  is_nullthen	otherwiser  r  )rx  r  r  r  validitys     r   rz  z#LazyFrame.update.<locals>.<genexpr>  s       
 
  %HAF15??224455T!%++&&Yqu%8h%8%899:::%8h%8%8!%++$FGG%++
 
 
 
 
 
r   )r4   r"   r   r]  r   r   r   r	  r9  r  intersectionr  r  r  r  r&  r  r   r   )r   r  r  r  r  r  r  r  r   row_index_usedrow_index_nameleft_schemar  right_schemaright_otherdrop_columnsrG  r  r  s         `          @@r   r  zLazyFrame.update0  sq   ^ 	$&&&---C%L!   
 ///TSTTCS//!:8#3!%!5**>::,,^<<&4%55(( ??C$S//)#@C$S//) $
 "$#Ghgs## 	 iGh$$ 	" zH))++ 	& 	&D;&&<$<<< oo% ' ++-- 	& 	&D<''=4=== oo% (
 &==S..#h--?? 1yy000K ,''44[AACMMQ  	-H&&quT{{'8'8!'E'EFFEEH#RFFFF+FFFRRII@h@@x@@@!-    \ 
 
 
 
 
 
 (
 
 
 
 
 T,+ 	.  	1[[00F,,,r   c                Z    |                      | j                                                  S )u  
        Return the number of non-null elements for each column.

        Examples
        --------
        >>> lf = pl.LazyFrame(
        ...     {"a": [1, 2, 3, 4], "b": [1, 2, 1, None], "c": [None, None, None, None]}
        ... )
        >>> lf.count().collect()
        shape: (1, 3)
        ┌─────┬─────┬─────┐
        │ a   ┆ b   ┆ c   │
        │ --- ┆ --- ┆ --- │
        │ u32 ┆ u32 ┆ u32 │
        ╞═════╪═════╪═════╡
        │ 4   ┆ 3   ┆ 0   │
        └─────┴─────┴─────┘
        )r   r   ro  r   s    r   ro  zLazyFrame.count!  s$    & 	 1 1222r   z`LazyFrame.melt` is deprecated; use `LazyFrame.unpivot` instead, with `index` instead of `id_vars` and `on` instead of `value_vars`)r  id_vars
value_varsc               6    |                      |||||          S )a  
        Unpivot a DataFrame from wide to long format.

        Optionally leaves identifiers set.

        This function is useful to massage a DataFrame into a format where one or more
        columns are identifier variables (id_vars) while all other columns, considered
        measured variables (value_vars), are "unpivoted" to the row axis leaving just
        two non-identifier columns, 'variable' and 'value'.

        .. deprecated:: 1.0.0
            Use the :meth:`.unpivot` method instead.

        Parameters
        ----------
        id_vars
            Column(s) or selector(s) to use as identifier variables.
        value_vars
            Column(s) or selector(s) to use as values variables; if `value_vars`
            is empty all columns that are not in `id_vars` will be used.
        variable_name
            Name to give to the `variable` column. Defaults to "variable"
        value_name
            Name to give to the `value` column. Defaults to "value"
        streamable
            Allow this node to run in the streaming engine.
            If this runs in streaming, the output of the unpivot operation
            will not have a stable ordering.
        )rZ  r  r  r  r  )r  )r   r  r  r  r  r  s         r   meltzLazyFrame.melt6  s/    T ||'!!  
 
 	
r   rC  contextpc.ComputeContext | None	plan_typepc._typing.PlanTypePreferencepc.LazyFrameExtc                0    t          j        | ||          S )u  
        Run a query remotely on Polars Cloud.

        This allows you to run Polars remotely on
        one or more workers via several strategies
        for distributed compute.

        Read more in the `Announcement post <https://pola.rs/posts/polars-cloud-what-we-are-building/>`_

        Parameters
        ----------
        context
            Compute context in which queries are executed.
            If none given, it will take the default context.
        plan_type
            Whether to give a dot diagram of a plain text
            version of logical plan.

        Examples
        --------
        Run a query on a cloud instance.

        >>> lf = pl.LazyFrame([1, 2, 3]).sum()
        >>> in_progress = lf.remote().collect()  # doctest: +SKIP
        >>> # do some other work
        >>> in_progress.await_result()  # doctest: +SKIP
        shape: (1, 1)
        ┌──────────┐
        │ column_0 │
        │ ---      │
        │ i64      │
        ╞══════════╡
        │ 6        │
        └──────────┘

        Run a query distributed.

        >>> lf = (
        ...     pl.scan_parquet("s3://my_bucket/").group_by("key").agg(pl.sum("values"))
        ... )
        >>> in_progress = lf.remote().distributed().collect()  # doctest: +SKIP
        >>> in_progress.await_result()  # doctest: +SKIP
        shape: (1, 1)
        ┌──────────┐
        │ column_0 │
        │ ---      │
        │ i64      │
        ╞══════════╡
        │ 6        │
        └──────────┘

        )r  r  r  )pcLazyFrameExt)r   r  r  s      r   remotezLazyFrame.remoteh  s    t $9MMMMr   raiseforbid)missing_columnsmissing_struct_fieldsextra_columnsextra_struct_fieldsinteger_cast
float_castSchemaDict | Schemar  LLiteral['insert', 'raise'] | Mapping[str, Literal['insert', 'raise'] | Expr]r  ELiteral['insert', 'raise'] | Mapping[str, Literal['insert', 'raise']]r  Literal['ignore', 'raise']r  ELiteral['ignore', 'raise'] | Mapping[str, Literal['ignore', 'raise']]r  GLiteral['upcast', 'forbid'] | Mapping[str, Literal['upcast', 'forbid']]r  c                 
 ddl m
 d

fdt          |t                    rt	          |          }n|}t          |t                    r!fd|                                D             }	nt          |
          r |          }	n|}	t                              | j        	                    ||	|||||	                    S )u{  
        Match or evolve the schema of a LazyFrame into a specific schema.

        By default, match_to_schema returns an error if the input schema does not
        exactly match the target schema. It also allows columns to be freely reordered,
        with additional coercion rules available through optional parameters.

        .. warning::
            This functionality is considered **unstable**. It may be changed
            at any point without it being considered a breaking change.

        Parameters
        ----------
        schema
            Target schema to match or evolve to.
        missing_columns
            Raise of insert missing columns from the input with respect to the `schema`.

            This can also be an expression per column with what to insert if it is
            missing.
        missing_struct_fields
            Raise of insert missing struct fields from the input with respect to the
            `schema`.
        extra_columns
            Raise of ignore extra columns from the input with respect to the `schema`.
        extra_struct_fields
            Raise of ignore extra struct fields from the input with respect to the
            `schema`.
        integer_cast
            Forbid of upcast for integer columns from the input to the respective column
            in `schema`.
        float_cast
            Forbid of upcast for float columns from the input to the respective column
            in `schema`.

        Examples
        --------
        Ensuring the schema matches

        >>> lf = pl.LazyFrame({"a": [1, 2, 3], "b": ["A", "B", "C"]})
        >>> lf.match_to_schema({"a": pl.Int64, "b": pl.String}).collect()
        shape: (3, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ str │
        ╞═════╪═════╡
        │ 1   ┆ A   │
        │ 2   ┆ B   │
        │ 3   ┆ C   │
        └─────┴─────┘
        >>> (lf.match_to_schema({"a": pl.Int64}).collect())  # doctest: +SKIP
        polars.exceptions.SchemaError: extra columns in `match_to_schema`: "b"

        Adding missing columns

        >>> (
        ...     pl.LazyFrame({"a": [1, 2, 3]})
        ...     .match_to_schema(
        ...         {"a": pl.Int64, "b": pl.String},
        ...         missing_columns="insert",
        ...     )
        ...     .collect()
        ... )
        shape: (3, 2)
        ┌─────┬──────┐
        │ a   ┆ b    │
        │ --- ┆ ---  │
        │ i64 ┆ str  │
        ╞═════╪══════╡
        │ 1   ┆ null │
        │ 2   ┆ null │
        │ 3   ┆ null │
        └─────┴──────┘
        >>> (
        ...     pl.LazyFrame({"a": [1, 2, 3]})
        ...     .match_to_schema(
        ...         {"a": pl.Int64, "b": pl.String},
        ...         missing_columns={"b": pl.col.a.cast(pl.String)},
        ...     )
        ...     .collect()
        ... )
        shape: (3, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ str │
        ╞═════╪═════╡
        │ 1   ┆ 1   │
        │ 2   ┆ 2   │
        │ 3   ┆ 3   │
        └─────┴─────┘

        Removing extra columns

        >>> (
        ...     pl.LazyFrame({"a": [1, 2, 3], "b": ["A", "B", "C"]})
        ...     .match_to_schema(
        ...         {"a": pl.Int64},
        ...         extra_columns="ignore",
        ...     )
        ...     .collect()
        ... )
        shape: (3, 1)
        ┌─────┐
        │ a   │
        │ --- │
        │ i64 │
        ╞═════╡
        │ 1   │
        │ 2   │
        │ 3   │
        └─────┘

        Upcasting integers and floats

        >>> (
        ...     pl.LazyFrame(
        ...         {"a": [1, 2, 3], "b": [1.0, 2.0, 3.0]},
        ...         schema={"a": pl.Int32, "b": pl.Float32},
        ...     )
        ...     .match_to_schema(
        ...         {"a": pl.Int64, "b": pl.Float64},
        ...         integer_cast="upcast",
        ...         float_cast="upcast",
        ...     )
        ...     .collect()
        ... )
        shape: (3, 2)
        ┌─────┬─────┐
        │ a   ┆ b   │
        │ --- ┆ --- │
        │ i64 ┆ f64 │
        ╞═════╪═════╡
        │ 1   ┆ 1.0 │
        │ 2   ┆ 2.0 │
        │ 3   ┆ 3.0 │
        └─────┴─────┘
        r   )rn   r  !Literal['insert', 'raise'] | Exprr   #Literal['insert', 'raise'] | PyExprc                6    t          |           r| j        S | S r   )r   r  )r  rn   s    r   prepare_missing_columnsz:LazyFrame.match_to_schema.<locals>.prepare_missing_columnsB   s$     %&& %}$Lr   c                .    i | ]\  }}| |          S rQ  rQ  )rx  r&  r  r  s      r   
<dictcomp>z-LazyFrame.match_to_schema.<locals>.<dictcomp>S   s;     & & &C ,,U33& & &r   )r   r  r  r  r  r  r  )r  r  r   r  )
rp  rn   r   r   r^   r   r   r   r   match_to_schema)r   r   r  r  r  r  r  r  schema_prepmissing_columns_pyexprrn   r  s             @@r   r  zLazyFrame.match_to_schema  s   x 	 	 	 	 	 	 	 fg&& 	! ..KK K
 ow// 	5& & & &"1"7"7"9"9& & &"" .. 	5%<%<_%M%M""%4"$$I%%" 6&;+$7)% &  

 

 
	
r   None | str | list[str]statsc                    | }|-t          |t                    r|g}|                    |          }|                                                    |          S )zz
        Get all runtime metadata for each column.

        This is unstable and is meant for debugging purposes.
        N)r  )r   r   r  r  _to_metadata)r   r  r  r  s       r   r  zLazyFrame._to_metadatah   sX     '3'' $")7##Bzz||((u(555r   )NN)r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   )r   ra   r   r   )r   r   )r   r   r   r   )
r   r   r   r   rV   r   r   r   r   r   )r   r   r   r   r   r   )r   r   )r   r  )r   r^   )r   r  )r   r   )r  r   r   r   )r  r  r   r   )r  r   r   r   )r&  r   r   r   )r   r   r   )r.  r   r   r   )r1  r2  r   r   )r   r   ).)rN  r   r   rO  r   r   )rN  r   r   rS  r   r   )rN  rU  r   r   r   r   )rN  rW  r   r   r   rX  )r`  ra  rb  rc  rd  re  r   r   )rh  )rk  rl  rj  r   r   rl   ) r   rt   r9  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r   r   r   rs   r  r  r  ri   r   r   )(r9  r   r  r   r  r  r  r   r  r  r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r   rs   r  r   r  r   r  ri   r   r  )r  )r  r   r   r   )r  r  r  rw   r  r  r  r  r  r   r  r   r   r   )r  r   r  r   r   r   )r  r  r  r  r  r  r   r   )"r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r  r  r  r   rs   r  ri   r  r   r   r  )r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r   rs   r   r4  r  ri   r   r[   )r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r   rs   r   r7  r  ri   r   rl   )r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r   rs   r   r   r  ri   r  r   r   r9  )r<  r4  r   rs   r  ri   r   r=  )r<  r7  r   rs   r  ri   r   rA  )r<  r   r   rs   r  ri   r   rC  )$r   rX  rL  r   rM  r   rN  rY  rO  r   rP  r   r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r7  rV  r]  r   rs   rW  r^  r  ri   r   r   )$r   rX  rL  r   rM  r   rN  rY  rO  r   rP  r   r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r4  rV  r]  r   rs   rW  r^  r  ri   r   r   )$r   rX  rL  r   rM  r   rN  rY  rO  r   rP  r   r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rW  r^  rU  r   r   r   rV  r]  r   rs   r  ri   r   rc  )r   rX  rL  ry  rx  rz  r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r7  r   rs   r  ri   r   r   )r   rX  rL  ry  rx  rz  r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r4  r   rs   r  ri   r   r   )r   rX  rL  ry  rx  rz  r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r   r   rs   r  ri   r   rc  )0r   r   r  r   r  r   r  r   r  r   r  r   r  r  r  r  r  r  r  r  r  r  r  r   r  r  r  r  r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r7  r   rs   r  ri   r   r   )0r   r   r  r   r  r   r  r   r  r   r  r   r  r  r  r  r  r  r  r  r  r  r  r   r  r  r  r  r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r4  r   rs   r  ri   r   r   )0r   r   r  r   r  r   r  r   r  r   r  r   r  r  r  r  r  r  r  r  r  r  r  r   r  r  r  r  r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r   r   rs   r  ri   r   rc  )r   r   r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r7  r   rs   r  ri   r   r   )r   r   r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r4  r   rs   r  ri   r   r   )r   r   r  r   rQ  rZ  rR  r[  rS  r  rT  r\  rU  r   r   r   r   rs   r  ri   r   rc  )r  )r  r  r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r   rl   )r  r  r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r  r   r   rl   )r  r  r   r   r   r   )r   )r  r  r   r   )r  r  r  r  r  r   r   r   )r  r  r  r   r   r   )r  r  r  rw   r   r   )r  r  r  r   r  rw   r   rZ   )r  rw   r  r  r  r  r  rp   r  r  r   rZ   )r  rw   r  r  r  r  r  r  r  r   r  rp   r  r|   r  r  r  r   r   rZ   ) r  r   r  r  r  r  r  r  r  r  r  r  r  r  r  ro   r  r   r	  r  r
  r   r  r   r  r   r  r   r  r   r   r   )Nr  )r  r   r  r  r  rz   r  r  r  r  r  r   r  r{   r  r   r  r  r  r  r
  r   r  r   r   r   )r  r   r  r-  r  r   r   r   )r  r3  r   r   )r  r7  r   r   r   r   )r;  r<  r   r   r   r   )r  )r  rE  rD  rF  r   r   )r  r  rJ  r   r   r   )rL  )rZ  r   )r  r   r  r  r   r   )r`  r   )r  r  r  r  r   r   )NNN)
r  rg  r  rh  rO  r   rf  r   r   r   )r  rr  r   r   )ru  r  r   r   )ri  )r  r  rj  r   r   r   )r  r  r  r  r   r   )r  r  r  r   r  r   r   r   )r  r  r   r   )r  r  rZ  r  r  r  r  r  r  r   r   r   )r`  r  r  r   r  r   r  r   r  r   r   r  r  r   r  r   r   r   )r  r  r  rq   r   r   )r  r   r&  r   r   r   )r  r   r  r   r   r   )Nr  )r  r   r  r  r  r  r  r  r  r  r  r   r  r  r   r   )NNNN)r  r  r  r  r  r  r  r  r  r   r   r   )NrC  )r  r  r  r  r   r  )r   r  r  r  r  r  r  r  r  r  r  r  r  r  r   r   )r  r  r  r  r   rl   )zr?  
__module____qualname____doc____annotations__r  r   r8   r   classmethodr   r   r   r   r   propertyr  r  r   r
  r  r  r  r  r  r!  r#  r%  r(  r,  r0  r6  r;  rA  rM  r   r   rg  r  r    r]   r\   r:  r  r  r  r  r   r  r  r"  r  r@  r   ra  r}  r  r  r!   r  r  r   r  r  r  r+  r  r  r  r  r  r  r  r  r  r&  r)   r/  r  r2  r6  r9  r@  r  rI  r4  rO  rN  rS  rU  rW  rY  r]  rb  re  rq  rt  rr  rz  r{  rs  r  rq  r  rp  r  r  r  r  r  r  r  r  r  r  r  r  ro  r  r  r  r  rQ  r   r   r   r      s        V Vp %(SUUJ**** '+*.

 /3%)*9!
 
 
 
 
 
6    [
       : : : :   %     [4 KS=5 =5 =5 =5 =5 [=5~ '- '- '- X'-R '. '. '. X'.R  %  %  % X %D %+ %+ %+ X%+N      % % % %% % % %$ $ $ $$ $ $ $% % % %% % % %, , , ,       1 1 1 1   @ @ @ @   & ?B     X QQQQ XQJM     X ,0>A '/	>A >A >A >A >A >A@E/ E/ E/ E/R 7IL )2	L L L L L L\ #"$$ !("#'$($(#"&"&%)###''>#Z- Z- Z- Z- Z-  %$Z-x #"$$ )- '3" #'$($(#"&"&%)## $!'>+[
 [
 [
 [
 [
  %$[
z
 
 
 
 
< -2,1$"v
 v
 v
 v
 v
 v
p 4: R& R& R& R& R& R&h ! y'JJJ */KL KL KL KL KL KJKLZ ! y'JJJ */KO KO KO KO KO KJKOZ  ##'$($( %#"&"&%)##*#'>#V V V V V Vp  ##'$($(#"&"&%)# %#'>     X$  ##'$($(#"&"&%)# %#%*'>     X$ #"$$ ##'$($(#"&"&%)# %# '>e6 e6 e6 e6 e6  %$e6N 
 $'>0 0 0 0 0 X0  "'#'># # # # # X# #"$$ #'>d d d d d %$dLF F F F@ 
 "(,37%)%)#15 26" #+/'>1     X6 
 "(,37%)%)#15 26
 #+/'>1     X> "(,37%)%)#15 26+/ #'>1K* K* K* K* K* K*Z 
 .4+/#15 26"#'>!     X& 
 .4+/#15 26#'>!     X. .<+/#15 26#'>!b* b* b* b* b* b*H 
 "##&*"&"&(,&*!%,0#15 26"#'>7     X< 
 "##&*"&"&(,&*!%,0#15 26#'>7     XD "##&*"&"&(,&*!%,0#15 26#'>7`* `* `* `* `* `*D 
  $15 26"#'>     X" 
  $15 26#'>     X*  $15 26#'>M* M* M* M* M* M*^ Z	9  1
 # #'$($( %#"&"&%)#1
 1
 1
 1
 1
	 1
j p) # #'$($( %#"&"&%)#!p) p) p) p) p) p)d   23 3 3 3" fB fB fB fB fB fBP,J ,J ,J ,J ,J\3 3 3 3J SK SK SK SK SK SKjp
 p
 p
 p
dX
 X
 X
 X
tk; k; k; k;Z? ? ? ?B  %j  j  j  j  j  j X ! z9EEE *.!(9=H  H  H  H  H  FEH T ! z9EEE *.)-#(!'9=$O  O  O  O  O  FEO j
 &*&* $.2/3)-%/:>#$$(!%#q
 q
 q
 q
 q
 q
f ! }fMMM 8<#	]
 =A=A#(! $37#$]
 ]
 ]
 ]
 ]
 NM]
~ XZZ
 	M
 M
 M
 M
 M
 ZM
^WA WA WA WAr%E %E %E %EN Z	: <S <S <S	 <SB FJ FJ FJ FJ FJ FJR TX:M :M :M :M :M :Mx5 5 5 56 )*L@LPL@ L@ L@ L@ L@ L@\#A #A #A #A #AJ+ + + + +Z)  )  )  )  ) V)3 )3 )3 )3 )3V   0       0 Z	< 6 6 6	 6:K, K, K, K, K,Z Z	S (1 (1 (1 (1	 (1T(? (? (? (? (?X $(,0 	JF #'JF JF JF JF JF JFX)C )C )C )CV&5 &5 &5 &5 &5P&5 &5 &5 &5 &5P1 1 1 101 1 1 101 1 1 102 2 2 204 4 4 408 8 8 88 )2"M "M "M "M "MH*< *< *< *<\ RVWP $)$WP WP WP WP WP WPv RVV= V= V= V= V=t RVQ> Q> Q> Q> Q>j LPJY OS$(!%JY JY JY JY JY JY` $($(#!&$('+ `
 `
 `
 `
 `
 `
D5 5 5 5<4; 4; 4; 4;lII II II II^ !	R R R R R R> XZZ *.06	n- /3/3#39n- n- n- n- n- Zn-`3 3 3 3* Z	H  QUSW$(!%,
  ,
 ,
 ,
 ,
 ,
	 ,
\ XZZ -1389N 9N 9N 9N Z9Nv XZZ =D5<4;5<6>6>A
 A
 A
 A
 A
 ZA
J +/(,6 6 6 6 6 6 6r   r   )r   rs   r   rs   )r   r   r   r   )r   rs   r   r   r   r   r   r   r   r   r   r   )
__future__r   
contextlibr   r  r\  collections.abcr   r   r   r   r   r	   	functoolsr
   r   r   r   r   r  r   pathlibr   typingr   r   r   r   r   r   r   polars._reexport	_reexportr  rp  r   r  polars._typingr   r   polars._utils.async_r   r   polars._utils.convertr   r   polars._utils.deprecationr   r    r!   r"   polars._utils.parquetr#   polars._utils.parser$   r%   polars._utils.serder&   polars._utils.slicer'   polars._utils.unstabler(   r)   polars._utils.variousr*   r+   r,   r-   r.   r/   r0   r1   r2   r3   r4   polars._utils.wrapr5   r6   polars.datatypesr7   r8   r9   r:   r;   r<   r=   r>   r?   r@   rA   rB   rC   rD   rE   rF   rG   rH   rI   rJ   rK   rL   rM   rN   rO   rP   polars.datatypes.grouprQ   polars.dependenciesrR   rS   rT   rU   r  rV   r   polars.exceptionsrW   polars.interchange.protocolrX   polars.lazyframe.engine_configrY   polars.lazyframe.group_byrZ   polars.lazyframe.in_processr[   polars.lazyframe.opt_flagsr\   r]   polars.schemar^   polars.selectorsr_   r`   suppressImportErrorpolars.polarsra   rb   sysrc   rd   re   rf   rg   rh   ri   rj   rk   rl   rm   rn   ro   rp   rq   rr   rs   rt   ru   rv   rw   rx   ry   rz   r{   r|   r}   r~   r   r   r   r   r   r   r   r   r   r   r   nppolars.io.cloudr   polars.io.parquetr   version_infor   r   typing_extensionsr   r   r   r   r   r   r   rQ  r   r   <module>r     sY	   " " " " " "     				 				  / / / / / / / / 4 4 4 4 4 4 4 4 4 4 4 4 0 0 0 0 0 0 0 0 0 0                                                    ! ! ! ! ! !        M L L L L L L L R R R R R R R R            A @ @ @ @ @        8 7 7 7 7 7 / / / / / / C C C C C C C C                          2 1 1 1 1 1 1 1                                                       8 1 0 0 0 0 0         
 3 2 2 2 2 2 - - - - - - 0 0 0 0 0 0 3 3 3 3 3 3 4 4 4 4 4 4 1 1 1 1 1 1 6 6 6 6 6 6 U U U U U U U U             6 6 6 6 6 6 6 6Z%% ? ?>>>>>>>>? ? ? ? ? ? ? ? ? ? ? ? ? ? ?  =JJJ==========""""""""888888		[	)	) 9 9888888889 9 9 9 9 9 9 9 9 9 9 9 9 9 9 1000000000                                                         : 0/////::::::888888
7""111111111<<<<<<<<
7""******
7""'''''''000000A	#AA A A A   "(A (A (A (AVO~6 O~6 O~6 O~6 O~6 O~6 O~6 O~6 O~6 O~6s$   '	E<<F F <	GGG