
polars

DummyLearner

Bases: SupervisedLearner, SupervisedIncrementalLearner

Dummy learner that learns nothing.

This learner is useful for testing purposes.

DummyModel(output_names)

Bases: Model

Dummy model that predicts zeros.

This model is useful for testing purposes.

Initialize the model.

Parameters:

    output_names (list[str]): The names of the output features. Required.
Source code in src/flowcean/polars/dummy.py
def __init__(self, output_names: list[str]) -> None:
    """Initialize the model.

    Args:
        output_names: The names of the output features.
    """
    self.output_names = output_names

CsvDataLoader(path, separator=',')

Bases: Dataset

DataLoader for CSV files.

Initialize the CsvDataLoader.

Parameters:

    path (str | Path): Path to the CSV file. Required.
    separator (str): Value separator. Defaults to ",".
Source code in src/flowcean/polars/environments/csv.py
def __init__(self, path: str | Path, separator: str = ",") -> None:
    """Initialize the CsvDataLoader.

    Args:
        path: Path to the CSV file.
        separator: Value separator. Defaults to ",".
    """
    data = pl.scan_csv(path, separator=separator)
    data = data.rename(lambda column_name: column_name.strip())
    super().__init__(data)
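
A minimal usage sketch, assuming CsvDataLoader can be imported from flowcean.polars (as the source path suggests) and that measurements.csv is a hypothetical file:

    from flowcean.polars import CsvDataLoader  # assumed import path

    loader = CsvDataLoader("measurements.csv", separator=";")
    # Like any Dataset, the loader exposes its data as a LazyFrame; observe()
    # is the accessor used elsewhere on this page (e.g. by TrainTestSplit.split).
    print(loader.observe().collect().head())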

Dataset(data)

Bases: OfflineEnvironment

A dataset environment.

This environment represents static tabular datasets.

Attributes:

    data (LazyFrame): The data to represent.

Initialize the dataset environment.

Parameters:

    data (DataFrame | LazyFrame): The data to represent. Required.
Source code in src/flowcean/polars/environments/dataset.py
def __init__(self, data: pl.DataFrame | pl.LazyFrame) -> None:
    """Initialize the dataset environment.

    Args:
        data: The data to represent.
    """
    if isinstance(data, pl.DataFrame):
        self.data = data.lazy()
        self._length = len(data)
    else:
        self.data = data
    super().__init__()

__len__()

Return the number of samples in the dataset.

Source code in src/flowcean/polars/environments/dataset.py
def __len__(self) -> int:
    """Return the number of samples in the dataset."""
    if self._length is None:
        # This operation is potentially very slow / costly
        self._length = cast(
            int,
            self.data.select(pl.len()).collect().item(),
        )
    return self._length
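
A short sketch, assuming Dataset can be imported from flowcean.polars. With an eager DataFrame the length is known immediately; with a LazyFrame it is computed on the first call to len():

    import polars as pl
    from flowcean.polars import Dataset  # assumed import path

    eager = Dataset(pl.DataFrame({"x": [1, 2, 3]}))
    lazy = Dataset(pl.LazyFrame({"x": [1, 2, 3]}))
    print(len(eager))  # 3, taken from the DataFrame directly
    print(len(lazy))   # 3, computed by collecting pl.len() once and then cached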

DatasetPredictionEnvironment(environment, batch_size)

Bases: ActiveEnvironment

Dataset prediction environment.

Initialize the dataset prediction environment.

Parameters:

    environment (Dataset): The dataset to use for prediction. Required.
    batch_size (int): The batch size of the prediction. Required.
Source code in src/flowcean/polars/environments/datasetprediction.py
def __init__(
    self,
    environment: Dataset,
    batch_size: int,
) -> None:
    """Initialize the dataset prediction environment.

    Args:
        environment: The dataset to use for prediction.
        batch_size: The batch size of the prediction.
    """
    super().__init__()
    self.environment = environment
    self.batch_size = batch_size

JoinedOfflineEnvironment(environments)

Bases: OfflineEnvironment

Environment that joins multiple offline environments.

Attributes:

    environments (Iterable[OfflineEnvironment]): The offline environments to join.

Initialize the joined offline environment.

Parameters:

    environments (Iterable[OfflineEnvironment]): The offline environments to join. Required.
Source code in src/flowcean/polars/environments/join.py
def __init__(self, environments: Iterable[OfflineEnvironment]) -> None:
    """Initialize the joined offline environment.

    Args:
        environments: The offline environments to join.
    """
    self.environments = environments
    super().__init__()

JsonDataLoader(path)

Bases: Dataset

DataLoader for JSON files.

Initialize the JsonDataLoader.

Parameters:

    path (str | Path): Path to the JSON file. Required.
Source code in src/flowcean/polars/environments/json.py
def __init__(self, path: str | Path) -> None:
    """Initialize the JsonDataLoader.

    Args:
        path: Path to the JSON file.
    """
    data = pl.read_json(path)
    super().__init__(data.lazy())

ParquetDataLoader(path)

Bases: Dataset

DataLoader for Parquet files.

Initialize the ParquetDataLoader.

Parameters:

    path (str | Path): Path to the Parquet file. Required.
Source code in src/flowcean/polars/environments/parquet.py
def __init__(self, path: str | Path) -> None:
    """Initialize the ParquetDataLoader.

    Args:
        path: Path to the Parquet file.
    """
    data = pl.scan_parquet(path)
    super().__init__(data)

StreamingOfflineEnvironment(environment, batch_size)

Bases: IncrementalEnvironment

Streaming offline environment.

This environment streams data from an offline environment in batches.

Initialize the streaming offline environment.

Parameters:

    environment (OfflineEnvironment): The offline environment to stream. Required.
    batch_size (int): The batch size of the streaming environment. Required.
Source code in src/flowcean/polars/environments/streaming.py
def __init__(
    self,
    environment: OfflineEnvironment,
    batch_size: int,
) -> None:
    """Initialize the streaming offline environment.

    Args:
        environment: The offline environment to stream.
        batch_size: The batch size of the streaming environment.
    """
    super().__init__()
    self.environment = environment
    self.batch_size = batch_size
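
A usage sketch, assuming Dataset and StreamingOfflineEnvironment can be imported from flowcean.polars and that iterating the environment yields one LazyFrame per batch (as the collect helper at the end of this page suggests):

    import polars as pl
    from flowcean.polars import Dataset, StreamingOfflineEnvironment  # assumed import path

    offline = Dataset(pl.DataFrame({"x": list(range(10))}))
    streaming = StreamingOfflineEnvironment(offline, batch_size=4)
    for batch in streaming:  # assumed iteration protocol
        print(batch.collect().height)  # at most 4 rows per batch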

TrainTestSplit(ratio, *, shuffle=False)

Split data into train and test sets.

Initialize the train-test splitter.

Parameters:

    ratio (float): The ratio of the data to put in the training set. Required.
    shuffle (bool): Whether to shuffle the data before splitting. Defaults to False.
Source code in src/flowcean/polars/environments/train_test_split.py
def __init__(
    self,
    ratio: float,
    *,
    shuffle: bool = False,
) -> None:
    """Initialize the train-test splitter.

    Args:
        ratio: The ratio of the data to put in the training set.
        shuffle: Whether to shuffle the data before splitting.
    """
    if ratio < 0 or ratio > 1:
        message = "ratio must be between 0 and 1"
        raise ValueError(message)
    self.ratio = ratio
    self.shuffle = shuffle

split(environment)

Split the data into train and test sets.

Parameters:

    environment (OfflineEnvironment): The environment to split. Required.
Source code in src/flowcean/polars/environments/train_test_split.py
def split(
    self,
    environment: OfflineEnvironment,
) -> tuple[Dataset, Dataset]:
    """Split the data into train and test sets.

    Args:
        environment: The environment to split.
    """
    logger.info("Splitting data into train and test sets")
    data = environment.observe().collect(streaming=True)
    pivot = int(len(data) * self.ratio)
    splits = _split(
        data,
        lengths=[pivot, len(data) - pivot],
        shuffle=self.shuffle,
        seed=get_seed(),
    )
    return Dataset(splits[0].lazy()), Dataset(splits[1].lazy())
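
A usage sketch, assuming Dataset and TrainTestSplit can be imported from flowcean.polars:

    import polars as pl
    from flowcean.polars import Dataset, TrainTestSplit  # assumed import path

    data = Dataset(pl.DataFrame({"x": list(range(10)), "y": list(range(10))}))
    train, test = TrainTestSplit(ratio=0.8, shuffle=True).split(data)
    print(len(train), len(test))  # 8 2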

InvalidUriSchemeError(scheme)

Bases: Exception

Exception raised when a URI scheme is invalid.

Initialize the InvalidUriSchemeError.

Parameters:

    scheme (str): Invalid URI scheme. Required.
Source code in src/flowcean/polars/environments/uri.py
def __init__(self, scheme: str) -> None:
    """Initialize the InvalidUriSchemeError.

    Args:
        scheme: Invalid URI scheme.
    """
    super().__init__(
        f"only file URIs can be converted to a path, but got `{scheme}`",
    )

UnsupportedFileTypeError(suffix)

Bases: Exception

Exception raised when a file type is not supported.

Initialize the UnsupportedFileTypeError.

Parameters:

    suffix (str): File type suffix. Required.
Source code in src/flowcean/polars/environments/uri.py
def __init__(self, suffix: str) -> None:
    """Initialize the UnsupportedFileTypeError.

    Args:
        suffix: File type suffix.
    """
    super().__init__(f"file type `{suffix}` is not supported")

UriDataLoader(uri)

Bases: Dataset

DataLoader for files specified by a URI.

Initialize the UriDataLoader.

Parameters:

    uri (str): URI of the file to load. Required.
Source code in src/flowcean/polars/environments/uri.py
def __init__(self, uri: str) -> None:
    """Initialize the UriDataLoader.

    Args:
        uri: Path to the URI file.
    """
    path = _file_uri_to_path(uri)
    suffix = path.suffix
    if suffix == ".csv":
        data_loader = CsvDataLoader(path)
    elif suffix == ".parquet":
        data_loader = ParquetDataLoader(path)
    else:
        raise UnsupportedFileTypeError(suffix)
    super().__init__(data_loader.data)
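
A usage sketch, assuming the loader and its exceptions can be imported from flowcean.polars; the file URIs below are hypothetical:

    from flowcean.polars import UnsupportedFileTypeError, UriDataLoader  # assumed import path

    # The suffix selects the concrete loader: .csv -> CsvDataLoader, .parquet -> ParquetDataLoader.
    loader = UriDataLoader("file:///tmp/measurements.csv")

    try:
        UriDataLoader("file:///tmp/notes.txt")
    except UnsupportedFileTypeError as error:
        print(error)  # file type `.txt` is not supported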

YamlDataLoader(path)

Bases: Dataset

DataLoader for YAML files.

Initialize the YamlDataLoader.

Parameters:

    path (str | Path): Path to the YAML file. Required.
Source code in src/flowcean/polars/environments/yaml.py
def __init__(self, path: str | Path) -> None:
    """Initialize the YamlDataLoader.

    Args:
        path: Path to the YAML file.
    """
    data = pl.DataFrame(YAML(typ="safe").load(path))
    super().__init__(data)

Cast(target_type, *, features=None)

Bases: Transform

Cast features to a different datatype.

Initializes the Cast transform.

Parameters:

    target_type (PolarsDataType): Type to which the features will be cast. Required.
    features (Iterable[str] | None): The features to cast. If None (the default), all features will be cast.
Source code in src/flowcean/polars/transforms/cast.py
def __init__(
    self,
    target_type: PolarsDataType,
    *,
    features: Iterable[str] | None = None,
) -> None:
    """Initializes the Cast transform.

    Args:
        target_type: Type to which the features will be cast.
        features: The features to cast. If `None` all
            features will be cast. This is the default behaviour.
    """
    self.target_type = target_type
    self.features = features

Drop(features)

Bases: Transform

Drop features from the data.

Initializes the Drop transform.

Source code in src/flowcean/polars/transforms/drop.py
def __init__(self, features: str | Iterable[str]) -> None:
    """Initializes the Drop transform."""
    super().__init__()
    self.features = features

Explode(features)

Bases: Transform

Explodes a Dataframe to long format by exploding the given features.

Parameters:

    features (list[str]): List of features to explode. Required.

The example below shows the usage of an Explode transform in an experiment.yaml file. Assuming the loaded data is represented by the table:

time feature_a feature_b constant
[0, 1] [2, 1] [9, 3] 1
[0, 2] [3, 4] [8, 4] 2

This transform can be used to explode the columns time, feature_a, and feature_b.

The resulting Dataframe after the transform is:

time feature_a feature_b constant
0 2 9 1
1 1 3 1
0 3 8 2
2 4 4 2
Source code in src/flowcean/polars/transforms/explode.py
def __init__(self, features: list[str]) -> None:
    self.features = features
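
A programmatic sketch of the same example, assuming Explode can be imported from flowcean.polars and exposes the apply() method documented for the other transforms on this page:

    import polars as pl
    from flowcean.polars import Explode  # assumed import path

    data = pl.LazyFrame(
        {
            "time": [[0, 1], [0, 2]],
            "feature_a": [[2, 1], [3, 4]],
            "feature_b": [[9, 3], [8, 4]],
            "constant": [1, 2],
        },
    )
    exploded = Explode(features=["time", "feature_a", "feature_b"]).apply(data)
    print(exploded.collect())  # four rows, one per list element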

Filter(expression)

Bases: Transform

Filter an environment based on one or multiple expressions.

This transform allows filtering an environment based on one or multiple boolean expressions. Assuming the input environment is given by

t N x
1 10 0
2 12 1
3 5 2
4 15 1
5 17 0

The following transformation can be used to filter the environment so that the result contains only records where x=1:

    Filter("x == 1")

The result dataset after applying the transform will be

t N x
2 12 1
4 15 1

To get only records where x=1 and t > 3, the filter expression

Filter(And(["x == 1", "t > 3"]))

can be used.

To filter all records where x=1 and either t > 3 or N < 15, use

Filter(And(["x == 1", Or(["t > 3", "N < 15"])]))

Initializes the Filter transform.

Parameters:

    expression (str | FilterExpr): String or filter expression used to filter the environment. Records that do not match the expression are discarded. Standard comparison and mathematical operations are supported within the expressions. Features can be accessed by their name. Required.
Source code in src/flowcean/polars/transforms/filter.py
def __init__(
    self,
    expression: str | FilterExpr,
) -> None:
    """Initializes the Filter transform.

    Args:
        expression: String or filter expression used to filter the
            environment. Records that do not match the expression are
            discarded. Standard comparison and mathematical operations are
            supported within the expressions. Features can be accessed by
            there name.
    """
    if isinstance(expression, str):
        self.predicate = _str_to_pl(expression)
    else:
        self.predicate = expression()
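
A sketch of the examples above, assuming Filter and the And/Or expression helpers can be imported from flowcean.polars:

    import polars as pl
    from flowcean.polars import And, Filter, Or  # assumed import path

    data = pl.LazyFrame(
        {"t": [1, 2, 3, 4, 5], "N": [10, 12, 5, 15, 17], "x": [0, 1, 2, 1, 0]},
    )
    only_x1 = Filter("x == 1").apply(data)
    combined = Filter(And(["x == 1", Or(["t > 3", "N < 15"])])).apply(data)
    print(only_x1.collect())   # rows t=2 and t=4
    print(combined.collect())  # the same rows here, since each also satisfies t > 3 or N < 15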

FilterExpr

Bases: ABC

Expression to be used in a Filter transform.

get() abstractmethod

Get the polars expression for this filter.

Source code in src/flowcean/polars/transforms/filter.py
@abstractmethod
def get(self) -> pl.Expr:
    """Get the polars expression for this filter."""

FeatureLengthVaryError

Bases: Exception

Length of a feature varies over different rows.

Flatten(features=None)

Bases: Transform

Flatten all time series in a DataFrame to individual features.

The given DataFrame's time series are converted into individual features, with each time step creating a new feature. This transform will change the order of the columns in the resulting dataset.

For example, the dataset

series_data A B
{[0, 0], [1, 1], [2, 2]} 42 43
{[0, 3], [1, 4], [2, 5]} 44 45

gets flattened into the dataset

series_data_0 series_data_1 series_data_2 A B
0 1 2 42 43
3 4 5 44 45

Initialize the flatten transform.

Parameters:

    features (Iterable[str] | None): The features to flatten. If not provided or set to None, all possible features from the given dataframe will be flattened. Defaults to None.
Source code in src/flowcean/polars/transforms/flatten.py
def __init__(self, features: Iterable[str] | None = None) -> None:
    """Initialize the flatten transform.

    Args:
        features: The features to flatten. If not provided or set to None,
            all possible features from the given dataframe will be
            flattened.
    """
    self.features = features
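
A sketch, assuming Flatten can be imported from flowcean.polars; time series columns are lists of {time, value} structs, as described elsewhere on this page:

    import polars as pl
    from flowcean.polars import Flatten  # assumed import path

    data = pl.LazyFrame(
        {
            "series_data": [
                [{"time": 0, "value": 0}, {"time": 1, "value": 1}, {"time": 2, "value": 2}],
                [{"time": 0, "value": 3}, {"time": 1, "value": 4}, {"time": 2, "value": 5}],
            ],
            "A": [42, 44],
            "B": [43, 45],
        },
    )
    flattened = Flatten().apply(data)  # flatten all time series features
    print(flattened.collect())  # columns series_data_0 ... series_data_2, A, B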

NoTimeSeriesFeatureError

Bases: Exception

Feature is no time series.

Lambda(fn)

Bases: Transform

Apply a custom function to the data of an environment.

Initializes the Lambda transform.

Parameters:

    fn (Callable[[LazyFrame], LazyFrame]): Function handle to be applied to the data. Required.
Source code in src/flowcean/polars/transforms/function.py
def __init__(self, fn: Callable[[pl.LazyFrame], pl.LazyFrame]) -> None:
    """Initializes the Lambda transform.

    Args:
        fn: Function handle to be applied to the data.
    """
    self.fn = fn

FeatureNotFoundError(feature)

Bases: Exception

Feature not found in the DataFrame.

This exception is raised when a feature is not found in the DataFrame.

Source code in src/flowcean/polars/transforms/match_sampling_rate.py
def __init__(self, feature: str) -> None:
    super().__init__(f"{feature} not found")

MatchSamplingRate(reference_feature_name, feature_interpolation_map)

Bases: Transform

Matches the sampling rate of all time series in the DataFrame.

Interpolates the time series to match the sampling rate of the reference time series. The below example shows the usage of a MatchSamplingRate transform in a run.py file. Assuming the loaded data is represented by the table:

feature_a                   feature_b                   const
list[struct[time,struct[]]] list[struct[time,struct[]]] int
--------------------------- --------------------------- -----
[{12:26:01.0, {1.2}},       [{12:26:00.0, {1.0}},       1
 {12:26:02.0, {2.4}},        {12:26:05.0, {2.0}}]
 {12:26:03.0, {3.6}},
 {12:26:04.0, {4.8}}]

The following transform can be used to match the sampling rate of the time series feature_b to the sampling rate of the time series feature_a.

    ...
    environment.load()
    data = environment.get_data()
    transform = MatchSamplingRate(
        reference_feature_name="feature_a",
        feature_interpolation_map={
            "feature_b": "linear",
        },
    )
    transformed_data = transform.transform(data)
    ...

The resulting Dataframe after the transform is:

feature_a                   feature_b                   const
list[struct[time,struct[]]] list[struct[time,struct[]]] int
--------------------------- --------------------------- -----
[{12:26:01.0, {1.2}},       [{12:26:01.0, {1.2}},       1
 {12:26:02.0, {2.4}},        {12:26:02.0, {1.4}},
 {12:26:03.0, {3.6}},        {12:26:03.0, {1.6}},
 {12:26:04.0, {4.8}}]        {12:26:04.0, {1.8}}]

Initialize the transform.

Parameters:

    reference_feature_name (str): Reference time series feature. Required.
    feature_interpolation_map (dict[str, MatchSamplingRateMethod]): Key-value pairs mapping each time series feature to interpolate to the interpolation method to use. At the moment, the only supported interpolation method is 'linear'. Required.
Source code in src/flowcean/polars/transforms/match_sampling_rate.py
def __init__(
    self,
    reference_feature_name: str,
    feature_interpolation_map: dict[str, MatchSamplingRateMethod],
) -> None:
    """Initialize the transform.

    Args:
        reference_feature_name: Reference timeseries feature.
        feature_interpolation_map: Key-value pairs of the timeseries
            features that are targeted in interpolation columns and the
            interpolation method to use. At the moment, the interpolation
            method can only be 'linear'.
    """
    self.reference_feature_name = reference_feature_name
    self.feature_interpolation_map = feature_interpolation_map

apply(data)

Transform the input DataFrame.

Parameters:

    data (LazyFrame): Input DataFrame. Required.

Returns:

    LazyFrame: Transformed DataFrame.

Source code in src/flowcean/polars/transforms/match_sampling_rate.py
def apply(self, data: pl.LazyFrame) -> pl.LazyFrame:
    """Transform the input DataFrame.

    Args:
        data: Input DataFrame.

    Returns:
        Transformed DataFrame.

    """
    # preserve all constant columns that are not timeseries data
    transformed_data = pl.DataFrame()
    collected_data = data.collect()
    for i in range(len(collected_data.rows())):
        transformed_data_slice = self._transform_row(
            collected_data.slice(i, 1),
        )
        transformed_data = transformed_data.vstack(transformed_data_slice)
    return transformed_data.lazy()

UnknownInterpolationError(interpolation_method)

Bases: Exception

Interpolation method is not implemented yet.

This exception is raised when the requested interpolation method is not implemented.

Source code in src/flowcean/polars/transforms/match_sampling_rate.py
def __init__(self, interpolation_method: str) -> None:
    super().__init__(f"{interpolation_method} not found")

OneCold(feature_categories, *, check_for_missing_categories=False)

Bases: Transform

Transforms integer features into a set of binary one-cold features.

Transforms integer features into a set of binary one-cold features. The original integer features are dropped and are not part of the resulting data frame.

As an example consider the following data

feature
0
1
2
1
5

When the one-cold transformation is applied, the result is as follows

feature_0 feature_1 feature_2 feature_5
0 1 1 1
1 0 1 1
1 1 0 1
1 0 1 1
1 1 1 0

In the default configuration, missing categories are ignored; their respective entries will all be one. If you want to enforce that each data entry belongs to a known category, set the check_for_missing_categories flag to true when constructing a One-Cold transform. In that case, if an unknown value is found which does not belong to any category, a NoMatchingCategoryError is thrown. This check has an impact on performance and will slow down the transform.

If you want to enable this check, create the transform as follows:

    transform = OneCold(
        feature_categories={"feature": [0, 1, 2, 5]},
        check_for_missing_categories=True,
    )

Initializes the One-Cold transform.

Parameters:

    feature_categories (dict[str, list[Any]]): Dictionary of features and a list of categorical values to encode for each. Required.
    check_for_missing_categories (bool): If set to true, a check is performed to see if all values belong to a category. If an unknown value is found which does not belong to any category, a NoMatchingCategoryError is thrown. To perform this check, the dataframe must be materialised, resulting in a potential performance decrease. Therefore it defaults to false.
Source code in src/flowcean/polars/transforms/one_cold.py
def __init__(
    self,
    feature_categories: dict[str, list[Any]],
    *,
    check_for_missing_categories: bool = False,
) -> None:
    """Initializes the One-Hot transform.

    Args:
        feature_categories: Dictionary of features and a list of
            categorical values to encode for each.
        check_for_missing_categories: If set to true, a check is performed
            to see if all values belong to a category. If an unknown value
            is found which does not belong to any category, a
            NoMatchingCategoryError is thrown. To perform this check, the
            dataframe must be materialised, resulting in a potential
            performance decrease. Therefore it defaults to false.
    """
    self.feature_category_mapping = {
        feature: {f"{feature}_{value}": value for value in values}
        for feature, values in feature_categories.items()
    }
    self.check_for_missing_categories = check_for_missing_categories

apply(data)

Transform data with this one-cold transformation.

Transform data with this one-cold transformation and return the resulting dataframe.

Parameters:

    data (LazyFrame): The data to transform. Required.

Returns:

    LazyFrame: The transformed data.

Source code in src/flowcean/polars/transforms/one_cold.py
@override
def apply(
    self,
    data: pl.LazyFrame,
) -> pl.LazyFrame:
    """Transform data with this one hot transformation.

    Transform data with this one hot transformation and return the
    resulting dataframe.

    Args:
        data: The data to transform.

    Returns:
        The transformed data.
    """
    if len(self.feature_category_mapping) == 0:
        raise NoCategoriesError
    for (
        feature,
        category_mappings,
    ) in self.feature_category_mapping.items():
        data = data.with_columns(
            [
                pl.col(feature).ne(value).cast(pl.Int64).alias(name)
                for name, value in category_mappings.items()
            ],
        ).drop(feature)

        # Check only for missing categories if the user has requested it
        if self.check_for_missing_categories and (
            not data.select(
                [
                    pl.col(name).cast(pl.Boolean)
                    for name in category_mappings
                ],
            )  # Get the new crated on-cold feature columns
            .select(
                # Check if all on-cold features are true
                # That's only the case if the category is missing
                pl.all_horizontal(
                    pl.all(),
                ).all(),  # Combine the results for all data entries ...
            )
            .collect(streaming=True)
            # ... and get the final result.
            # If it is false, there is a missing category
            .item(0, 0)
        ):
            raise NoMatchingCategoryError
    return data

from_dataframe(data, features, *, check_for_missing_categories=False) classmethod

Creates a new one-cold transformation based on sample data.

Parameters:

    data (DataFrame): A dataframe containing sample data for determining the categories of the transform. Required.
    features (Iterable[str]): Names of the features for which the one-cold transformation will determine the categories. Required.
    check_for_missing_categories (bool): If set to true, a check is performed to see if all values belong to a category. If an unknown value is found which does not belong to any category, a NoMatchingCategoryError is thrown. To perform this check, the dataframe must be materialised, resulting in a potential performance decrease. Therefore it defaults to false.
Source code in src/flowcean/polars/transforms/one_cold.py
@classmethod
def from_dataframe(
    cls,
    data: pl.DataFrame,
    features: Iterable[str],
    *,
    check_for_missing_categories: bool = False,
) -> Self:
    """Creates a new one-hot transformation based on sample data.

    Args:
        data: A dataframe containing sample data for determining the
            categories of the transform.
        features: Name of the features for which the one hot transformation
            will determine the categories.
        check_for_missing_categories: If set to true, a check is performed
            to see if all values belong to a category. If an unknown value
            is found which does not belong to any category, a
            NoMatchingCategoryError is thrown. To perform this check, the
            dataframe must be materialised, resulting in a potential
            performance decrease. Therefore it defaults to false.
    """
    # Derive categories from the data frame
    feature_categories: dict[str, list[Any]] = {}
    for feature in features:
        if data.schema[feature].is_float():
            logger.warning(
                (
                    "Feature %s is of type float. Applying a one-cold",
                    "transform to it may produce undesired results.",
                    "Check your datatypes and transforms.",
                ),
                feature,
            )
        feature_categories[feature] = (
            data.select(pl.col(feature).unique()).to_series().to_list()
        )
    return cls(
        feature_categories,
        check_for_missing_categories=check_for_missing_categories,
    )

OneHot(feature_categories, *, check_for_missing_categories=False)

Bases: Transform

Transforms integer features into a set of binary one-hot features.

Transforms integer features into a set of binary one-hot features. The original integer features are dropped and are not part of the resulting data frame.

As an example consider the following data

feature
0
1
2
1
5

When the one-hot transformation is applied, the result is as follows

feature_0 feature_1 feature_2 feature_5
1 0 0 0
0 1 0 0
0 0 1 0
0 1 0 0
0 0 0 1

Initializes the One-Hot transform.

Parameters:

    feature_categories (dict[str, list[Any]]): Dictionary of features and a list of categorical values to encode for each. Required.
    check_for_missing_categories (bool): If set to true, a check is performed to see if all values belong to a category. If an unknown value is found which does not belong to any category, a NoMatchingCategoryError is thrown. To perform this check, the dataframe must be materialised, resulting in a potential performance decrease. Therefore it defaults to false.
Source code in src/flowcean/polars/transforms/one_hot.py
def __init__(
    self,
    feature_categories: dict[str, list[Any]],
    *,
    check_for_missing_categories: bool = False,
) -> None:
    """Initializes the One-Hot transform.

    Args:
        feature_categories: Dictionary of features and a list of
            categorical values to encode for each.
        check_for_missing_categories: If set to true, a check is performed
            to see if all values belong to a category. If an unknown value
            is found which does not belong to any category, a
            NoMatchingCategoryError is thrown. To perform this check, the
            dataframe must be materialised, resulting in a potential
            performance decrease. Therefore it defaults to false.
    """
    self.feature_category_mapping = {
        feature: {f"{feature}_{value}": value for value in values}
        for feature, values in feature_categories.items()
    }
    self.check_for_missing_categories = check_for_missing_categories

apply(data)

Transform data with this one hot transformation.

Transform data with this one hot transformation and return the resulting dataframe.

Parameters:

    data (LazyFrame): The data to transform. Required.

Returns:

    LazyFrame: The transformed data.

Source code in src/flowcean/polars/transforms/one_hot.py
@override
def apply(
    self,
    data: pl.LazyFrame,
) -> pl.LazyFrame:
    """Transform data with this one hot transformation.

    Transform data with this one hot transformation and return the
    resulting dataframe.

    Args:
        data: The data to transform.

    Returns:
        The transformed data.
    """
    if len(self.feature_category_mapping) == 0:
        raise NoCategoriesError
    for (
        feature,
        category_mappings,
    ) in self.feature_category_mapping.items():
        data = data.with_columns(
            [
                pl.col(feature).eq(value).cast(pl.Int64).alias(name)
                for name, value in category_mappings.items()
            ],
        ).drop(feature)

        if self.check_for_missing_categories and (
            not data.select(
                [
                    pl.col(name).cast(pl.Boolean)
                    for name in category_mappings
                ],
            )
            .select(pl.any_horizontal(pl.all()).all())
            .collect(streaming=True)
            .item(0, 0)
        ):
            raise NoMatchingCategoryError
    return data

from_dataframe(data, features, *, check_for_missing_categories=False) classmethod

Creates a new one-hot transformation based on sample data.

Parameters:

    data (LazyFrame): A dataframe containing sample data for determining the categories of the transform. Required.
    features (Iterable[str]): Names of the features for which the one-hot transformation will determine the categories. Required.
    check_for_missing_categories (bool): If set to true, a check is performed to see if all values belong to a category. If an unknown value is found which does not belong to any category, a NoMatchingCategoryError is thrown. To perform this check, the dataframe must be materialised, resulting in a potential performance decrease. Therefore it defaults to false.
Source code in src/flowcean/polars/transforms/one_hot.py
@classmethod
def from_dataframe(
    cls,
    data: pl.LazyFrame,
    features: Iterable[str],
    *,
    check_for_missing_categories: bool = False,
) -> Self:
    """Creates a new one-hot transformation based on sample data.

    Args:
        data: A dataframe containing sample data for determining the
            categories of the transform.
        features: Name of the features for which the one hot transformation
            will determine the categories.
        check_for_missing_categories: If set to true, a check is performed
            to see if all values belong to a category. If an unknown value
            is found which does not belong to any category, a
            NoMatchingCategoryError is thrown. To perform this check, the
            dataframe must be materialised, resulting in a potential
            performance decrease. Therefore it defaults to false.
    """
    # Derive categories from the data frame
    feature_categories: dict[str, list[Any]] = {}
    for feature in features:
        if data.schema[feature].is_float():
            logger.warning(
                (
                    "Feature %s is of type float. Applying a one-hot",
                    "transform to it may produce undesired results.",
                    "Check your datatypes and transforms.",
                ),
                feature,
            )
        feature_categories[feature] = (
            data.select(pl.col(feature).unique())
            .collect(streaming=True)
            .to_series()
            .to_list()
        )
    return cls(
        feature_categories,
        check_for_missing_categories=check_for_missing_categories,
    )
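
A sketch combining from_dataframe with apply, assuming OneHot can be imported from flowcean.polars:

    import polars as pl
    from flowcean.polars import OneHot  # assumed import path

    data = pl.LazyFrame({"feature": [0, 1, 2, 1, 5]})
    transform = OneHot.from_dataframe(data, features=["feature"])
    print(transform.apply(data).collect())  # columns feature_0, feature_1, feature_2, feature_5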

Rename(mapping)

Bases: Transform

Rename features in an environment.

Initializes the Rename transform.

Parameters:

    mapping (dict[str, str]): Key-value pairs that map from the old feature name to the new one. Required.
Source code in src/flowcean/polars/transforms/rename.py
def __init__(self, mapping: dict[str, str]) -> None:
    """Initializes the Rename transform.

    Args:
        mapping: Key value pairs that map from the old feature name to the
            new one.
    """
    self.mapping = mapping

Resample(sampling_rate, *, interpolation_method='linear')

Bases: Transform

Resample time series features to a given sampling rate.

Initializes the Resample transform.

Parameters:

    sampling_rate (float | dict[str, float]): Target sampling rate for time series features. If a float is provided, all possible time series features will be resampled. Alternatively, a dictionary can be provided where the key is the feature and the value is the target sample rate. Required.
    interpolation_method (InterpolationMethod): The interpolation method to use. Supported are "linear" and "cubic", with the default being "linear".
Source code in src/flowcean/polars/transforms/resample.py
def __init__(
    self,
    sampling_rate: float | dict[str, float],
    *,
    interpolation_method: InterpolationMethod = "linear",
) -> None:
    """Initializes the Resample transform.

    Args:
        sampling_rate: Target sampling rate for time series features. If a
            float is provided, all possible time series features will be
            resampled. Alternatively, a dictionary can be provided where
            the key is the feature and the value is the target sample rate.
        interpolation_method: The interpolation method to use. Supported
            are "linear" and "cubic", with the default being
            "linear".
    """
    self.sampling_rate = sampling_rate
    self.interpolation_method = interpolation_method

Select(features)

Bases: Transform

Selects a subset of features from the data.

Initializes the Select transform.

Parameters:

    features (IntoExpr | Iterable[IntoExpr]): The features to select. Treats the selection as a parameter to polars' select method. You can use regular expressions by wrapping the argument in ^ and $. Required.
Source code in src/flowcean/polars/transforms/select.py
def __init__(self, features: IntoExpr | Iterable[IntoExpr]) -> None:
    """Initializes the Select transform.

    Args:
        features: The features to select. Treats the selection as a
            parameter to polars `select` method. You can use regular
            expressions by wrapping the argument by ^ and $.
    """
    self.features = features

SignalFilter(features, filter_type, filter_frequency, *, order=5)

Bases: Transform

Applies a Butterworth filter to time series features.

Applies a Butterworth lowpass or highpass filter to time series features. For this transform to work, the time series must already have a uniform sampling rate. Use a Resample transform to uniformly sample the points of a time series.

Initializes the Filter transform.

Parameters:

    features (Iterable[str]): Features that shall be filtered. Required.
    filter_type (SignalFilterType): Type of the filter to apply. Valid options are "lowpass" and "highpass". Required.
    filter_frequency (float): Characteristic frequency of the filter in Hz. For high- and lowpass this is the cutoff frequency. Required.
    order (int): Order of the Butterworth filter to use. Defaults to 5.
Source code in src/flowcean/polars/transforms/signal_filter.py
def __init__(
    self,
    features: Iterable[str],
    filter_type: SignalFilterType,
    filter_frequency: float,
    *,
    order: int = 5,
) -> None:
    """Initializes the Filter transform.

    Args:
        features: Features that shall be filtered.
        filter_type: Type of the filter to apply. Valid options are
            "lowpass" and "highpass".
        filter_frequency: Characteristic frequency of the filter in Hz. For
            high- and lowpass this is the cutoff frequency.
        order: Order of the Butterworth filter to uses. Defaults to 5.
    """
    self.features = features
    self.filter_type = filter_type
    self.frequency = filter_frequency
    self.order = order

SlidingWindow(window_size)

Bases: Transform

Transforms the data with a sliding window.

The sliding window transform transforms the data by creating a sliding window over the row dimension. For each window position, a new column is created for each column in the original data; the new columns are named by appending the index of the row within the sliding window to the original column name. As an example, consider the following data:

x y z
1 10 100
2 20 200
3 30 300
4 40 400
5 50 500

If we apply a sliding window with a window size of 3, we get the following

x_0 y_0 z_0 x_1 y_1 z_1 x_2 y_2 z_2
1 10 100 2 20 200 3 30 300
2 20 200 3 30 300 4 40 400
3 30 300 4 40 400 5 50 500

Parameters:

    window_size (int): Size of the sliding window. Required.
Source code in src/flowcean/polars/transforms/sliding_window.py
def __init__(self, window_size: int) -> None:
    self.window_size = window_size
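
A sketch reproducing the example above, assuming SlidingWindow can be imported from flowcean.polars:

    import polars as pl
    from flowcean.polars import SlidingWindow  # assumed import path

    data = pl.LazyFrame(
        {
            "x": [1, 2, 3, 4, 5],
            "y": [10, 20, 30, 40, 50],
            "z": [100, 200, 300, 400, 500],
        },
    )
    windowed = SlidingWindow(window_size=3).apply(data)
    print(windowed.collect())  # three rows with columns x_0, y_0, z_0, ..., x_2, y_2, z_2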

Standardize(mean=None, std=None) dataclass

Bases: Transform, FitOnce

Standardize features by removing the mean and scaling to unit variance.

A sample \(x\) is standardized as:

\[ z = \frac{x - \mu}{\sigma} \]

where

  • \(\mu\) is the mean of the samples
  • \(\sigma\) is the standard deviation of the samples.

Attributes:

    mean (dict[str, float] | None): The mean \(\mu\) of each feature.
    std (dict[str, float] | None): The standard deviation \(\sigma\) of each feature.
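
The same computation expressed directly in polars, as a sketch of the math only (not of this class's fit/apply API):

    import polars as pl

    data = pl.DataFrame({"x": [1.0, 2.0, 3.0, 4.0]})
    standardized = data.select(
        (pl.col("x") - pl.col("x").mean()) / pl.col("x").std(),
    )
    # mean 2.5, std ~1.29 -> z approximately [-1.16, -0.39, 0.39, 1.16]
    print(standardized)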

TimeWindow(*, features=None, time_start=0.0, time_end=math.inf)

Bases: Transform

Limit time series to a certain time window.

Initializes the TimeWindow transform.

Parameters:

    features (Iterable[str] | None): The features to apply this transformation to. If None, all applicable features will be affected. Defaults to None.
    time_start (float): Window start time. Defaults to zero. All data before this time will be removed from the time series when applying the transform.
    time_end (float): Window end time. Defaults to infinity. All data after this time will be removed from the time series when applying the transform.
Source code in src/flowcean/polars/transforms/time_window.py
def __init__(
    self,
    *,
    features: Iterable[str] | None = None,
    time_start: float = 0.0,
    time_end: float = math.inf,
) -> None:
    """Initializes the TimeWindow transform.

    Args:
        features: The features to apply this transformation to. If `None`,
            all applicable features will be affected.
        time_start: Window start time. Defaults to zero. All data before
            this time will be removed from the time series when applying
            the transform.
        time_end: Window end time. Defaults to infinite. All data after
            this time will be removed from the time series when applying
            the transform.
    """
    self.features = features
    self.t_start = time_start
    self.t_end = time_end

collect(environment, n=None, *, progress_bar=True)

Collect data from an environment.

Parameters:

    environment (Iterable[LazyFrame] | Collection[LazyFrame]): The environment to collect data from. Required.
    n (int | None): Number of samples to collect. If None, all samples are collected. Defaults to None.
    progress_bar (bool | dict[str, Any]): Whether to show a progress bar. If a dictionary is provided, it will be passed to the progress bar. Defaults to True.

Returns:

    Dataset: The collected dataset.

Source code in src/flowcean/polars/environments/dataset.py
def collect(
    environment: Iterable[pl.LazyFrame] | Collection[pl.LazyFrame],
    n: int | None = None,
    *,
    progress_bar: bool | dict[str, Any] = True,
) -> Dataset:
    """Collect data from an environment.

    Args:
        environment: The environment to collect data from.
        n: Number of samples to collect. If None, all samples are collected.
        progress_bar: Whether to show a progress bar. If a dictionary is
            provided, it will be passed to the progress bar.

    Returns:
        The collected dataset.
    """
    samples = islice(environment, n)

    if n is not None:
        total = n
    elif isinstance(environment, Collection):
        total = len(environment)
    else:
        total = None

    if isinstance(progress_bar, dict):
        progress_bar.setdefault("desc", "Collecting samples")
        progress_bar.setdefault("total", total)
        samples = tqdm(
            samples,
            **progress_bar,
        )
    elif progress_bar:
        samples = tqdm(samples, desc="Collecting samples", total=total)

    data = pl.concat(samples, how="vertical")
    return Dataset(data)
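
A sketch, assuming collect can be imported from flowcean.polars; any iterable of LazyFrames works as the environment:

    import polars as pl
    from flowcean.polars import collect  # assumed import path

    batches = [pl.LazyFrame({"x": [1, 2]}), pl.LazyFrame({"x": [3, 4]})]
    dataset = collect(batches, progress_bar=False)
    print(len(dataset))  # 4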

is_timeseries_feature(df, name)

Check if the given column is a time series feature.

A time series feature contains a list of structs with fields time and value.

Parameters:

    df (LazyFrame): The DataFrame to check. Required.
    name (str): The column to check. Required.

Returns:

    bool: True if the column is a time series feature, False otherwise.

Source code in src/flowcean/polars/is_time_series.py
def is_timeseries_feature(df: pl.LazyFrame, name: str) -> bool:
    """Check if the given column is a time series feature.

    A time series feature contains a list of structs with fields _time_ and
    _value_.

    Args:
        df: The DataFrame to check.
        name: The column to check.

    Returns:
        True if the column is a time series feature, False otherwise.
    """
    data_type = df.select(name).collect_schema().dtypes()[0]

    if data_type.base_type() != pl.List:
        return False

    inner_type: pl.DataType = cast(pl.DataType, cast(pl.List, data_type).inner)
    if inner_type.base_type() != pl.Struct:
        return False

    field_names = [field.name for field in cast(pl.Struct, inner_type).fields]
    return "time" in field_names and "value" in field_names