107 lines
3.4 KiB
Python
107 lines
3.4 KiB
Python
from __future__ import annotations
|
|
|
|
from typing import TYPE_CHECKING
|
|
|
|
import dask.dataframe as dd
|
|
|
|
if TYPE_CHECKING:
|
|
from typing_extensions import Self
|
|
|
|
from narwhals._dask.expr import DaskExpr
|
|
|
|
|
|
class DaskExprStringNamespace:
|
|
def __init__(self: Self, expr: DaskExpr) -> None:
|
|
self._compliant_expr = expr
|
|
|
|
def len_chars(self: Self) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(lambda _input: _input.str.len(), "len")
|
|
|
|
def replace(
|
|
self: Self, pattern: str, value: str, *, literal: bool, n: int
|
|
) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input, pattern, value, literal, n: _input.str.replace(
|
|
pattern, value, regex=not literal, n=n
|
|
),
|
|
"replace",
|
|
pattern=pattern,
|
|
value=value,
|
|
literal=literal,
|
|
n=n,
|
|
)
|
|
|
|
def replace_all(self: Self, pattern: str, value: str, *, literal: bool) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input, pattern, value, literal: _input.str.replace(
|
|
pattern, value, n=-1, regex=not literal
|
|
),
|
|
"replace",
|
|
pattern=pattern,
|
|
value=value,
|
|
literal=literal,
|
|
)
|
|
|
|
def strip_chars(self: Self, characters: str | None) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input, characters: _input.str.strip(characters),
|
|
"strip",
|
|
characters=characters,
|
|
)
|
|
|
|
def starts_with(self: Self, prefix: str) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input, prefix: _input.str.startswith(prefix),
|
|
"starts_with",
|
|
prefix=prefix,
|
|
)
|
|
|
|
def ends_with(self: Self, suffix: str) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input, suffix: _input.str.endswith(suffix), "ends_with", suffix=suffix
|
|
)
|
|
|
|
def contains(self: Self, pattern: str, *, literal: bool) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input, pattern, literal: _input.str.contains(
|
|
pat=pattern, regex=not literal
|
|
),
|
|
"contains",
|
|
pattern=pattern,
|
|
literal=literal,
|
|
)
|
|
|
|
def slice(self: Self, offset: int, length: int | None) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input, offset, length: _input.str.slice(
|
|
start=offset, stop=offset + length if length else None
|
|
),
|
|
"slice",
|
|
offset=offset,
|
|
length=length,
|
|
)
|
|
|
|
def split(self: Self, by: str) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input, by: _input.str.split(pat=by),
|
|
"split",
|
|
by=by,
|
|
)
|
|
|
|
def to_datetime(self: Self, format: str | None) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input, format: dd.to_datetime(_input, format=format),
|
|
"to_datetime",
|
|
format=format,
|
|
)
|
|
|
|
def to_uppercase(self: Self) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input: _input.str.upper(), "to_uppercase"
|
|
)
|
|
|
|
def to_lowercase(self: Self) -> DaskExpr:
|
|
return self._compliant_expr._with_callable(
|
|
lambda _input: _input.str.lower(), "to_lowercase"
|
|
)
|