Skip to content

Commit

Permalink
first use of ak.str
Browse files Browse the repository at this point in the history
  • Loading branch information
douglasdavis committed Sep 6, 2023
1 parent 6716eea commit 8925f22
Show file tree
Hide file tree
Showing 4 changed files with 44 additions and 0 deletions.
1 change: 1 addition & 0 deletions src/dask_awkward/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@
import dask_awkward.lib.operations as operations
import dask_awkward.lib.optimize as optimize
import dask_awkward.lib.reducers as reducers
import dask_awkward.lib.str as str
import dask_awkward.lib.structure as structure
from dask_awkward.lib.core import Array, PartitionCompatibility, Record, Scalar
from dask_awkward.lib.core import _type as type
Expand Down
1 change: 1 addition & 0 deletions src/dask_awkward/lib/__init__.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
import dask_awkward.lib.str as str
from dask_awkward.lib.core import Array, PartitionCompatibility, Record, Scalar
from dask_awkward.lib.core import _type as type
from dask_awkward.lib.core import (
Expand Down
20 changes: 20 additions & 0 deletions src/dask_awkward/lib/str.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,20 @@
from __future__ import annotations

import awkward as ak

from dask_awkward.lib.core import Array, map_partitions


def split_whitespace(
    array: Array,
    *,
    max_splits: int | None = None,
    reverse: bool = False,
    highlevel: bool = True,
    behavior: dict | None = None,
) -> Array:
    """Split the strings of a dask-awkward collection on whitespace.

    Applies ``ak.str.split_whitespace`` to each partition of ``array``
    through ``map_partitions``.

    Parameters
    ----------
    array : Array
        The dask-awkward collection to operate on.
    max_splits : int, optional
        Forwarded unchanged to ``ak.str.split_whitespace``.
    reverse : bool
        Forwarded unchanged to ``ak.str.split_whitespace``.
    highlevel : bool
        Must be ``True``. It is never forwarded to the awkward function;
        it exists only so the signature mirrors the upstream one.
    behavior : dict, optional
        Forwarded unchanged to ``ak.str.split_whitespace``.

    Returns
    -------
    Array
        The collection produced by ``map_partitions``.

    Raises
    ------
    ValueError
        If ``highlevel`` is false.

    """
    # Reject the option loudly instead of silently ignoring it: a caller
    # asking for a low-level layout would otherwise get a high-level
    # collection back with no indication that the request was dropped.
    if not highlevel:
        raise ValueError("Only highlevel=True is supported")

    return map_partitions(
        ak.str.split_whitespace,
        array,
        max_splits=max_splits,
        reverse=reverse,
        behavior=behavior,
    )
22 changes: 22 additions & 0 deletions tests/test_str.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,22 @@
from __future__ import annotations

import awkward as ak

import dask_awkward as dak
from dask_awkward.lib.testutils import assert_eq


def test_split_whitespace():
    """Check dak.str.split_whitespace against ak.str.split_whitespace.

    The same nested string data is split eagerly with awkward and lazily
    with dask-awkward (two partitions); both the split results and the
    per-string piece counts along axis 2 are compared.
    """
    # Fixture mixes space and tab separators, an empty string, and
    # strings containing no whitespace at all.
    rows = [
        ["abc 123", "fooo ooo", "123"],
        ["hij\tj"],
        ["lmn op", ""],
        ["123 456 789", "98765 43210"],
    ]
    eager = ak.Array(rows)
    lazy = dak.from_awkward(eager, npartitions=2)

    expected = ak.str.split_whitespace(eager)
    result = dak.str.split_whitespace(lazy)

    assert_eq(expected, result)

    # Number of pieces each individual string was split into.
    expected_counts = ak.num(expected, axis=2)
    result_counts = ak.num(result, axis=2)
    assert_eq(expected_counts, result_counts)

0 comments on commit 8925f22

Please sign in to comment.