-
Notifications
You must be signed in to change notification settings - Fork 917
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Migrate reshape.pxd to pylibcudf (#15827)
xref #15162 Authors: - Thomas Li (https://github.com/lithomas1) Approvers: - Matthew Roeschke (https://github.com/mroeschke) - Vyas Ramasubramani (https://github.com/vyasr) URL: #15827
- Loading branch information
Showing
9 changed files
with
147 additions
and
24 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,6 @@ | ||
======= | ||
reshape | ||
======= | ||
|
||
.. automodule:: cudf._lib.pylibcudf.reshape | ||
:members: |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -27,6 +27,7 @@ set(cython_sources | |
merge.pyx | ||
reduce.pyx | ||
replace.pyx | ||
reshape.pyx | ||
rolling.pyx | ||
scalar.pyx | ||
search.pyx | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -13,6 +13,7 @@ from . cimport ( | |
merge, | ||
reduce, | ||
replace, | ||
reshape, | ||
rolling, | ||
search, | ||
sorting, | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -13,6 +13,7 @@ | |
merge, | ||
reduce, | ||
replace, | ||
reshape, | ||
rolling, | ||
search, | ||
sorting, | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,11 @@ | ||
# Copyright (c) 2024, NVIDIA CORPORATION. | ||
|
||
from cudf._lib.pylibcudf.libcudf.types cimport size_type | ||
|
||
from .column cimport Column | ||
from .scalar cimport Scalar | ||
from .table cimport Table | ||
|
||
|
||
cpdef Column interleave_columns(Table source_table) | ||
cpdef Table tile(Table source_table, size_type count) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,65 @@ | ||
# Copyright (c) 2024, NVIDIA CORPORATION. | ||
|
||
from libcpp.memory cimport unique_ptr | ||
from libcpp.utility cimport move | ||
|
||
from cudf._lib.pylibcudf.libcudf.column.column cimport column | ||
from cudf._lib.pylibcudf.libcudf.reshape cimport ( | ||
interleave_columns as cpp_interleave_columns, | ||
tile as cpp_tile, | ||
) | ||
from cudf._lib.pylibcudf.libcudf.table.table cimport table | ||
from cudf._lib.pylibcudf.libcudf.types cimport size_type | ||
|
||
from .column cimport Column | ||
from .table cimport Table | ||
|
||
|
||
cpdef Column interleave_columns(Table source_table): | ||
"""Interleave columns of a table into a single column. | ||
Converts the column major table `input` into a row major column. | ||
Example: | ||
in = [[A1, A2, A3], [B1, B2, B3]] | ||
return = [A1, B1, A2, B2, A3, B3] | ||
Parameters | ||
---------- | ||
source_table: Table | ||
The input table to interleave | ||
Returns | ||
------- | ||
Column | ||
A new column which is the result of interleaving the input columns | ||
""" | ||
cdef unique_ptr[column] c_result | ||
|
||
with nogil: | ||
c_result = move(cpp_interleave_columns(source_table.view())) | ||
|
||
return Column.from_libcudf(move(c_result)) | ||
|
||
|
||
cpdef Table tile(Table source_table, size_type count): | ||
"""Repeats the rows from input table count times to form a new table. | ||
Parameters | ||
---------- | ||
source_table: Table | ||
The input table containing rows to be repeated | ||
count: size_type | ||
The number of times to tile "rows". Must be non-negative | ||
Returns | ||
------- | ||
Table | ||
The table containing the tiled "rows" | ||
""" | ||
cdef unique_ptr[table] c_result | ||
|
||
with nogil: | ||
c_result = move(cpp_tile(source_table.view(), count)) | ||
|
||
return Table.from_libcudf(move(c_result)) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,43 @@ | ||
# Copyright (c) 2024, NVIDIA CORPORATION. | ||
|
||
import pyarrow as pa | ||
import pytest | ||
from utils import assert_column_eq, assert_table_eq | ||
|
||
from cudf._lib import pylibcudf as plc | ||
|
||
|
||
@pytest.fixture(scope="module") | ||
def reshape_data(): | ||
data = [[1, 2, 3], [4, 5, 6]] | ||
return data | ||
|
||
|
||
@pytest.fixture(scope="module") | ||
def reshape_plc_tbl(reshape_data): | ||
arrow_tbl = pa.Table.from_arrays(reshape_data, names=["a", "b"]) | ||
plc_tbl = plc.interop.from_arrow(arrow_tbl) | ||
return plc_tbl | ||
|
||
|
||
def test_interleave_columns(reshape_data, reshape_plc_tbl): | ||
res = plc.reshape.interleave_columns(reshape_plc_tbl) | ||
|
||
interleaved_data = [pa.array(pair) for pair in zip(*reshape_data)] | ||
|
||
expect = pa.concat_arrays(interleaved_data) | ||
|
||
assert_column_eq(res, expect) | ||
|
||
|
||
@pytest.mark.parametrize("cnt", [0, 1, 3]) | ||
def test_tile(reshape_data, reshape_plc_tbl, cnt): | ||
res = plc.reshape.tile(reshape_plc_tbl, cnt) | ||
|
||
tiled_data = [pa.array(col * cnt) for col in reshape_data] | ||
|
||
expect = pa.Table.from_arrays( | ||
tiled_data, schema=plc.interop.to_arrow(reshape_plc_tbl).schema | ||
) | ||
|
||
assert_table_eq(res, expect) |