Path: blob/main/py-polars/tests/unit/functions/test_concat.py
6939 views
import pytest12import polars as pl3from polars.testing import assert_frame_equal456@pytest.mark.may_fail_cloud # reason: @serialize-stack-overflow7@pytest.mark.slow8def test_concat_expressions_stack_overflow() -> None:9n = 1000010e = pl.concat([pl.lit(x) for x in range(n)])1112df = pl.select(e)13assert df.shape == (n, 1)141516@pytest.mark.may_fail_cloud # reason: @serialize-stack-overflow17@pytest.mark.slow18def test_concat_lf_stack_overflow() -> None:19n = 100020bar = pl.DataFrame({"a": 0}).lazy()2122for i in range(n):23bar = pl.concat([bar, pl.DataFrame({"a": i}).lazy()])24assert bar.collect().shape == (1001, 1)252627def test_concat_vertically_relaxed() -> None:28a = pl.DataFrame(29data={"a": [1, 2, 3], "b": [True, False, None]},30schema={"a": pl.Int8, "b": pl.Boolean},31)32b = pl.DataFrame(33data={"a": [43, 2, 3], "b": [32, 1, None]},34schema={"a": pl.Int16, "b": pl.Int64},35)36out = pl.concat([a, b], how="vertical_relaxed")37assert out.schema == {"a": pl.Int16, "b": pl.Int64}38assert out.to_dict(as_series=False) == {39"a": [1, 2, 3, 43, 2, 3],40"b": [1, 0, None, 32, 1, None],41}42out = pl.concat([b, a], how="vertical_relaxed")43assert out.schema == {"a": pl.Int16, "b": pl.Int64}44assert out.to_dict(as_series=False) == {45"a": [43, 2, 3, 1, 2, 3],46"b": [32, 1, None, 1, 0, None],47}4849c = pl.DataFrame({"a": [1, 2], "b": [2, 1]})50d = pl.DataFrame({"a": [1.0, 0.2], "b": [None, 0.1]})5152out = pl.concat([c, d], how="vertical_relaxed")53assert out.schema == {"a": pl.Float64, "b": pl.Float64}54assert out.to_dict(as_series=False) == {55"a": [1.0, 2.0, 1.0, 0.2],56"b": [2.0, 1.0, None, 0.1],57}58out = pl.concat([d, c], how="vertical_relaxed")59assert out.schema == {"a": pl.Float64, "b": pl.Float64}60assert out.to_dict(as_series=False) == {61"a": [1.0, 0.2, 1.0, 2.0],62"b": [None, 0.1, 2.0, 1.0],63}646566def test_concat_group_by() -> None:67df = pl.DataFrame(68{69"g": [0, 0, 0, 0, 1, 1, 1, 1],70"a": [0, 1, 2, 3, 4, 5, 6, 7],71"b": [8, 9, 10, 11, 12, 13, 14, 15],72}73)74out = df.group_by("g").agg(pl.concat([pl.col.a, pl.col.b]))7576assert_frame_equal(77out,78pl.DataFrame(79{80"g": [0, 1],81"a": [[0, 1, 2, 3, 8, 9, 10, 11], [4, 5, 6, 7, 12, 13, 14, 15]],82}83),84check_row_order=False,85)868788def test_concat_19877() -> None:89df = pl.DataFrame({"a": [1, 2], "b": [3, 4]})90out = df.select(pl.concat([pl.col("a"), pl.col("b")]))91assert_frame_equal(out, pl.DataFrame({"a": [1, 2, 3, 4]}))929394def test_concat_zip_series_21980() -> None:95df = pl.DataFrame({"x": 1, "y": 2})96out = df.select(pl.concat([pl.col.x, pl.col.y]), pl.Series([3, 4]))97assert_frame_equal(out, pl.DataFrame({"x": [1, 2], "": [3, 4]}))9899100