Path: blob/main/docs/source/src/python/user-guide/io/multiple.py
7890 views
# Example script whose sections are delimited by paired
# `# --8<-- [start:NAME]` / `# --8<-- [end:NAME]` marker comments.
# Each marker must stay on its own line, and the sections run top to bottom:
# later sections read the CSV files written by the `create` section.

# --8<-- [start:create]
import polars as pl

df = pl.DataFrame({"foo": [1, 2, 3], "bar": [None, "ham", "spam"]})

# Write the same frame to five numbered files so the glob patterns used
# further down match more than one file.
for i in range(5):
    df.write_csv(f"docs/assets/data/my_many_files_{i}.csv")
# --8<-- [end:create]

# --8<-- [start:read]
df = pl.read_csv("docs/assets/data/my_many_files_*.csv")
print(df)
# --8<-- [end:read]

# --8<-- [start:creategraph]
import base64

# Save the plan graph to a PNG (show=False), then emit the image as an
# inline base64 <img> tag on stdout.
pl.scan_csv("docs/assets/data/my_many_files_*.csv").show_graph(
    output_path="docs/assets/images/multiple.png", show=False
)
with open("docs/assets/images/multiple.png", "rb") as f:
    png = base64.b64encode(f.read()).decode()
print(f'<img src="data:image/png;base64, {png}"/>')
# --8<-- [end:creategraph]

# --8<-- [start:graph]
pl.scan_csv("docs/assets/data/my_many_files_*.csv").show_graph()
# --8<-- [end:graph]

# --8<-- [start:glob]
import glob

import polars as pl

# Build one query per matching file; pl.collect_all then evaluates the
# whole list in a single call.
queries = [
    pl.scan_csv(file).group_by("bar").agg(pl.len(), pl.sum("foo"))
    for file in glob.glob("docs/assets/data/my_many_files_*.csv")
]

dataframes = pl.collect_all(queries)
print(dataframes)
# --8<-- [end:glob]