Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
pola-rs
GitHub Repository: pola-rs/polars
Path: blob/main/pyo3-polars/example/extend_polars_python_dispatch/run.py
6939 views
1
import polars as pl
2
from extend_polars import parallel_jaccard, lazy_parallel_jaccard, debug
3
4
# Sample frame with two list columns, "list_a" and "list_b", two rows each.
df = pl.DataFrame({"list_a": [[1, 2, 3], [5, 5]], "list_b": [[1, 2, 3, 8], [5, 1, 1]]})
5
6
# Show the input frame.
print(df)
7
# Pass the frame and the two column names to the extension's parallel_jaccard
# and print what it returns.
# NOTE(review): presumably a row-wise Jaccard similarity of the two lists -
# confirm against the extend_polars implementation.
print(parallel_jaccard(df, "list_a", "list_b"))
8
9
# warning: this serializes/deserializes the data
10
# it is recommended to only use LazyFrames that don't have any
11
# DataFrame in their logical plan.
12
# Lazy variant: hand the extension a LazyFrame built from df, then collect
# the returned value and print it.
print(lazy_parallel_jaccard(df.lazy(), "list_a", "list_b").collect())
13
14
# Rebind df to a frame with a single "string" column of two values.
df = pl.DataFrame({"string": ["ab", "c"]})
15
# Print whatever the extension's debug() returns for this frame.
print(debug(df))
16
17