pub mod constants;
mod warning;
use std::borrow::Cow;
use std::collections::TryReserveError;
use std::convert::Infallible;
use std::error::Error;
use std::fmt::{self, Display, Formatter, Write};
use std::ops::Deref;
use std::sync::{Arc, LazyLock};
use std::{env, io};
pub mod signals;
pub use warning::*;
#[cfg(feature = "python")]
mod python;
enum ErrorStrategy {
Panic,
WithBacktrace,
Normal,
}
static ERROR_STRATEGY: LazyLock<ErrorStrategy> = LazyLock::new(|| {
if env::var("POLARS_PANIC_ON_ERR").as_deref() == Ok("1") {
ErrorStrategy::Panic
} else if env::var("POLARS_BACKTRACE_IN_ERR").as_deref() == Ok("1") {
ErrorStrategy::WithBacktrace
} else {
ErrorStrategy::Normal
}
});
#[derive(Debug, Clone)]
pub struct ErrString(Cow<'static, str>);
impl ErrString {
pub const fn new_static(s: &'static str) -> Self {
Self(Cow::Borrowed(s))
}
}
impl<T> From<T> for ErrString
where
T: Into<Cow<'static, str>>,
{
fn from(msg: T) -> Self {
match &*ERROR_STRATEGY {
ErrorStrategy::Panic => panic!("{}", msg.into()),
ErrorStrategy::WithBacktrace => ErrString(Cow::Owned(format!(
"{}\n\nRust backtrace:\n{}",
msg.into(),
std::backtrace::Backtrace::force_capture()
))),
ErrorStrategy::Normal => ErrString(msg.into()),
}
}
}
impl AsRef<str> for ErrString {
fn as_ref(&self) -> &str {
&self.0
}
}
impl Deref for ErrString {
type Target = str;
fn deref(&self) -> &Self::Target {
&self.0
}
}
impl Display for ErrString {
fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
write!(f, "{}", self.0)
}
}
#[derive(Debug, Clone)]
pub enum PolarsError {
AssertionError(ErrString),
ColumnNotFound(ErrString),
ComputeError(ErrString),
Duplicate(ErrString),
InvalidOperation(ErrString),
IO {
error: Arc<io::Error>,
msg: Option<ErrString>,
},
NoData(ErrString),
OutOfBounds(ErrString),
SchemaFieldNotFound(ErrString),
SchemaMismatch(ErrString),
ShapeMismatch(ErrString),
SQLInterface(ErrString),
SQLSyntax(ErrString),
StringCacheMismatch(ErrString),
StructFieldNotFound(ErrString),
Context {
error: Box<PolarsError>,
msg: ErrString,
},
#[cfg(feature = "python")]
Python {
error: python::PyErrWrap,
},
}
impl Error for PolarsError {}
impl Display for PolarsError {
fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
use PolarsError::*;
match self {
ComputeError(msg)
| InvalidOperation(msg)
| OutOfBounds(msg)
| SchemaMismatch(msg)
| SQLInterface(msg)
| SQLSyntax(msg) => write!(f, "{msg}"),
AssertionError(msg) => write!(f, "assertion failed: {msg}"),
ColumnNotFound(msg) => write!(f, "not found: {msg}"),
Duplicate(msg) => write!(f, "duplicate: {msg}"),
IO { error, msg } => match msg {
Some(m) => write!(f, "{m}"),
None => write!(f, "{error}"),
},
NoData(msg) => write!(f, "no data: {msg}"),
SchemaFieldNotFound(msg) => write!(f, "field not found: {msg}"),
ShapeMismatch(msg) => write!(f, "lengths don't match: {msg}"),
StringCacheMismatch(msg) => write!(f, "string caches don't match: {msg}"),
StructFieldNotFound(msg) => write!(f, "field not found: {msg}"),
Context { error, msg } => write!(f, "{error}: {msg}"),
#[cfg(feature = "python")]
Python { error } => write!(f, "python: {error}"),
}
}
}
impl From<io::Error> for PolarsError {
fn from(value: io::Error) -> Self {
PolarsError::IO {
error: Arc::new(value),
msg: None,
}
}
}
#[cfg(feature = "regex")]
impl From<regex::Error> for PolarsError {
fn from(err: regex::Error) -> Self {
PolarsError::ComputeError(format!("regex error: {err}").into())
}
}
#[cfg(feature = "object_store")]
impl From<object_store::Error> for PolarsError {
fn from(err: object_store::Error) -> Self {
if let object_store::Error::Generic { store, source } = &err {
if let Some(polars_err) = source.as_ref().downcast_ref::<PolarsError>() {
return polars_err.wrap_msg(|s| format!("{s} (store: {store})"));
}
}
std::io::Error::other(format!("object-store error: {err}")).into()
}
}
#[cfg(feature = "avro-schema")]
impl From<avro_schema::error::Error> for PolarsError {
fn from(value: avro_schema::error::Error) -> Self {
polars_err!(ComputeError: "avro-error: {}", value)
}
}
impl From<simdutf8::basic::Utf8Error> for PolarsError {
fn from(value: simdutf8::basic::Utf8Error) -> Self {
polars_err!(ComputeError: "invalid utf8: {}", value)
}
}
#[cfg(feature = "arrow-format")]
impl From<arrow_format::ipc::planus::Error> for PolarsError {
fn from(err: arrow_format::ipc::planus::Error) -> Self {
polars_err!(ComputeError: "parquet error: {err:?}")
}
}
impl From<TryReserveError> for PolarsError {
fn from(value: TryReserveError) -> Self {
polars_err!(ComputeError: "OOM: {}", value)
}
}
impl From<Infallible> for PolarsError {
fn from(_: Infallible) -> Self {
unreachable!()
}
}
pub type PolarsResult<T> = Result<T, PolarsError>;
impl PolarsError {
pub fn context_trace(self) -> Self {
use PolarsError::*;
match self {
Context { error, msg } => {
if !matches!(&*error, PolarsError::Context { .. }) {
return *error;
}
let mut current_error = &*error;
let material_error = error.get_err();
let mut messages = vec![&msg];
while let PolarsError::Context { msg, error } = current_error {
current_error = error;
messages.push(msg)
}
let mut bt = String::new();
let mut count = 0;
while let Some(msg) = messages.pop() {
count += 1;
writeln!(&mut bt, "\t[{count}] {msg}").unwrap();
}
material_error.wrap_msg(move |msg| {
format!("{msg}\n\nThis error occurred with the following context stack:\n{bt}")
})
},
err => err,
}
}
pub fn wrap_msg<F: FnOnce(&str) -> String>(&self, func: F) -> Self {
use PolarsError::*;
match self {
AssertionError(msg) => AssertionError(func(msg).into()),
ColumnNotFound(msg) => ColumnNotFound(func(msg).into()),
ComputeError(msg) => ComputeError(func(msg).into()),
Duplicate(msg) => Duplicate(func(msg).into()),
InvalidOperation(msg) => InvalidOperation(func(msg).into()),
IO { error, msg } => {
let msg = match msg {
Some(msg) => func(msg),
None => func(&format!("{error}")),
};
IO {
error: error.clone(),
msg: Some(msg.into()),
}
},
NoData(msg) => NoData(func(msg).into()),
OutOfBounds(msg) => OutOfBounds(func(msg).into()),
SchemaFieldNotFound(msg) => SchemaFieldNotFound(func(msg).into()),
SchemaMismatch(msg) => SchemaMismatch(func(msg).into()),
ShapeMismatch(msg) => ShapeMismatch(func(msg).into()),
StringCacheMismatch(msg) => StringCacheMismatch(func(msg).into()),
StructFieldNotFound(msg) => StructFieldNotFound(func(msg).into()),
SQLInterface(msg) => SQLInterface(func(msg).into()),
SQLSyntax(msg) => SQLSyntax(func(msg).into()),
Context { error, .. } => error.wrap_msg(func),
#[cfg(feature = "python")]
Python { error } => pyo3::Python::with_gil(|py| {
use pyo3::types::{PyAnyMethods, PyStringMethods};
use pyo3::{IntoPyObject, PyErr};
let value = error.value(py);
let msg = if let Ok(s) = value.str() {
func(&s.to_string_lossy())
} else {
func("<exception str() failed>")
};
let cls = value.get_type();
let out = PyErr::from_type(cls, (msg,));
let out = if let Ok(out_with_traceback) = (|| {
out.clone_ref(py)
.into_pyobject(py)?
.getattr("with_traceback")
.unwrap()
.call1((value.getattr("__traceback__").unwrap(),))
})() {
PyErr::from_value(out_with_traceback)
} else {
out
};
Python {
error: python::PyErrWrap(out),
}
}),
}
}
fn get_err(&self) -> &Self {
use PolarsError::*;
match self {
Context { error, .. } => error.get_err(),
err => err,
}
}
pub fn context(self, msg: ErrString) -> Self {
PolarsError::Context {
msg,
error: Box::new(self),
}
}
pub fn remove_context(mut self) -> Self {
while let Self::Context { error, .. } = self {
self = *error;
}
self
}
}
pub fn map_err<E: Error>(error: E) -> PolarsError {
PolarsError::ComputeError(format!("{error}").into())
}
#[macro_export]
macro_rules! polars_err {
($variant:ident: $fmt:literal $(, $arg:expr)* $(,)?) => {
$crate::__private::must_use(
$crate::PolarsError::$variant(format!($fmt, $($arg),*).into())
)
};
($variant:ident: $fmt:literal $(, $arg:expr)*, hint = $hint:literal) => {
$crate::__private::must_use(
$crate::PolarsError::$variant(format!(concat_str!($fmt, "\n\nHint: ", $hint), $($arg),*).into())
)
};
($variant:ident: $err:expr $(,)?) => {
$crate::__private::must_use(
$crate::PolarsError::$variant($err.into())
)
};
(expr = $expr:expr, $variant:ident: $err:expr $(,)?) => {
$crate::__private::must_use(
$crate::PolarsError::$variant(
format!("{}\n\nError originated in expression: '{:?}'", $err, $expr).into()
)
)
};
(expr = $expr:expr, $variant:ident: $fmt:literal, $($arg:tt)+) => {
polars_err!(expr = $expr, $variant: format!($fmt, $($arg)+))
};
(op = $op:expr, got = $arg:expr, expected = $expected:expr) => {
$crate::polars_err!(
InvalidOperation: "{} operation not supported for dtype `{}` (expected: {})",
$op, $arg, $expected
)
};
(opq = $op:ident, got = $arg:expr, expected = $expected:expr) => {
$crate::polars_err!(
op = concat!("`", stringify!($op), "`"), got = $arg, expected = $expected
)
};
(un_impl = $op:ident) => {
$crate::polars_err!(
InvalidOperation: "{} operation is not implemented.", concat!("`", stringify!($op), "`")
)
};
(op = $op:expr, $arg:expr) => {
$crate::polars_err!(
InvalidOperation: "{} operation not supported for dtype `{}`", $op, $arg
)
};
(op = $op:expr, $arg:expr, hint = $hint:literal) => {
$crate::polars_err!(
InvalidOperation: "{} operation not supported for dtype `{}`\n\nHint: {}", $op, $arg, $hint
)
};
(op = $op:expr, $lhs:expr, $rhs:expr) => {
$crate::polars_err!(
InvalidOperation: "{} operation not supported for dtypes `{}` and `{}`", $op, $lhs, $rhs
)
};
(op = $op:expr, $arg1:expr, $arg2:expr, $arg3:expr) => {
$crate::polars_err!(
InvalidOperation: "{} operation not supported for dtypes `{}`, `{}` and `{}`", $op, $arg1, $arg2, $arg3
)
};
(opidx = $op:expr, idx = $idx:expr, $arg:expr) => {
$crate::polars_err!(
InvalidOperation: "`{}` operation not supported for dtype `{}` as argument {}", $op, $arg, $idx
)
};
(oos = $($tt:tt)+) => {
$crate::polars_err!(ComputeError: "out-of-spec: {}", $($tt)+)
};
(nyi = $($tt:tt)+) => {
$crate::polars_err!(ComputeError: "not yet implemented: {}", format!($($tt)+) )
};
(opq = $op:ident, $arg:expr) => {
$crate::polars_err!(op = concat!("`", stringify!($op), "`"), $arg)
};
(opq = $op:ident, $lhs:expr, $rhs:expr) => {
$crate::polars_err!(op = stringify!($op), $lhs, $rhs)
};
(bigidx, ctx = $ctx:expr, size = $size:expr) => {
$crate::polars_err!(ComputeError: "\
{} produces {} rows which is more than maximum allowed pow(2, 32) rows; \
consider compiling with bigidx feature (polars-u64-idx package on python)",
$ctx,
$size,
)
};
(append) => {
polars_err!(SchemaMismatch: "cannot append series, data types don't match")
};
(extend) => {
polars_err!(SchemaMismatch: "cannot extend series, data types don't match")
};
(unpack) => {
polars_err!(SchemaMismatch: "cannot unpack series, data types don't match")
};
(not_in_enum,value=$value:expr,categories=$categories:expr) =>{
polars_err!(ComputeError: "value '{}' is not present in Enum: {:?}",$value,$categories)
};
(string_cache_mismatch) => {
polars_err!(StringCacheMismatch: r#"
cannot compare categoricals coming from different sources, consider setting a global StringCache.
Help: if you're using Python, this may look something like:
with pl.StringCache():
df1 = pl.DataFrame({'a': ['1', '2']}, schema={'a': pl.Categorical})
df2 = pl.DataFrame({'a': ['1', '3']}, schema={'a': pl.Categorical})
pl.concat([df1, df2])
Alternatively, if the performance cost is acceptable, you could just set:
import polars as pl
pl.enable_string_cache()
on startup."#.trim_start())
};
(duplicate = $name:expr) => {
$crate::polars_err!(Duplicate: "column with name '{}' has more than one occurrence", $name)
};
(duplicate_field = $name:expr) => {
$crate::polars_err!(Duplicate: "multiple fields with name '{}' found", $name)
};
(col_not_found = $name:expr) => {
$crate::polars_err!(ColumnNotFound: "{:?} not found", $name)
};
(mismatch, col=$name:expr, expected=$expected:expr, found=$found:expr) => {
$crate::polars_err!(
SchemaMismatch: "data type mismatch for column {}: expected: {}, found: {}",
$name,
$expected,
$found,
)
};
(oob = $idx:expr, $len:expr) => {
polars_err!(OutOfBounds: "index {} is out of bounds for sequence of length {}", $idx, $len)
};
(agg_len = $agg_len:expr, $groups_len:expr) => {
polars_err!(
ComputeError:
"returned aggregation is of different length: {} than the groups length: {}",
$agg_len, $groups_len
)
};
(parse_fmt_idk = $dtype:expr) => {
polars_err!(
ComputeError: "could not find an appropriate format to parse {}s, please define a format",
$dtype,
)
};
(length_mismatch = $operation:expr, $lhs:expr, $rhs:expr) => {
$crate::polars_err!(
ShapeMismatch: "arguments for `{}` have different lengths ({} != {})",
$operation, $lhs, $rhs
)
};
(length_mismatch = $operation:expr, $lhs:expr, $rhs:expr, argument = $argument:expr, argument_idx = $argument_idx:expr) => {
$crate::polars_err!(
ShapeMismatch: "argument {} called '{}' for `{}` have different lengths ({} != {})",
$argument_idx, $argument, $operation, $lhs, $rhs
)
};
(assertion_error = $objects:expr, $detail:expr, $lhs:expr, $rhs:expr) => {
$crate::polars_err!(
AssertionError: "{} are different ({})\n[left]: {}\n[right]: {}",
$objects, $detail, $lhs, $rhs
)
};
(to_datetime_tz_mismatch) => {
$crate::polars_err!(
ComputeError: "`strptime` / `to_datetime` was called with no format and no time zone, but a time zone is part of the data.\n\nThis was previously allowed but led to unpredictable and erroneous results. Give a format string, set a time zone or perform the operation eagerly on a Series instead of on an Expr."
)
};
}
#[macro_export]
macro_rules! polars_bail {
($($tt:tt)+) => {
return Err($crate::polars_err!($($tt)+))
};
}
#[macro_export]
macro_rules! polars_ensure {
($cond:expr, $($tt:tt)+) => {
if !$cond {
$crate::polars_bail!($($tt)+);
}
};
}
#[inline]
#[cold]
#[must_use]
pub fn to_compute_err(err: impl Display) -> PolarsError {
PolarsError::ComputeError(err.to_string().into())
}
#[macro_export]
macro_rules! feature_gated {
($($feature:literal);*, $content:expr) => {{
#[cfg(all($(feature = $feature),*))]
{
$content
}
#[cfg(not(all($(feature = $feature),*)))]
{
panic!("activate '{}' feature", concat!($($feature, ", "),*))
}
}};
}
#[doc(hidden)]
pub mod __private {
#[doc(hidden)]
#[inline]
#[cold]
#[must_use]
pub fn must_use(error: crate::PolarsError) -> crate::PolarsError {
error
}
}