use std::fmt::Formatter;
use arrow2::{
array::{get_display, Array},
datatypes::{DataType, IntervalUnit, TimeUnit},
};
use comfy_table::{presets, Cell, Table};
#[repr(transparent)]
pub struct DisplayTimeUnit(TimeUnit);
impl std::fmt::Display for DisplayTimeUnit {
fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
let s = match self.0 {
arrow2::datatypes::TimeUnit::Second => "s",
arrow2::datatypes::TimeUnit::Millisecond => "ms",
arrow2::datatypes::TimeUnit::Microsecond => "us",
arrow2::datatypes::TimeUnit::Nanosecond => "ns",
};
f.write_str(s)
}
}
#[repr(transparent)]
pub struct DisplayIntervalUnit(IntervalUnit);
impl std::fmt::Display for DisplayIntervalUnit {
fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
let s = match self.0 {
IntervalUnit::YearMonth => "year/month",
IntervalUnit::DayTime => "day/time",
IntervalUnit::MonthDayNano => "month/day/nano",
};
f.write_str(s)
}
}
#[repr(transparent)]
pub struct DisplayDataType(DataType);
impl std::fmt::Display for DisplayDataType {
fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
let s = match &self.0 {
DataType::Null => "null",
DataType::Boolean => "bool",
DataType::Int8 => "i8",
DataType::Int16 => "i16",
DataType::Int32 => "i32",
DataType::Int64 => "i64",
DataType::UInt8 => "u8",
DataType::UInt16 => "u16",
DataType::UInt32 => "u32",
DataType::UInt64 => "u64",
DataType::Float16 => "f16",
DataType::Float32 => "f32",
DataType::Float64 => "f64",
DataType::Timestamp(unit, timezone) => {
let s = if let Some(tz) = timezone {
format!("timestamp({}, {tz})", DisplayTimeUnit(*unit))
} else {
format!("timestamp({})", DisplayTimeUnit(*unit))
};
return f.write_str(&s);
}
DataType::Date32 => "date32",
DataType::Date64 => "date64",
DataType::Time32(unit) => {
let s = format!("time32({})", DisplayTimeUnit(*unit));
return f.write_str(&s);
}
DataType::Time64(unit) => {
let s = format!("time64({})", DisplayTimeUnit(*unit));
return f.write_str(&s);
}
DataType::Duration(unit) => {
let s = format!("duration({})", DisplayTimeUnit(*unit));
return f.write_str(&s);
}
DataType::Interval(unit) => {
let s = format!("interval({})", DisplayIntervalUnit(*unit));
return f.write_str(&s);
}
DataType::Binary => "bin",
DataType::FixedSizeBinary(size) => return write!(f, "fixed-bin[{size}]"),
DataType::LargeBinary => "large-bin",
DataType::Utf8 => "str",
DataType::LargeUtf8 => "large-string",
DataType::List(ref field) => {
let s = format!("list[{}]", DisplayDataType(field.data_type().clone()));
return f.write_str(&s);
}
DataType::FixedSizeList(field, len) => {
let s = format!(
"fixed-list[{}; {len}]",
DisplayDataType(field.data_type().clone())
);
return f.write_str(&s);
}
DataType::LargeList(field) => {
let s = format!("large-list[{}]", DisplayDataType(field.data_type().clone()));
return f.write_str(&s);
}
DataType::Struct(fields) => return write!(f, "struct[{}]", fields.len()),
DataType::Union(fields, _, _) => return write!(f, "union[{}]", fields.len()),
DataType::Map(field, _) => {
return write!(f, "map[{}]", DisplayDataType(field.data_type().clone()))
}
DataType::Dictionary(_, _, _) => "dict",
DataType::Decimal(_, _) => "decimal",
DataType::Decimal256(_, _) => "decimal256",
DataType::Extension(name, data_type, _) => {
let s = format!("extension<{name}>[{}]", DisplayDataType(*data_type.clone()));
return f.write_str(&s);
}
};
f.write_str(s)
}
}
pub fn format_table<A, Ia, N, In>(columns: Ia, names: In) -> Table
where
A: AsRef<dyn Array>,
Ia: IntoIterator<Item = A>,
N: AsRef<str>,
In: IntoIterator<Item = N>,
{
let mut table = Table::new();
table.load_preset(presets::UTF8_FULL);
let arrays = columns.into_iter().collect::<Vec<_>>();
let (displayers, lengths): (Vec<_>, Vec<_>) = arrays
.iter()
.map(|array| (get_display(array.as_ref(), "-"), array.as_ref().len()))
.unzip();
if displayers.is_empty() {
return table;
}
let header = names
.into_iter()
.zip(arrays.iter().map(|array| array.as_ref().data_type()))
.map(|(name, data_type)| {
Cell::new(format!(
"{}\n---\n{}",
name.as_ref(),
DisplayDataType(data_type.clone())
))
});
table.set_header(header);
for row in 0..lengths[0] {
let cells: Vec<_> = displayers
.iter()
.map(|disp| {
let mut string = String::new();
(disp)(&mut string, row).unwrap();
Cell::new(string)
})
.collect();
table.add_row(cells);
}
table
}