mirror of
https://github.com/nushell/nushell.git
synced 2025-04-14 08:18:17 +02:00
polars
: add new command polars dt replace-time-zone
This commit is contained in:
parent
e4cef8a154
commit
d5f79ba51a
@ -11,6 +11,8 @@ mod get_second;
|
||||
mod get_week;
|
||||
mod get_weekday;
|
||||
mod get_year;
|
||||
mod replace_time_zone;
|
||||
mod strftime;
|
||||
|
||||
use crate::PolarsPlugin;
|
||||
use nu_plugin::PluginCommand;
|
||||
@ -28,8 +30,7 @@ pub use get_second::GetSecond;
|
||||
pub use get_week::GetWeek;
|
||||
pub use get_weekday::GetWeekDay;
|
||||
pub use get_year::GetYear;
|
||||
mod strftime;
|
||||
|
||||
pub use replace_time_zone::ReplaceTimeZone;
|
||||
pub use strftime::StrFTime;
|
||||
|
||||
pub(crate) fn datetime_commands() -> Vec<Box<dyn PluginCommand<Plugin = PolarsPlugin>>> {
|
||||
@ -48,5 +49,6 @@ pub(crate) fn datetime_commands() -> Vec<Box<dyn PluginCommand<Plugin = PolarsPl
|
||||
Box::new(GetWeekDay),
|
||||
Box::new(GetYear),
|
||||
Box::new(StrFTime),
|
||||
Box::new(ReplaceTimeZone),
|
||||
]
|
||||
}
|
||||
|
@ -0,0 +1,286 @@
|
||||
use crate::values::{Column, NuDataFrame, NuSchema};
|
||||
use crate::{
|
||||
dataframe::values::NuExpression,
|
||||
values::{cant_convert_err, CustomValueSupport, PolarsPluginObject, PolarsPluginType},
|
||||
PolarsPlugin,
|
||||
};
|
||||
|
||||
use nu_plugin::{EngineInterface, EvaluatedCall, PluginCommand};
|
||||
use nu_protocol::{
|
||||
Category, Example, LabeledError, PipelineData, ShellError, Signature, Span, SyntaxShape, Type,
|
||||
Value,
|
||||
};
|
||||
|
||||
use chrono::DateTime;
|
||||
use polars::prelude::*;
|
||||
|
||||
#[derive(Clone)]
|
||||
pub struct ReplaceTimeZone;
|
||||
|
||||
impl PluginCommand for ReplaceTimeZone {
|
||||
type Plugin = PolarsPlugin;
|
||||
|
||||
fn name(&self) -> &str {
|
||||
"polars replace-time-zone"
|
||||
}
|
||||
|
||||
fn description(&self) -> &str {
|
||||
"Replace the timezone information in a datetime column."
|
||||
}
|
||||
|
||||
fn signature(&self) -> Signature {
|
||||
Signature::build(self.name())
|
||||
.input_output_types(vec![(
|
||||
Type::Custom("expression".into()),
|
||||
Type::Custom("expression".into()),
|
||||
)])
|
||||
.required(
|
||||
"time_zone",
|
||||
SyntaxShape::String,
|
||||
"Timezone for the Datetime Series. Pass `null` to unset time zone.",
|
||||
)
|
||||
.named(
|
||||
"ambiguous",
|
||||
SyntaxShape::OneOf(vec![SyntaxShape::String, SyntaxShape::Nothing]),
|
||||
r#"Determine how to deal with ambiguous datetimes:
|
||||
`raise` (default): raise error
|
||||
`earliest`: use the earliest datetime
|
||||
`latest`: use the latest datetime
|
||||
`null`: set to null"#,
|
||||
Some('a'),
|
||||
)
|
||||
.named(
|
||||
"nonexistent",
|
||||
SyntaxShape::OneOf(vec![SyntaxShape::String, SyntaxShape::Nothing]),
|
||||
r#"Determine how to deal with non-existent datetimes: raise (default) or null."#,
|
||||
Some('n'),
|
||||
)
|
||||
.category(Category::Custom("dataframe".into()))
|
||||
}
|
||||
|
||||
fn examples(&self) -> Vec<Example> {
|
||||
vec![
|
||||
Example {
|
||||
description: "Apply timezone to a naive datetime",
|
||||
example: r#"["2021-12-30 00:00:00" "2021-12-31 00:00:00"] | polars into-df
|
||||
| polars as-datetime "%Y-%m-%d %H:%M:%S" --naive
|
||||
| polars select (polars col datetime | polars replace-time-zone "America/New_York")"#,
|
||||
result: Some(
|
||||
NuDataFrame::try_from_columns(
|
||||
vec![Column::new(
|
||||
"datetime".to_string(),
|
||||
vec![
|
||||
Value::date(
|
||||
DateTime::parse_from_str(
|
||||
"2021-12-30 00:00:00 -0500",
|
||||
"%Y-%m-%d %H:%M:%S %z",
|
||||
)
|
||||
.expect("date calculation should not fail in test"),
|
||||
Span::test_data(),
|
||||
),
|
||||
Value::date(
|
||||
DateTime::parse_from_str(
|
||||
"2021-12-31 00:00:00 -0500",
|
||||
"%Y-%m-%d %H:%M:%S %z",
|
||||
)
|
||||
.expect("date calculation should not fail in test"),
|
||||
Span::test_data(),
|
||||
),
|
||||
],
|
||||
)],
|
||||
Some(NuSchema::new(Arc::new(Schema::from_iter(vec![
|
||||
Field::new(
|
||||
"datetime".into(),
|
||||
DataType::Datetime(
|
||||
TimeUnit::Nanoseconds,
|
||||
Some(PlSmallStr::from_static("America/New_York")),
|
||||
),
|
||||
),
|
||||
])))),
|
||||
)
|
||||
.expect("simple df for test should not fail")
|
||||
.into_value(Span::test_data()),
|
||||
),
|
||||
},
|
||||
Example {
|
||||
description: "Apply timezone with ambiguous datetime",
|
||||
example: r#"["2025-11-02 00:00:00", "2025-11-02 01:00:00", "2025-11-02 02:00:00", "2025-11-02 03:00:00"]
|
||||
| polars into-df
|
||||
| polars as-datetime "%Y-%m-%d %H:%M:%S" --naive
|
||||
| polars select (polars col datetime | polars replace-time-zone "America/New_York" --ambiguous null)"#,
|
||||
result: Some(
|
||||
NuDataFrame::try_from_columns(
|
||||
vec![Column::new(
|
||||
"datetime".to_string(),
|
||||
vec![
|
||||
Value::date(
|
||||
DateTime::parse_from_str(
|
||||
"2025-11-02 00:00:00 -0400",
|
||||
"%Y-%m-%d %H:%M:%S %z",
|
||||
)
|
||||
.expect("date calculation should not fail in test"),
|
||||
Span::test_data(),
|
||||
),
|
||||
Value::nothing(Span::test_data()),
|
||||
Value::date(
|
||||
DateTime::parse_from_str(
|
||||
"2025-11-02 02:00:00 -0500",
|
||||
"%Y-%m-%d %H:%M:%S %z",
|
||||
)
|
||||
.expect("date calculation should not fail in test"),
|
||||
Span::test_data(),
|
||||
),
|
||||
Value::date(
|
||||
DateTime::parse_from_str(
|
||||
"2025-11-02 03:00:00 -0500",
|
||||
"%Y-%m-%d %H:%M:%S %z",
|
||||
)
|
||||
.expect("date calculation should not fail in test"),
|
||||
Span::test_data(),
|
||||
),
|
||||
],
|
||||
)],
|
||||
Some(NuSchema::new(Arc::new(Schema::from_iter(vec![
|
||||
Field::new(
|
||||
"datetime".into(),
|
||||
DataType::Datetime(
|
||||
TimeUnit::Nanoseconds,
|
||||
Some(PlSmallStr::from_static("America/New_York")),
|
||||
),
|
||||
),
|
||||
])))),
|
||||
)
|
||||
.expect("simple df for test should not fail")
|
||||
.into_value(Span::test_data()),
|
||||
),
|
||||
},
|
||||
Example {
|
||||
description: "Apply timezone with nonexistent datetime",
|
||||
example: r#"["2025-03-09 01:00:00", "2025-03-09 02:00:00", "2025-03-09 03:00:00", "2025-03-09 04:00:00"]
|
||||
| polars into-df
|
||||
| polars as-datetime "%Y-%m-%d %H:%M:%S" --naive
|
||||
| polars select (polars col datetime | polars replace-time-zone "America/New_York" --nonexistent null)"#,
|
||||
result: Some(
|
||||
NuDataFrame::try_from_columns(
|
||||
vec![Column::new(
|
||||
"datetime".to_string(),
|
||||
vec![
|
||||
Value::date(
|
||||
DateTime::parse_from_str(
|
||||
"2025-03-09 01:00:00 -0500",
|
||||
"%Y-%m-%d %H:%M:%S %z",
|
||||
)
|
||||
.expect("date calculation should not fail in test"),
|
||||
Span::test_data(),
|
||||
),
|
||||
Value::nothing(Span::test_data()),
|
||||
Value::date(
|
||||
DateTime::parse_from_str(
|
||||
"2025-03-09 03:00:00 -0400",
|
||||
"%Y-%m-%d %H:%M:%S %z",
|
||||
)
|
||||
.expect("date calculation should not fail in test"),
|
||||
Span::test_data(),
|
||||
),
|
||||
Value::date(
|
||||
DateTime::parse_from_str(
|
||||
"2025-03-09 04:00:00 -0400",
|
||||
"%Y-%m-%d %H:%M:%S %z",
|
||||
)
|
||||
.expect("date calculation should not fail in test"),
|
||||
Span::test_data(),
|
||||
),
|
||||
],
|
||||
)],
|
||||
Some(NuSchema::new(Arc::new(Schema::from_iter(vec![
|
||||
Field::new(
|
||||
"datetime".into(),
|
||||
DataType::Datetime(
|
||||
TimeUnit::Nanoseconds,
|
||||
Some(PlSmallStr::from_static("America/New_York")),
|
||||
),
|
||||
),
|
||||
])))),
|
||||
)
|
||||
.expect("simple df for test should not fail")
|
||||
.into_value(Span::test_data()),
|
||||
),
|
||||
},
|
||||
]
|
||||
}
|
||||
|
||||
fn run(
|
||||
&self,
|
||||
plugin: &Self::Plugin,
|
||||
engine: &EngineInterface,
|
||||
call: &EvaluatedCall,
|
||||
input: PipelineData,
|
||||
) -> Result<PipelineData, LabeledError> {
|
||||
let value = input.into_value(call.head)?;
|
||||
|
||||
let ambiguous = match call.get_flag::<Value>("ambiguous")? {
|
||||
Some(Value::String { val, internal_span }) => match val.as_str() {
|
||||
"raise" | "earliest" | "latest" => Ok(val),
|
||||
_ => Err(ShellError::GenericError {
|
||||
error: "Invalid argument value".into(),
|
||||
msg: "`ambiguous` must be one of raise, earliest, latest, or null".into(),
|
||||
span: Some(internal_span),
|
||||
help: None,
|
||||
inner: vec![],
|
||||
}),
|
||||
},
|
||||
Some(Value::Nothing { .. }) => Ok("null".into()),
|
||||
Some(_) => unreachable!("Argument only accepts string or null."),
|
||||
None => Ok("raise".into()),
|
||||
}
|
||||
.map_err(LabeledError::from)?;
|
||||
|
||||
let nonexistent = match call.get_flag::<Value>("nonexistent")? {
|
||||
Some(Value::String { val, internal_span }) => match val.as_str() {
|
||||
"raise" => Ok(NonExistent::Raise),
|
||||
_ => Err(ShellError::GenericError {
|
||||
error: "Invalid argument value".into(),
|
||||
msg: "`nonexistent` must be one of raise or null".into(),
|
||||
span: Some(internal_span),
|
||||
help: None,
|
||||
inner: vec![],
|
||||
}),
|
||||
},
|
||||
Some(Value::Nothing { .. }) => Ok(NonExistent::Null),
|
||||
Some(_) => unreachable!("Argument only accepts string or null."),
|
||||
None => Ok(NonExistent::Raise),
|
||||
}
|
||||
.map_err(LabeledError::from)?;
|
||||
|
||||
match PolarsPluginObject::try_from_value(plugin, &value)? {
|
||||
PolarsPluginObject::NuExpression(expr) => {
|
||||
let time_zone: String = call.req(0)?;
|
||||
let expr: NuExpression = expr
|
||||
.into_polars()
|
||||
.dt()
|
||||
.replace_time_zone(
|
||||
Some(PlSmallStr::from_str(&time_zone)),
|
||||
Expr::Literal(LiteralValue::String(PlSmallStr::from_string(ambiguous))),
|
||||
nonexistent,
|
||||
)
|
||||
.into();
|
||||
expr.to_pipeline_data(plugin, engine, call.head)
|
||||
}
|
||||
_ => Err(cant_convert_err(&value, &[PolarsPluginType::NuExpression])),
|
||||
}
|
||||
.map_err(LabeledError::from)
|
||||
}
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod test {
|
||||
|
||||
use super::*;
|
||||
use crate::test::test_polars_plugin_command;
|
||||
use nu_protocol::ShellError;
|
||||
|
||||
#[test]
|
||||
fn test_examples() -> Result<(), ShellError> {
|
||||
test_polars_plugin_command(&ReplaceTimeZone)
|
||||
}
|
||||
}
|
Loading…
Reference in New Issue
Block a user