mirror of
https://github.com/nushell/nushell.git
synced 2025-04-20 11:18:20 +02:00
polars
: add new command polars dt replace-time-zone
This commit is contained in:
parent
e4cef8a154
commit
d5f79ba51a
@ -11,6 +11,8 @@ mod get_second;
|
|||||||
mod get_week;
|
mod get_week;
|
||||||
mod get_weekday;
|
mod get_weekday;
|
||||||
mod get_year;
|
mod get_year;
|
||||||
|
mod replace_time_zone;
|
||||||
|
mod strftime;
|
||||||
|
|
||||||
use crate::PolarsPlugin;
|
use crate::PolarsPlugin;
|
||||||
use nu_plugin::PluginCommand;
|
use nu_plugin::PluginCommand;
|
||||||
@ -28,8 +30,7 @@ pub use get_second::GetSecond;
|
|||||||
pub use get_week::GetWeek;
|
pub use get_week::GetWeek;
|
||||||
pub use get_weekday::GetWeekDay;
|
pub use get_weekday::GetWeekDay;
|
||||||
pub use get_year::GetYear;
|
pub use get_year::GetYear;
|
||||||
mod strftime;
|
pub use replace_time_zone::ReplaceTimeZone;
|
||||||
|
|
||||||
pub use strftime::StrFTime;
|
pub use strftime::StrFTime;
|
||||||
|
|
||||||
pub(crate) fn datetime_commands() -> Vec<Box<dyn PluginCommand<Plugin = PolarsPlugin>>> {
|
pub(crate) fn datetime_commands() -> Vec<Box<dyn PluginCommand<Plugin = PolarsPlugin>>> {
|
||||||
@ -48,5 +49,6 @@ pub(crate) fn datetime_commands() -> Vec<Box<dyn PluginCommand<Plugin = PolarsPl
|
|||||||
Box::new(GetWeekDay),
|
Box::new(GetWeekDay),
|
||||||
Box::new(GetYear),
|
Box::new(GetYear),
|
||||||
Box::new(StrFTime),
|
Box::new(StrFTime),
|
||||||
|
Box::new(ReplaceTimeZone),
|
||||||
]
|
]
|
||||||
}
|
}
|
||||||
|
@ -0,0 +1,286 @@
|
|||||||
|
use crate::values::{Column, NuDataFrame, NuSchema};
|
||||||
|
use crate::{
|
||||||
|
dataframe::values::NuExpression,
|
||||||
|
values::{cant_convert_err, CustomValueSupport, PolarsPluginObject, PolarsPluginType},
|
||||||
|
PolarsPlugin,
|
||||||
|
};
|
||||||
|
|
||||||
|
use nu_plugin::{EngineInterface, EvaluatedCall, PluginCommand};
|
||||||
|
use nu_protocol::{
|
||||||
|
Category, Example, LabeledError, PipelineData, ShellError, Signature, Span, SyntaxShape, Type,
|
||||||
|
Value,
|
||||||
|
};
|
||||||
|
|
||||||
|
use chrono::DateTime;
|
||||||
|
use polars::prelude::*;
|
||||||
|
|
||||||
|
#[derive(Clone)]
|
||||||
|
pub struct ReplaceTimeZone;
|
||||||
|
|
||||||
|
impl PluginCommand for ReplaceTimeZone {
|
||||||
|
type Plugin = PolarsPlugin;
|
||||||
|
|
||||||
|
fn name(&self) -> &str {
|
||||||
|
"polars replace-time-zone"
|
||||||
|
}
|
||||||
|
|
||||||
|
fn description(&self) -> &str {
|
||||||
|
"Replace the timezone information in a datetime column."
|
||||||
|
}
|
||||||
|
|
||||||
|
fn signature(&self) -> Signature {
|
||||||
|
Signature::build(self.name())
|
||||||
|
.input_output_types(vec![(
|
||||||
|
Type::Custom("expression".into()),
|
||||||
|
Type::Custom("expression".into()),
|
||||||
|
)])
|
||||||
|
.required(
|
||||||
|
"time_zone",
|
||||||
|
SyntaxShape::String,
|
||||||
|
"Timezone for the Datetime Series. Pass `null` to unset time zone.",
|
||||||
|
)
|
||||||
|
.named(
|
||||||
|
"ambiguous",
|
||||||
|
SyntaxShape::OneOf(vec![SyntaxShape::String, SyntaxShape::Nothing]),
|
||||||
|
r#"Determine how to deal with ambiguous datetimes:
|
||||||
|
`raise` (default): raise error
|
||||||
|
`earliest`: use the earliest datetime
|
||||||
|
`latest`: use the latest datetime
|
||||||
|
`null`: set to null"#,
|
||||||
|
Some('a'),
|
||||||
|
)
|
||||||
|
.named(
|
||||||
|
"nonexistent",
|
||||||
|
SyntaxShape::OneOf(vec![SyntaxShape::String, SyntaxShape::Nothing]),
|
||||||
|
r#"Determine how to deal with non-existent datetimes: raise (default) or null."#,
|
||||||
|
Some('n'),
|
||||||
|
)
|
||||||
|
.category(Category::Custom("dataframe".into()))
|
||||||
|
}
|
||||||
|
|
||||||
|
fn examples(&self) -> Vec<Example> {
|
||||||
|
vec![
|
||||||
|
Example {
|
||||||
|
description: "Apply timezone to a naive datetime",
|
||||||
|
example: r#"["2021-12-30 00:00:00" "2021-12-31 00:00:00"] | polars into-df
|
||||||
|
| polars as-datetime "%Y-%m-%d %H:%M:%S" --naive
|
||||||
|
| polars select (polars col datetime | polars replace-time-zone "America/New_York")"#,
|
||||||
|
result: Some(
|
||||||
|
NuDataFrame::try_from_columns(
|
||||||
|
vec![Column::new(
|
||||||
|
"datetime".to_string(),
|
||||||
|
vec![
|
||||||
|
Value::date(
|
||||||
|
DateTime::parse_from_str(
|
||||||
|
"2021-12-30 00:00:00 -0500",
|
||||||
|
"%Y-%m-%d %H:%M:%S %z",
|
||||||
|
)
|
||||||
|
.expect("date calculation should not fail in test"),
|
||||||
|
Span::test_data(),
|
||||||
|
),
|
||||||
|
Value::date(
|
||||||
|
DateTime::parse_from_str(
|
||||||
|
"2021-12-31 00:00:00 -0500",
|
||||||
|
"%Y-%m-%d %H:%M:%S %z",
|
||||||
|
)
|
||||||
|
.expect("date calculation should not fail in test"),
|
||||||
|
Span::test_data(),
|
||||||
|
),
|
||||||
|
],
|
||||||
|
)],
|
||||||
|
Some(NuSchema::new(Arc::new(Schema::from_iter(vec![
|
||||||
|
Field::new(
|
||||||
|
"datetime".into(),
|
||||||
|
DataType::Datetime(
|
||||||
|
TimeUnit::Nanoseconds,
|
||||||
|
Some(PlSmallStr::from_static("America/New_York")),
|
||||||
|
),
|
||||||
|
),
|
||||||
|
])))),
|
||||||
|
)
|
||||||
|
.expect("simple df for test should not fail")
|
||||||
|
.into_value(Span::test_data()),
|
||||||
|
),
|
||||||
|
},
|
||||||
|
Example {
|
||||||
|
description: "Apply timezone with ambiguous datetime",
|
||||||
|
example: r#"["2025-11-02 00:00:00", "2025-11-02 01:00:00", "2025-11-02 02:00:00", "2025-11-02 03:00:00"]
|
||||||
|
| polars into-df
|
||||||
|
| polars as-datetime "%Y-%m-%d %H:%M:%S" --naive
|
||||||
|
| polars select (polars col datetime | polars replace-time-zone "America/New_York" --ambiguous null)"#,
|
||||||
|
result: Some(
|
||||||
|
NuDataFrame::try_from_columns(
|
||||||
|
vec![Column::new(
|
||||||
|
"datetime".to_string(),
|
||||||
|
vec![
|
||||||
|
Value::date(
|
||||||
|
DateTime::parse_from_str(
|
||||||
|
"2025-11-02 00:00:00 -0400",
|
||||||
|
"%Y-%m-%d %H:%M:%S %z",
|
||||||
|
)
|
||||||
|
.expect("date calculation should not fail in test"),
|
||||||
|
Span::test_data(),
|
||||||
|
),
|
||||||
|
Value::nothing(Span::test_data()),
|
||||||
|
Value::date(
|
||||||
|
DateTime::parse_from_str(
|
||||||
|
"2025-11-02 02:00:00 -0500",
|
||||||
|
"%Y-%m-%d %H:%M:%S %z",
|
||||||
|
)
|
||||||
|
.expect("date calculation should not fail in test"),
|
||||||
|
Span::test_data(),
|
||||||
|
),
|
||||||
|
Value::date(
|
||||||
|
DateTime::parse_from_str(
|
||||||
|
"2025-11-02 03:00:00 -0500",
|
||||||
|
"%Y-%m-%d %H:%M:%S %z",
|
||||||
|
)
|
||||||
|
.expect("date calculation should not fail in test"),
|
||||||
|
Span::test_data(),
|
||||||
|
),
|
||||||
|
],
|
||||||
|
)],
|
||||||
|
Some(NuSchema::new(Arc::new(Schema::from_iter(vec![
|
||||||
|
Field::new(
|
||||||
|
"datetime".into(),
|
||||||
|
DataType::Datetime(
|
||||||
|
TimeUnit::Nanoseconds,
|
||||||
|
Some(PlSmallStr::from_static("America/New_York")),
|
||||||
|
),
|
||||||
|
),
|
||||||
|
])))),
|
||||||
|
)
|
||||||
|
.expect("simple df for test should not fail")
|
||||||
|
.into_value(Span::test_data()),
|
||||||
|
),
|
||||||
|
},
|
||||||
|
Example {
|
||||||
|
description: "Apply timezone with nonexistent datetime",
|
||||||
|
example: r#"["2025-03-09 01:00:00", "2025-03-09 02:00:00", "2025-03-09 03:00:00", "2025-03-09 04:00:00"]
|
||||||
|
| polars into-df
|
||||||
|
| polars as-datetime "%Y-%m-%d %H:%M:%S" --naive
|
||||||
|
| polars select (polars col datetime | polars replace-time-zone "America/New_York" --nonexistent null)"#,
|
||||||
|
result: Some(
|
||||||
|
NuDataFrame::try_from_columns(
|
||||||
|
vec![Column::new(
|
||||||
|
"datetime".to_string(),
|
||||||
|
vec![
|
||||||
|
Value::date(
|
||||||
|
DateTime::parse_from_str(
|
||||||
|
"2025-03-09 01:00:00 -0500",
|
||||||
|
"%Y-%m-%d %H:%M:%S %z",
|
||||||
|
)
|
||||||
|
.expect("date calculation should not fail in test"),
|
||||||
|
Span::test_data(),
|
||||||
|
),
|
||||||
|
Value::nothing(Span::test_data()),
|
||||||
|
Value::date(
|
||||||
|
DateTime::parse_from_str(
|
||||||
|
"2025-03-09 03:00:00 -0400",
|
||||||
|
"%Y-%m-%d %H:%M:%S %z",
|
||||||
|
)
|
||||||
|
.expect("date calculation should not fail in test"),
|
||||||
|
Span::test_data(),
|
||||||
|
),
|
||||||
|
Value::date(
|
||||||
|
DateTime::parse_from_str(
|
||||||
|
"2025-03-09 04:00:00 -0400",
|
||||||
|
"%Y-%m-%d %H:%M:%S %z",
|
||||||
|
)
|
||||||
|
.expect("date calculation should not fail in test"),
|
||||||
|
Span::test_data(),
|
||||||
|
),
|
||||||
|
],
|
||||||
|
)],
|
||||||
|
Some(NuSchema::new(Arc::new(Schema::from_iter(vec![
|
||||||
|
Field::new(
|
||||||
|
"datetime".into(),
|
||||||
|
DataType::Datetime(
|
||||||
|
TimeUnit::Nanoseconds,
|
||||||
|
Some(PlSmallStr::from_static("America/New_York")),
|
||||||
|
),
|
||||||
|
),
|
||||||
|
])))),
|
||||||
|
)
|
||||||
|
.expect("simple df for test should not fail")
|
||||||
|
.into_value(Span::test_data()),
|
||||||
|
),
|
||||||
|
},
|
||||||
|
]
|
||||||
|
}
|
||||||
|
|
||||||
|
fn run(
|
||||||
|
&self,
|
||||||
|
plugin: &Self::Plugin,
|
||||||
|
engine: &EngineInterface,
|
||||||
|
call: &EvaluatedCall,
|
||||||
|
input: PipelineData,
|
||||||
|
) -> Result<PipelineData, LabeledError> {
|
||||||
|
let value = input.into_value(call.head)?;
|
||||||
|
|
||||||
|
let ambiguous = match call.get_flag::<Value>("ambiguous")? {
|
||||||
|
Some(Value::String { val, internal_span }) => match val.as_str() {
|
||||||
|
"raise" | "earliest" | "latest" => Ok(val),
|
||||||
|
_ => Err(ShellError::GenericError {
|
||||||
|
error: "Invalid argument value".into(),
|
||||||
|
msg: "`ambiguous` must be one of raise, earliest, latest, or null".into(),
|
||||||
|
span: Some(internal_span),
|
||||||
|
help: None,
|
||||||
|
inner: vec![],
|
||||||
|
}),
|
||||||
|
},
|
||||||
|
Some(Value::Nothing { .. }) => Ok("null".into()),
|
||||||
|
Some(_) => unreachable!("Argument only accepts string or null."),
|
||||||
|
None => Ok("raise".into()),
|
||||||
|
}
|
||||||
|
.map_err(LabeledError::from)?;
|
||||||
|
|
||||||
|
let nonexistent = match call.get_flag::<Value>("nonexistent")? {
|
||||||
|
Some(Value::String { val, internal_span }) => match val.as_str() {
|
||||||
|
"raise" => Ok(NonExistent::Raise),
|
||||||
|
_ => Err(ShellError::GenericError {
|
||||||
|
error: "Invalid argument value".into(),
|
||||||
|
msg: "`nonexistent` must be one of raise or null".into(),
|
||||||
|
span: Some(internal_span),
|
||||||
|
help: None,
|
||||||
|
inner: vec![],
|
||||||
|
}),
|
||||||
|
},
|
||||||
|
Some(Value::Nothing { .. }) => Ok(NonExistent::Null),
|
||||||
|
Some(_) => unreachable!("Argument only accepts string or null."),
|
||||||
|
None => Ok(NonExistent::Raise),
|
||||||
|
}
|
||||||
|
.map_err(LabeledError::from)?;
|
||||||
|
|
||||||
|
match PolarsPluginObject::try_from_value(plugin, &value)? {
|
||||||
|
PolarsPluginObject::NuExpression(expr) => {
|
||||||
|
let time_zone: String = call.req(0)?;
|
||||||
|
let expr: NuExpression = expr
|
||||||
|
.into_polars()
|
||||||
|
.dt()
|
||||||
|
.replace_time_zone(
|
||||||
|
Some(PlSmallStr::from_str(&time_zone)),
|
||||||
|
Expr::Literal(LiteralValue::String(PlSmallStr::from_string(ambiguous))),
|
||||||
|
nonexistent,
|
||||||
|
)
|
||||||
|
.into();
|
||||||
|
expr.to_pipeline_data(plugin, engine, call.head)
|
||||||
|
}
|
||||||
|
_ => Err(cant_convert_err(&value, &[PolarsPluginType::NuExpression])),
|
||||||
|
}
|
||||||
|
.map_err(LabeledError::from)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[cfg(test)]
|
||||||
|
mod test {
|
||||||
|
|
||||||
|
use super::*;
|
||||||
|
use crate::test::test_polars_plugin_command;
|
||||||
|
use nu_protocol::ShellError;
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn test_examples() -> Result<(), ShellError> {
|
||||||
|
test_polars_plugin_command(&ReplaceTimeZone)
|
||||||
|
}
|
||||||
|
}
|
Loading…
Reference in New Issue
Block a user