use crate::{commands::dataframe::utils::parse_polars_error, prelude::*}; use nu_engine::WholeStreamCommand; use nu_errors::ShellError; use nu_protocol::{ dataframe::{Column, NuDataFrame}, Primitive, Signature, SyntaxShape, UntaggedValue, Value, }; use polars::prelude::{ChunkSet, DataType, IntoSeries}; pub struct DataFrame; impl WholeStreamCommand for DataFrame { fn name(&self) -> &str { "dataframe set-with-idx" } fn usage(&self) -> &str { "[Series] Sets value in the given index" } fn signature(&self) -> Signature { Signature::build("dataframe set-with-idx") .required("value", SyntaxShape::Any, "value to be inserted in series") .required_named( "indices", SyntaxShape::Any, "list of indices indicating where to set the value", Some('i'), ) } fn run(&self, args: CommandArgs) -> Result { command(args) } fn examples(&self) -> Vec { vec![Example { description: "Set value in selected rows from series", example: r#"let series = ([4 1 5 2 4 3] | dataframe to-df); let indices = ([0 2] | dataframe to-df); $series | dataframe set-with-idx 6 -i $indices"#, result: Some(vec![NuDataFrame::try_from_columns( vec![Column::new( "0".to_string(), vec![ UntaggedValue::int(6).into(), UntaggedValue::int(1).into(), UntaggedValue::int(6).into(), UntaggedValue::int(2).into(), UntaggedValue::int(4).into(), UntaggedValue::int(3).into(), ], )], &Span::default(), ) .expect("simple df for test should not fail") .into_value(Tag::default())]), }] } } fn command(mut args: CommandArgs) -> Result { let tag = args.call_info.name_tag.clone(); let value: Value = args.req(0)?; let indices: Value = args.req_named("indices")?; let indices = match &indices.value { UntaggedValue::DataFrame(df) => Ok(df), _ => Err(ShellError::labeled_error( "Incorrect type", "can only use a series for set command", value.tag.span, )), }?; let indices = indices.as_series(&value.tag.span)?; let casted = match indices.dtype() { DataType::UInt32 | DataType::UInt64 | DataType::Int32 | DataType::Int64 => indices .as_ref() .cast(&DataType::UInt32) .map_err(|e| parse_polars_error::<&str>(&e, &value.tag.span, None)), _ => Err(ShellError::labeled_error_with_secondary( "Incorrect type", "Series with incorrect type", &value.tag.span, "Consider using a Series with type int type", &value.tag.span, )), }?; let indices = casted .u32() .map_err(|e| parse_polars_error::<&str>(&e, &value.tag.span, None))? .into_iter() .filter_map(|val| val.map(|v| v as usize)); let (df, df_tag) = NuDataFrame::try_from_stream(&mut args.input, &tag.span)?; let series = df.as_series(&df_tag.span)?; match &value.value { UntaggedValue::Primitive(Primitive::Int(val)) => { let chunked = series.i64().map_err(|e| { parse_polars_error::<&str>( &e, &value.tag.span, Some("The value has to match the set value type"), ) })?; let res = chunked .set_at_idx(indices, Some(*val)) .map_err(|e| parse_polars_error::<&str>(&e, &value.tag.span, None))?; let df = NuDataFrame::try_from_series(vec![res.into_series()], &tag.span)?; Ok(OutputStream::one(df.into_value(df_tag))) } UntaggedValue::Primitive(Primitive::Decimal(val)) => { let chunked = series.as_ref().f64().map_err(|e| { parse_polars_error::<&str>( &e, &value.tag.span, Some("The value has to match the series type"), ) })?; let res = chunked .set_at_idx( indices, Some( val.to_f64() .expect("internal error: expected f64-compatible decimal"), ), ) .map_err(|e| parse_polars_error::<&str>(&e, &value.tag.span, None))?; let df = NuDataFrame::try_from_series(vec![res.into_series()], &tag.span)?; Ok(OutputStream::one(df.into_value(df_tag))) } UntaggedValue::Primitive(Primitive::String(val)) => { let chunked = series.as_ref().utf8().map_err(|e| { parse_polars_error::<&str>( &e, &value.tag.span, Some("The value has to match the series type"), ) })?; let res = chunked .set_at_idx(indices, Some(val.as_ref())) .map_err(|e| parse_polars_error::<&str>(&e, &value.tag.span, None))?; let mut res = res.into_series(); res.rename("string"); let df = NuDataFrame::try_from_series(vec![res.into_series()], &tag.span)?; Ok(OutputStream::one(df.into_value(df_tag))) } _ => Err(ShellError::labeled_error( "Incorrect type", format!( "this value cannot be set in a series of type '{}'", series.as_ref().dtype() ), value.tag.span, )), } } #[cfg(test)] mod tests { use super::DataFrame; use super::ShellError; #[test] fn examples_work_as_expected() -> Result<(), ShellError> { use crate::examples::test_dataframe as test_examples; test_examples(DataFrame {}) } }