use crate::prelude::*; use nu_engine::WholeStreamCommand; use nu_errors::ShellError; use nu_protocol::{ dataframe::{Column, NuDataFrame}, Signature, SyntaxShape, UntaggedValue, Value, }; use super::utils::{convert_columns, parse_polars_error}; pub struct DataFrame; impl WholeStreamCommand for DataFrame { fn name(&self) -> &str { "dataframe drop-nulls" } fn usage(&self) -> &str { "[DataFrame, Series] Drops null values in dataframe" } fn signature(&self) -> Signature { Signature::build("dataframe drop-nulls").optional( "subset", SyntaxShape::Table, "subset of columns to drop duplicates", ) } fn run(&self, args: CommandArgs) -> Result { command(args) } fn examples(&self) -> Vec { vec![ Example { description: "drop null values in dataframe", example: r#"let df = ([[a b]; [1 2] [3 0] [1 2]] | dataframe to-df); let res = ($df.b / $df.b); let df = ($df | dataframe with-column $res --name res); $df | dataframe drop-nulls"#, result: Some(vec![NuDataFrame::try_from_columns( vec![ Column::new( "a".to_string(), vec![UntaggedValue::int(1).into(), UntaggedValue::int(1).into()], ), Column::new( "b".to_string(), vec![UntaggedValue::int(2).into(), UntaggedValue::int(2).into()], ), Column::new( "res".to_string(), vec![UntaggedValue::int(1).into(), UntaggedValue::int(1).into()], ), ], &Span::default(), ) .expect("simple df for test should not fail") .into_value(Tag::default())]), }, Example { description: "drop null values in dataframe", example: r#"let s = ([1 2 0 0 3 4] | dataframe to-df); ($s / $s) | dataframe drop-nulls"#, result: Some(vec![NuDataFrame::try_from_columns( vec![Column::new( "div_0_0".to_string(), vec![ UntaggedValue::int(1).into(), UntaggedValue::int(1).into(), UntaggedValue::int(1).into(), UntaggedValue::int(1).into(), ], )], &Span::default(), ) .expect("simple df for test should not fail") .into_value(Tag::default())]), }, ] } } fn command(mut args: CommandArgs) -> Result { let tag = args.call_info.name_tag.clone(); let value = args.input.next().ok_or_else(|| { ShellError::labeled_error("Empty stream", "No value found in stream", &tag.span) })?; match value.value { UntaggedValue::DataFrame(df) => { // Extracting the selection columns of the columns to perform the aggregation let columns: Option> = args.opt(0)?; let (subset, col_span) = match columns { Some(cols) => { let (agg_string, col_span) = convert_columns(&cols, &tag)?; (Some(agg_string), col_span) } None => (None, Span::unknown()), }; let subset_slice = subset.as_ref().map(|cols| &cols[..]); let res = df .as_ref() .drop_nulls(subset_slice) .map_err(|e| parse_polars_error::<&str>(&e, &col_span, None))?; Ok(OutputStream::one(NuDataFrame::dataframe_to_value(res, tag))) } _ => Err(ShellError::labeled_error( "Incorrect type", "drop nulls cannot be done with this value", &value.tag.span, )), } } #[cfg(test)] mod tests { use super::DataFrame; use super::ShellError; #[test] fn examples_work_as_expected() -> Result<(), ShellError> { use crate::examples::test_dataframe as test_examples; test_examples(DataFrame {}) } }