mirror of
https://github.com/nushell/nushell.git
synced 2025-04-01 11:46:20 +02:00
# Description

This doesn't really do much that the user could see, but it helps get us ready to do the steps of the refactor to split the span off of Value, so that values can be spanless. This allows us to have top-level values that can hold both a Value and a Span, without requiring that all values have them.

We expect to see significant memory reduction by removing so many unnecessary spans from values. For example, a table of 100,000 rows and 5 columns would have a savings of ~8megs in just spans that are almost always duplicated.

# User-Facing Changes

Nothing yet

# Tests + Formatting

<!--
Don't forget to add tests that cover your changes.

Make sure you've run and fixed any issues with these commands:

- `cargo fmt --all -- --check` to check standard code formatting (`cargo fmt --all` applies these changes)
- `cargo clippy --workspace -- -D warnings -D clippy::unwrap_used -A clippy::needless_collect -A clippy::result_large_err` to check that you're using the standard code style
- `cargo test --workspace` to check that all tests pass
- `cargo run -- -c "use std testing; testing run-tests --path crates/nu-std"` to run the tests for the standard library

> **Note**
> from `nushell` you can also use the `toolkit` as follows
> ```bash
> use toolkit.nu  # or use an `env_change` hook to activate it automatically
> toolkit check pr
> ```
-->

# After Submitting

<!--
If your PR had any user-facing changes, update [the documentation](https://github.com/nushell/nushell.github.io) after the PR is merged, if necessary. This will help us keep the docs up to date.
-->
212 lines
6.2 KiB
Rust
212 lines
6.2 KiB
Rust
use super::super::super::values::{Column, NuDataFrame};
|
|
|
|
use nu_engine::CallExt;
|
|
use nu_protocol::{
|
|
ast::Call,
|
|
engine::{Command, EngineState, Stack},
|
|
Category, Example, PipelineData, ShellError, Signature, Span, SyntaxShape, Type, Value,
|
|
};
|
|
use polars::prelude::{ChunkSet, DataType, IntoSeries};
|
|
|
|
/// Command type behind `dfr set`.
///
/// The struct carries no data; all behaviour lives in its `Command`
/// implementation.
#[derive(Clone)]
pub struct SetSeries;
|
|
|
|
impl Command for SetSeries {
|
|
fn name(&self) -> &str {
|
|
"dfr set"
|
|
}
|
|
|
|
fn usage(&self) -> &str {
|
|
"Sets value where given mask is true."
|
|
}
|
|
|
|
fn signature(&self) -> Signature {
|
|
Signature::build(self.name())
|
|
.required("value", SyntaxShape::Any, "value to be inserted in series")
|
|
.required_named(
|
|
"mask",
|
|
SyntaxShape::Any,
|
|
"mask indicating insertions",
|
|
Some('m'),
|
|
)
|
|
.input_output_type(
|
|
Type::Custom("dataframe".into()),
|
|
Type::Custom("dataframe".into()),
|
|
)
|
|
.category(Category::Custom("dataframe".into()))
|
|
}
|
|
|
|
fn examples(&self) -> Vec<Example> {
|
|
vec![Example {
|
|
description: "Shifts the values by a given period",
|
|
example: r#"let s = ([1 2 2 3 3] | dfr into-df | dfr shift 2);
|
|
let mask = ($s | dfr is-null);
|
|
$s | dfr set 0 --mask $mask"#,
|
|
result: Some(
|
|
NuDataFrame::try_from_columns(vec![Column::new(
|
|
"0".to_string(),
|
|
vec![
|
|
Value::test_int(0),
|
|
Value::test_int(0),
|
|
Value::test_int(1),
|
|
Value::test_int(2),
|
|
Value::test_int(2),
|
|
],
|
|
)])
|
|
.expect("simple df for test should not fail")
|
|
.into_value(Span::test_data()),
|
|
),
|
|
}]
|
|
}
|
|
|
|
fn run(
|
|
&self,
|
|
engine_state: &EngineState,
|
|
stack: &mut Stack,
|
|
call: &Call,
|
|
input: PipelineData,
|
|
) -> Result<PipelineData, ShellError> {
|
|
command(engine_state, stack, call, input)
|
|
}
|
|
}
|
|
|
|
fn command(
|
|
engine_state: &EngineState,
|
|
stack: &mut Stack,
|
|
call: &Call,
|
|
input: PipelineData,
|
|
) -> Result<PipelineData, ShellError> {
|
|
let value: Value = call.req(engine_state, stack, 0)?;
|
|
|
|
let mask_value: Value = call
|
|
.get_flag(engine_state, stack, "mask")?
|
|
.expect("required named value");
|
|
let mask_span = mask_value.span();
|
|
let mask = NuDataFrame::try_from_value(mask_value)?.as_series(mask_span)?;
|
|
|
|
let bool_mask = match mask.dtype() {
|
|
DataType::Boolean => mask.bool().map_err(|e| {
|
|
ShellError::GenericError(
|
|
"Error casting to bool".into(),
|
|
e.to_string(),
|
|
Some(mask_span),
|
|
None,
|
|
Vec::new(),
|
|
)
|
|
}),
|
|
_ => Err(ShellError::GenericError(
|
|
"Incorrect type".into(),
|
|
"can only use bool series as mask".into(),
|
|
Some(mask_span),
|
|
None,
|
|
Vec::new(),
|
|
)),
|
|
}?;
|
|
|
|
let df = NuDataFrame::try_from_pipeline(input, call.head)?;
|
|
let series = df.as_series(call.head)?;
|
|
|
|
let res = match value {
|
|
Value::Int { val, span } => {
|
|
let chunked = series.i64().map_err(|e| {
|
|
ShellError::GenericError(
|
|
"Error casting to i64".into(),
|
|
e.to_string(),
|
|
Some(span),
|
|
None,
|
|
Vec::new(),
|
|
)
|
|
})?;
|
|
|
|
let res = chunked.set(bool_mask, Some(val)).map_err(|e| {
|
|
ShellError::GenericError(
|
|
"Error setting value".into(),
|
|
e.to_string(),
|
|
Some(span),
|
|
None,
|
|
Vec::new(),
|
|
)
|
|
})?;
|
|
|
|
NuDataFrame::try_from_series(vec![res.into_series()], call.head)
|
|
}
|
|
Value::Float { val, span } => {
|
|
let chunked = series.f64().map_err(|e| {
|
|
ShellError::GenericError(
|
|
"Error casting to f64".into(),
|
|
e.to_string(),
|
|
Some(span),
|
|
None,
|
|
Vec::new(),
|
|
)
|
|
})?;
|
|
|
|
let res = chunked.set(bool_mask, Some(val)).map_err(|e| {
|
|
ShellError::GenericError(
|
|
"Error setting value".into(),
|
|
e.to_string(),
|
|
Some(span),
|
|
None,
|
|
Vec::new(),
|
|
)
|
|
})?;
|
|
|
|
NuDataFrame::try_from_series(vec![res.into_series()], call.head)
|
|
}
|
|
Value::String { val, span } => {
|
|
let chunked = series.utf8().map_err(|e| {
|
|
ShellError::GenericError(
|
|
"Error casting to string".into(),
|
|
e.to_string(),
|
|
Some(span),
|
|
None,
|
|
Vec::new(),
|
|
)
|
|
})?;
|
|
|
|
let res = chunked.set(bool_mask, Some(val.as_ref())).map_err(|e| {
|
|
ShellError::GenericError(
|
|
"Error setting value".into(),
|
|
e.to_string(),
|
|
Some(span),
|
|
None,
|
|
Vec::new(),
|
|
)
|
|
})?;
|
|
|
|
let mut res = res.into_series();
|
|
res.rename("string");
|
|
|
|
NuDataFrame::try_from_series(vec![res.into_series()], call.head)
|
|
}
|
|
_ => Err(ShellError::GenericError(
|
|
"Incorrect value type".into(),
|
|
format!(
|
|
"this value cannot be set in a series of type '{}'",
|
|
series.dtype()
|
|
),
|
|
Some(value.span()),
|
|
None,
|
|
Vec::new(),
|
|
)),
|
|
};
|
|
|
|
res.map(|df| PipelineData::Value(NuDataFrame::into_value(df, call.head), None))
|
|
}
|
|
|
|
#[cfg(test)]
mod test {
    use super::*;

    use super::super::super::super::test_dataframe::test_dataframe;
    use super::super::super::{IsNull, Shift};

    /// Hands the commands to the shared `test_dataframe` helper.
    ///
    /// `IsNull` and `Shift` are passed alongside `SetSeries`, presumably
    /// because the example pipeline also invokes `dfr is-null` and
    /// `dfr shift`.
    #[test]
    fn test_examples() {
        let commands: Vec<Box<dyn Command>> = vec![
            Box::new(SetSeries {}),
            Box::new(IsNull {}),
            Box::new(Shift {}),
        ];

        test_dataframe(commands)
    }
}
|