2019-11-17 04:18:41 +01:00
|
|
|
use crate::prelude::*;
|
|
|
|
use calamine::*;
|
2020-08-18 09:00:02 +02:00
|
|
|
use nu_data::TaggedListBuilder;
|
2021-01-10 03:50:49 +01:00
|
|
|
use nu_engine::WholeStreamCommand;
|
Extract core stuff into own crates
This commit extracts five new crates:
- nu-source, which contains the core source-code handling logic in Nu,
including Text, Span, and also the pretty.rs-based debug logic
- nu-parser, which is the parser and expander logic
- nu-protocol, which is the bulk of the types and basic conveniences
used by plugins
- nu-errors, which contains ShellError, ParseError and error handling
conveniences
- nu-textview, which is the textview plugin extracted into a crate
One of the major consequences of this refactor is that it's no longer
possible to `impl X for Spanned<Y>` outside of the `nu-source` crate, so
a lot of types became more concrete (Value became a concrete type
instead of Spanned<Value>, for example).
This also turned a number of inherent methods in the main nu crate into
plain functions (impl Value {} became a bunch of functions in the
`value` namespace in `crate::data::value`).
2019-11-26 03:30:48 +01:00
|
|
|
use nu_errors::ShellError;
|
2020-03-06 17:06:39 +01:00
|
|
|
use nu_protocol::{ReturnSuccess, Signature, TaggedDictBuilder, UntaggedValue};
|
2019-11-17 04:18:41 +01:00
|
|
|
use std::io::Cursor;
|
|
|
|
|
|
|
|
/// Marker type for the `from xlsx` command; it carries no state and exists so
/// the command behaviour can be attached through `WholeStreamCommand`.
pub struct FromXLSX;
|
|
|
|
|
|
|
|
/// Arguments accepted by `from xlsx`, deserialized from the command call.
#[derive(Deserialize)]
pub struct FromXLSXArgs {
    /// Set by the `noheaders` switch ("don't treat the first row as column names").
    // NOTE(review): `from_xlsx` binds this to `_noheaders` and never reads it,
    // so the switch currently has no effect on the output — confirm intent.
    noheaders: bool,
}
|
|
|
|
|
2020-05-29 10:22:52 +02:00
|
|
|
#[async_trait]
|
2019-11-17 04:18:41 +01:00
|
|
|
impl WholeStreamCommand for FromXLSX {
|
|
|
|
fn name(&self) -> &str {
|
2020-05-04 10:44:33 +02:00
|
|
|
"from xlsx"
|
2019-11-17 04:18:41 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
fn signature(&self) -> Signature {
|
2020-05-04 10:44:33 +02:00
|
|
|
Signature::build("from xlsx").switch(
|
2021-02-22 08:25:17 +01:00
|
|
|
"noheaders",
|
2020-02-12 03:24:31 +01:00
|
|
|
"don't treat the first row as column names",
|
2021-02-22 08:25:17 +01:00
|
|
|
Some('n'),
|
2020-02-12 03:24:31 +01:00
|
|
|
)
|
2019-11-17 04:18:41 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
fn usage(&self) -> &str {
|
|
|
|
"Parse binary Excel(.xlsx) data and create table."
|
|
|
|
}
|
|
|
|
|
2020-12-18 08:53:49 +01:00
|
|
|
async fn run(&self, args: CommandArgs) -> Result<OutputStream, ShellError> {
|
|
|
|
from_xlsx(args).await
|
2019-11-17 04:18:41 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-12-18 08:53:49 +01:00
|
|
|
async fn from_xlsx(args: CommandArgs) -> Result<OutputStream, ShellError> {
|
2020-05-16 05:18:24 +02:00
|
|
|
let tag = args.call_info.name_tag.clone();
|
2020-09-21 19:28:31 +02:00
|
|
|
let span = tag.span;
|
2020-06-13 21:13:36 +02:00
|
|
|
let (
|
|
|
|
FromXLSXArgs {
|
2021-02-22 08:25:17 +01:00
|
|
|
noheaders: _noheaders,
|
2020-06-13 21:13:36 +02:00
|
|
|
},
|
|
|
|
input,
|
2020-12-18 08:53:49 +01:00
|
|
|
) = args.process().await?;
|
2020-06-13 21:13:36 +02:00
|
|
|
let value = input.collect_binary(tag.clone()).await?;
|
|
|
|
|
|
|
|
let buf: Cursor<Vec<u8>> = Cursor::new(value.item);
|
|
|
|
let mut xls = Xlsx::<_>::new(buf).map_err(|_| {
|
|
|
|
ShellError::labeled_error("Could not load xlsx file", "could not load xlsx file", &tag)
|
|
|
|
})?;
|
|
|
|
|
|
|
|
let mut dict = TaggedDictBuilder::new(&tag);
|
|
|
|
|
|
|
|
let sheet_names = xls.sheet_names().to_owned();
|
|
|
|
|
|
|
|
for sheet_name in &sheet_names {
|
|
|
|
let mut sheet_output = TaggedListBuilder::new(&tag);
|
|
|
|
|
|
|
|
if let Some(Ok(current_sheet)) = xls.worksheet_range(sheet_name) {
|
|
|
|
for row in current_sheet.rows() {
|
|
|
|
let mut row_output = TaggedDictBuilder::new(&tag);
|
|
|
|
for (i, cell) in row.iter().enumerate() {
|
|
|
|
let value = match cell {
|
|
|
|
DataType::Empty => UntaggedValue::nothing(),
|
|
|
|
DataType::String(s) => UntaggedValue::string(s),
|
2020-09-21 19:28:31 +02:00
|
|
|
DataType::Float(f) => UntaggedValue::decimal_from_float(*f, span),
|
2020-06-13 21:13:36 +02:00
|
|
|
DataType::Int(i) => UntaggedValue::int(*i),
|
|
|
|
DataType::Bool(b) => UntaggedValue::boolean(*b),
|
|
|
|
_ => UntaggedValue::nothing(),
|
|
|
|
};
|
|
|
|
|
|
|
|
row_output.insert_untagged(&format!("Column{}", i), value);
|
2019-11-17 04:18:41 +01:00
|
|
|
}
|
|
|
|
|
2020-06-13 21:13:36 +02:00
|
|
|
sheet_output.push_untagged(row_output.into_untagged_value());
|
2019-11-17 04:18:41 +01:00
|
|
|
}
|
2020-03-06 17:06:39 +01:00
|
|
|
|
2020-06-13 21:13:36 +02:00
|
|
|
dict.insert_untagged(sheet_name, sheet_output.into_untagged_value());
|
|
|
|
} else {
|
|
|
|
return Err(ShellError::labeled_error(
|
|
|
|
"Could not load sheet",
|
|
|
|
"could not load sheet",
|
|
|
|
&tag,
|
|
|
|
));
|
|
|
|
}
|
|
|
|
}
|
2019-11-17 04:18:41 +01:00
|
|
|
|
2020-06-13 21:13:36 +02:00
|
|
|
Ok(OutputStream::one(ReturnSuccess::value(dict.into_value())))
|
2019-11-17 04:18:41 +01:00
|
|
|
}
|
2020-05-18 14:56:01 +02:00
|
|
|
|
|
|
|
#[cfg(test)]
mod tests {
    use super::{FromXLSX, ShellError};
    use crate::examples::test as test_examples;

    /// Passes the command to `crate::examples::test` and returns its result.
    #[test]
    fn examples_work_as_expected() -> Result<(), ShellError> {
        test_examples(FromXLSX {})
    }
}
|