compute directory sizes from contained files and directories (#1250)

* compute directory sizes from contained files and directories

* De-lint

* Revert "De-lint"

This reverts commit 9df9fc07d777014fef8f5749a84b4e52e1ee652a.

* Revert "compute directory sizes from contained files and directories"

This reverts commit d43583e9aa20438bd613f78a36e641c9fd48cae3.

* Nu du command

* Nu du for you

* Add async support

* Lints

* so much bug fixing
This commit is contained in:
Corvus Corax 2020-01-25 20:43:29 -06:00 committed by Jonathan Turner
parent 35359cbc22
commit d48f99cb0e
5 changed files with 323 additions and 4 deletions

View File

@ -73,10 +73,9 @@ impl PrettyDebug for ReturnSuccess {
/// The core Result type for pipelines
pub type ReturnValue = Result<ReturnSuccess, ShellError>;
impl Into<ReturnValue> for Value {
/// Lift a Value into a ReturnValue
fn into(self) -> ReturnValue {
Ok(ReturnSuccess::Value(self))
/// Lift a `Value` into a `ReturnValue`.
///
/// Implemented as `From` (rather than a hand-written `Into`) so the blanket
/// `Into<ReturnValue>` impl comes for free.
impl From<Value> for ReturnValue {
/// Wraps `v` as a successful `ReturnSuccess::Value`.
fn from(v: Value) -> Self {
Ok(ReturnSuccess::Value(v))
}
}

View File

@ -368,3 +368,9 @@ impl From<String> for UntaggedValue {
UntaggedValue::Primitive(Primitive::String(input))
}
}
/// Allows a `ShellError` to be carried inside a value as `UntaggedValue::Error`.
impl From<ShellError> for UntaggedValue {
/// Wraps `e` in the `Error` variant without altering it.
fn from(e: ShellError) -> Self {
UntaggedValue::Error(e)
}
}

View File

@ -254,6 +254,7 @@ pub async fn cli() -> Result<(), Box<dyn Error>> {
// System/file operations
whole_stream_command(Pwd),
per_item_command(Ls),
per_item_command(Du),
whole_stream_command(Cd),
whole_stream_command(Env),
per_item_command(Remove),

View File

@ -18,6 +18,7 @@ pub(crate) mod cp;
pub(crate) mod date;
pub(crate) mod debug;
pub(crate) mod default;
pub(crate) mod du;
pub(crate) mod echo;
pub(crate) mod edit;
pub(crate) mod enter;
@ -113,6 +114,7 @@ pub(crate) use cp::Cpy;
pub(crate) use date::Date;
pub(crate) use debug::Debug;
pub(crate) use default::Default;
pub(crate) use du::Du;
pub(crate) use echo::Echo;
pub(crate) use edit::Edit;
pub(crate) mod clear;

311
src/commands/du.rs Normal file
View File

@ -0,0 +1,311 @@
use crate::commands::command::RunnablePerItemContext;
use crate::prelude::*;
use glob::*;
use indexmap::map::IndexMap;
use nu_errors::ShellError;
use nu_protocol::{CallInfo, ReturnSuccess, Signature, SyntaxShape, UntaggedValue, Value};
use nu_source::Tagged;
use std::fs;
use std::path::PathBuf;
use std::sync::atomic::Ordering;
/// Name under which the command is registered and its signature is built.
const NAME: &str = "du";
/// Glob matching options used when expanding the starting path pattern.
const GLOB_PARAMS: MatchOptions = MatchOptions {
// Match file names case-sensitively.
case_sensitive: true,
// Per the glob crate docs, wildcards then do not match path separators,
// so a pattern only expands within a single directory level.
require_literal_separator: true,
// Wildcards are allowed to match names that start with a dot.
require_literal_leading_dot: false,
};
/// Marker type for the `du` command; the behavior lives in its
/// `PerItemCommand` implementation.
pub struct Du;
/// Arguments of the `du` command, deserialized from the call.
///
/// Field names (and the `serde(rename)` attributes) mirror the names declared
/// in the command signature.
#[derive(Deserialize, Clone)]
pub struct DuArgs {
// Optional starting path / glob pattern; when absent, `*` is globbed instead.
path: Option<Tagged<PathBuf>>,
// `--all`: report files as well as directories.
all: bool,
// `--deref`: size symlinks by their targets instead of the links themselves.
deref: bool,
// `--exclude`: glob pattern for file names to leave out.
exclude: Option<Tagged<String>>,
// `--max-depth`: directory recursion limit.
#[serde(rename = "max-depth")]
max_depth: Option<Tagged<u64>>,
// `--min-size`: minimum file size threshold.
#[serde(rename = "min-size")]
min_size: Option<Tagged<u64>>,
}
/// Exposes `du` as a per-item command: declares its name, signature and
/// usage text, and forwards execution to the free function `du`.
impl PerItemCommand for Du {
    /// The command name used for registration.
    fn name(&self) -> &str {
        NAME
    }

    /// Declares the optional starting path, the two switches and the three
    /// named options accepted by the command.
    fn signature(&self) -> Signature {
        let with_path =
            Signature::build(NAME).optional("path", SyntaxShape::Pattern, "starting directory");

        let with_switches = with_path
            .switch("all", "Output File sizes as well as directory sizes")
            .switch("deref", "Dereference symlinks to their targets for size");

        with_switches
            .named("exclude", SyntaxShape::Pattern, "Exclude these file names")
            .named("max-depth", SyntaxShape::Int, "Directory recursion limit")
            .named(
                "min-size",
                SyntaxShape::Int,
                "Exclude files below this size",
            )
    }

    /// One-line help text.
    fn usage(&self) -> &str {
        "Find disk usage sizes of specified items"
    }

    /// Deserializes the call arguments into `DuArgs` and runs `du` with them.
    /// The registry and the incoming item are not used.
    fn run(
        &self,
        call_info: &CallInfo,
        _registry: &CommandRegistry,
        raw_args: &RawCommandArgs,
        _input: Value,
    ) -> Result<OutputStream, ShellError> {
        let ctrl_c = raw_args.ctrl_c.clone();
        let runnable = call_info.process(&raw_args.shell_manager, ctrl_c, du)?;
        runnable.run()
    }
}
fn du(args: DuArgs, ctx: &RunnablePerItemContext) -> Result<OutputStream, ShellError> {
let tag = ctx.name.clone();
let exclude = args
.exclude
.clone()
.map_or(Ok(None), move |x| match Pattern::new(&x.item) {
Ok(p) => Ok(Some(p)),
Err(e) => Err(ShellError::labeled_error(
e.msg,
"Glob error",
x.tag.clone(),
)),
})?;
let path = args.path.clone();
let filter_files = path.is_none();
let paths = match path {
Some(p) => match glob::glob_with(
p.item.to_str().expect("Why isn't this encoded properly?"),
GLOB_PARAMS,
) {
Ok(g) => Ok(g),
Err(e) => Err(ShellError::labeled_error(
e.msg,
"Glob error",
p.tag.clone(),
)),
},
None => match glob::glob_with("*", GLOB_PARAMS) {
Ok(g) => Ok(g),
Err(e) => Err(ShellError::labeled_error(e.msg, "Glob error", tag.clone())),
},
}?
.filter(move |p| {
if filter_files {
match p {
Ok(f) if f.is_dir() => true,
Err(e) if e.path().is_dir() => true,
_ => false,
}
} else {
true
}
})
.map(move |p| match p {
Err(e) => Err(glob_err_into(e)),
Ok(s) => Ok(s),
});
let ctrl_c = ctx.ctrl_c.clone();
let all = args.all;
let deref = args.deref;
let max_depth = args.max_depth.map(|f| f.item);
let min_size = args.min_size.map(|f| f.item);
let stream = async_stream! {
for path in paths {
if ctrl_c.load(Ordering::SeqCst) {
break;
}
match path {
Ok(p) => match get_info(p, deref, &min_size, &exclude, &max_depth, all) {
Ok(Some(mut d)) => {
d.set_tag(tag.clone());
yield ReturnSuccess::value(d);
}
Err(e) => yield Err(e),
_ => yield ReturnSuccess::value(UntaggedValue::nothing().into_untagged_value()),
},
Err(e) => yield Err(e),
}
}
};
Ok(stream.to_output_stream())
}
/// Recursively measures `path`.
///
/// * `deref` - size files through symlinks (`fs::metadata`) instead of sizing
///   the link itself (`fs::symlink_metadata`).
/// * `min_size` - files smaller than this are left out; a file exactly at the
///   threshold is kept.
/// * `exclude` - files whose final name component matches are left out.
///   Directories are never excluded by this pattern.
/// * `depth` - remaining recursion budget; `Some(0)` yields `None`.
/// * `all` - also record files (not only sub-directories) as children.
///
/// Returns `Ok(None)` when the entry is filtered out. For a directory, the
/// returned `Info` holds the sum of every counted descendant; failures on
/// individual children are collected on the directory's `Info` rather than
/// aborting the walk.
///
/// # Errors
///
/// Fails when the directory itself cannot be read or the file's metadata
/// cannot be obtained.
fn get_info<'a>(
    path: PathBuf,
    deref: bool,
    min_size: &'a Option<u64>,
    exclude: &'a Option<Pattern>,
    depth: &'a Option<u64>,
    all: bool,
) -> Result<Option<Info>, ShellError> {
    if *depth == Some(0) {
        return Ok(None);
    }

    // NOTE: `Path::is_dir` follows symlinks, so a link to a directory is
    // walked like the directory itself regardless of `deref`.
    if path.is_dir() {
        let entries = fs::read_dir(&path)?;
        // Lossy conversion: a non-UTF-8 directory name must not panic.
        let mut info = Info::new(path.to_string_lossy());
        // `depth` is non-zero here (checked above), so this cannot underflow.
        let child_depth = depth.map(|d| d - 1);

        for entry in entries {
            match entry {
                Ok(e) => match get_info(e.path(), deref, min_size, exclude, &child_depth, all) {
                    Ok(Some(child)) => {
                        info.size += child.size;
                        if child.f_type == Type::Dir || all {
                            info.add_sub(e.file_name().to_string_lossy().into(), child);
                        }
                    }
                    Ok(None) => continue,
                    Err(err) => info.add_err(err),
                },
                Err(err) => info.add_err(ShellError::from(err)),
            }
        }

        return Ok(Some(info));
    }

    // A path without a final component has no name to match, so it is kept.
    let excluded = exclude.as_ref().map_or(false, |pattern| {
        path.file_name()
            .map_or(false, |name| pattern.matches(&name.to_string_lossy()))
    });
    if excluded {
        return Ok(None);
    }

    // Query only the metadata that is actually needed: following the link
    // when `deref` is off would turn every dangling symlink into an error.
    let size = if deref {
        fs::metadata(&path)?.len()
    } else {
        fs::symlink_metadata(&path)?.len()
    };

    // "Exclude files below this size": a file of exactly `min` is not below it.
    if min_size.map_or(true, |min| size >= min) {
        Ok(Some(Info::new_file(path.to_string_lossy(), size)))
    } else {
        Ok(None)
    }
}
/// Kind of file-system entry an `Info` describes.
#[derive(PartialEq)]
enum Type {
// A non-directory entry, created through `Info::new_file`.
File,
// A directory, the default produced by `Info::new`.
Dir,
}
/// Size report for one file-system entry and, for directories, its children.
struct Info {
// Child reports keyed by entry name, in insertion order.
sub: IndexMap<String, Info>,
// Errors collected while walking this entry's children, stored as values.
errors: Vec<Value>,
// Size in bytes; for a directory, the sum of its counted descendants.
size: u64,
// Path of the entry as text.
name: String,
// Tag assigned through `set_tag`; starts out as `Tag::unknown()`.
tag: Tag,
// Whether this entry is a file or a directory.
f_type: Type,
}
impl Info {
    /// Creates an empty directory report named `name`: no children, no
    /// errors, size zero and an unknown tag.
    fn new(name: impl Into<String>) -> Self {
        Self {
            name: name.into(),
            size: 0,
            f_type: Type::Dir,
            tag: Tag::unknown(),
            sub: IndexMap::new(),
            errors: Vec::new(),
        }
    }

    /// Creates a file report named `name` with the given `size` in bytes.
    fn new_file(name: impl Into<String>, size: u64) -> Info {
        Info {
            f_type: Type::File,
            size,
            ..Info::new(name)
        }
    }

    /// Records `i` as the child stored under key `s`, replacing any previous
    /// child with the same key.
    fn add_sub(&mut self, s: String, i: Info) {
        self.sub.insert(s, i);
    }

    /// Converts `e` into an untagged value and appends it to the error list.
    fn add_err(&mut self, e: impl Into<UntaggedValue>) {
        let untagged: UntaggedValue = e.into();
        self.errors.push(untagged.into_untagged_value());
    }

    /// Replaces the stored tag with `t`.
    fn set_tag(&mut self, t: Tag) {
        self.tag = t;
    }
}
/// Converts a glob traversal error into a `ShellError` by way of the I/O
/// error it wraps.
fn glob_err_into(e: GlobError) -> ShellError {
    ShellError::from(e.into_error())
}
impl From<Info> for Value {
fn from(i: Info) -> Self {
let n = i.name;
let s = i.size;
let mut subs: Vec<Value> = Vec::new();
let mut row: IndexMap<String, Value> = IndexMap::new();
row.insert(
"name".to_string(),
UntaggedValue::string(n).into_untagged_value(),
);
row.insert(
"size".to_string(),
UntaggedValue::bytes(s).into_untagged_value(),
);
for (_k, v) in i.sub {
subs.push(v.into());
}
if !subs.is_empty() {
row.insert(
"contents".to_string(),
UntaggedValue::Table(subs).into_untagged_value(),
);
} else {
row.insert(
"contents".to_string(),
UntaggedValue::nothing().into_untagged_value(),
);
}
if !i.errors.is_empty() {
row.insert(
"errors".to_string(),
UntaggedValue::Table(i.errors).into_untagged_value(),
);
}
UntaggedValue::row(row).into_untagged_value()
}
}