fixes an issue with an empty selector panic (#5345)

* fixes an issue with an empty selector panic

* missed web_tables

* oops, missed a test
This commit is contained in:
Darren Schroeder 2022-04-27 07:38:36 -05:00 committed by GitHub
parent 5c9fe85ec4
commit e7831d38ae
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
2 changed files with 42 additions and 24 deletions

View File

@ -87,12 +87,14 @@ fn begin_selector_query(input_html: String, selector: Selector, span: Span) -> V
input_html.as_str(), input_html.as_str(),
selector.query.as_str(), selector.query.as_str(),
selector.as_html, selector.as_html,
selector.inspect,
span, span,
), ),
false => execute_selector_query_with_attribute( false => execute_selector_query_with_attribute(
input_html.as_str(), input_html.as_str(),
selector.query.as_str(), selector.query.as_str(),
selector.attribute.as_str(), selector.attribute.as_str(),
selector.inspect,
span, span,
), ),
} }
@ -132,10 +134,7 @@ pub fn retrieve_tables(
if tables.len() == 1 { if tables.len() == 1 {
return retrieve_table( return retrieve_table(
tables tables.into_iter().next().expect("Error retrieving table"),
.into_iter()
.next()
.expect("This should never trigger"),
columns, columns,
span, span,
); );
@ -227,12 +226,13 @@ fn execute_selector_query_with_attribute(
input_string: &str, input_string: &str,
query_string: &str, query_string: &str,
attribute: &str, attribute: &str,
inspect: bool,
span: Span, span: Span,
) -> Value { ) -> Value {
let doc = Html::parse_fragment(input_string); let doc = Html::parse_fragment(input_string);
let vals: Vec<Value> = doc let vals: Vec<Value> = doc
.select(&css(query_string)) .select(&css(query_string, inspect))
.map(|selection| { .map(|selection| {
Value::string( Value::string(
selection.value().attr(attribute).unwrap_or("").to_string(), selection.value().attr(attribute).unwrap_or("").to_string(),
@ -247,17 +247,18 @@ fn execute_selector_query(
input_string: &str, input_string: &str,
query_string: &str, query_string: &str,
as_html: bool, as_html: bool,
inspect: bool,
span: Span, span: Span,
) -> Value { ) -> Value {
let doc = Html::parse_fragment(input_string); let doc = Html::parse_fragment(input_string);
let vals: Vec<Value> = match as_html { let vals: Vec<Value> = match as_html {
true => doc true => doc
.select(&css(query_string)) .select(&css(query_string, inspect))
.map(|selection| Value::string(selection.html(), span)) .map(|selection| Value::string(selection.html(), span))
.collect(), .collect(),
false => doc false => doc
.select(&css(query_string)) .select(&css(query_string, inspect))
.map(|selection| { .map(|selection| {
Value::string( Value::string(
selection selection
@ -272,8 +273,12 @@ fn execute_selector_query(
Value::List { vals, span } Value::List { vals, span }
} }
pub fn css(selector: &str) -> ScraperSelector { pub fn css(selector: &str, inspect: bool) -> ScraperSelector {
ScraperSelector::parse(selector).expect("this should never trigger") if inspect {
ScraperSelector::parse("html").expect("Error unwrapping the default scraperselector")
} else {
ScraperSelector::parse(selector).expect("Error unwrapping scraperselector::parse")
}
} }
#[cfg(test)] #[cfg(test)]
@ -290,15 +295,25 @@ mod tests {
#[test] #[test]
fn test_first_child_is_not_empty() { fn test_first_child_is_not_empty() {
assert!( assert!(!execute_selector_query(
!execute_selector_query(SIMPLE_LIST, "li:first-child", false, Span::test_data()) SIMPLE_LIST,
.is_empty() "li:first-child",
false,
false,
Span::test_data()
) )
.is_empty())
} }
#[test] #[test]
fn test_first_child() { fn test_first_child() {
let item = execute_selector_query(SIMPLE_LIST, "li:first-child", false, Span::test_data()); let item = execute_selector_query(
SIMPLE_LIST,
"li:first-child",
false,
false,
Span::test_data(),
);
let config = nu_protocol::Config::default(); let config = nu_protocol::Config::default();
let out = item.into_string("\n", &config); let out = item.into_string("\n", &config);
assert_eq!("[Coffee]".to_string(), out) assert_eq!("[Coffee]".to_string(), out)

View File

@ -14,12 +14,15 @@ impl WebTable {
/// Finds the first table in `html`. /// Finds the first table in `html`.
pub fn find_first(html: &str) -> Option<WebTable> { pub fn find_first(html: &str) -> Option<WebTable> {
let html = Html::parse_fragment(html); let html = Html::parse_fragment(html);
html.select(&css("table")).next().map(WebTable::new) html.select(&css("table", false)).next().map(WebTable::new)
} }
pub fn find_all_tables(html: &str) -> Option<Vec<WebTable>> { pub fn find_all_tables(html: &str) -> Option<Vec<WebTable>> {
let html = Html::parse_fragment(html); let html = Html::parse_fragment(html);
let iter: Vec<WebTable> = html.select(&css("table")).map(WebTable::new).collect(); let iter: Vec<WebTable> = html
.select(&css("table", false))
.map(WebTable::new)
.collect();
if iter.is_empty() { if iter.is_empty() {
return None; return None;
} }
@ -51,9 +54,9 @@ impl WebTable {
return WebTable::find_all_tables(html); return WebTable::find_all_tables(html);
} }
let sel_table = css("table"); let sel_table = css("table", false);
let sel_tr = css("tr"); let sel_tr = css("tr", false);
let sel_th = css("th"); let sel_th = css("th", false);
let html = Html::parse_fragment(html); let html = Html::parse_fragment(html);
let mut tables = html let mut tables = html
@ -98,9 +101,9 @@ impl WebTable {
} }
// fn new(element: ElementRef) -> Table { // fn new(element: ElementRef) -> Table {
// let sel_tr = css("tr"); // let sel_tr = css("tr", false);
// let sel_th = css("th"); // let sel_th = css("th", false);
// let sel_td = css("td"); // let sel_td = css("td", false);
// let mut headers = HashMap::new(); // let mut headers = HashMap::new();
// let mut rows = element.select(&sel_tr).peekable(); // let mut rows = element.select(&sel_tr).peekable();
@ -117,9 +120,9 @@ impl WebTable {
// } // }
fn new(element: ElementRef) -> WebTable { fn new(element: ElementRef) -> WebTable {
let sel_tr = css("tr"); let sel_tr = css("tr", false);
let sel_th = css("th"); let sel_th = css("th", false);
let sel_td = css("td"); let sel_td = css("td", false);
let mut headers = HashMap::new(); let mut headers = HashMap::new();
let mut rows = element.select(&sel_tr).peekable(); let mut rows = element.select(&sel_tr).peekable();