add 'attr' method in the SelectorBase
parent
d02da8ff20
commit
1cf010b5a0
36
src/lib.rs
36
src/lib.rs
|
@ -1,39 +1,3 @@
|
||||||
pub mod request;
|
pub mod request;
|
||||||
pub mod response;
|
pub mod response;
|
||||||
pub mod selector;
|
pub mod selector;
|
||||||
|
|
||||||
#[cfg(test)]
|
|
||||||
mod tests {
|
|
||||||
use crate::request::{Request, RequestBase};
|
|
||||||
use crate::selector::{Selector, SelectorBase};
|
|
||||||
use http::StatusCode;
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn plain_text_selector() {
|
|
||||||
let html = "
|
|
||||||
<html>
|
|
||||||
<body>
|
|
||||||
<h1>hello world</h1>
|
|
||||||
<p id='text'>good bye</p>
|
|
||||||
<a>simple text</a>
|
|
||||||
</body>
|
|
||||||
</html>
|
|
||||||
"
|
|
||||||
.to_string();
|
|
||||||
let sel = Selector::from_html(html);
|
|
||||||
assert_eq!(sel.css::<Selector>("h1")[0].html(), "<h1>hello world</h1>");
|
|
||||||
assert_eq!(sel.css::<Selector>("#text")[0].content(), "good bye");
|
|
||||||
assert_eq!(
|
|
||||||
sel.css_once::<Selector>("body > a").unwrap().content(),
|
|
||||||
"simple text"
|
|
||||||
);
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn simple_request() {
|
|
||||||
let req: Request = RequestBase::new("https://httpbin.org/").unwrap();
|
|
||||||
let resp = req.launch();
|
|
||||||
assert_eq!(resp.status_code, StatusCode::OK);
|
|
||||||
assert!(resp.css::<Selector>("h2")[0].html().contains("httpbin.org"));
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
|
@ -20,12 +20,20 @@ pub trait SelectorBase {
|
||||||
|
|
||||||
fn content(&self) -> String {
|
fn content(&self) -> String {
|
||||||
let html = nipper::Document::from(self.html().as_str());
|
let html = nipper::Document::from(self.html().as_str());
|
||||||
html.select("*")
|
html.select("body > *")
|
||||||
.iter()
|
.iter()
|
||||||
.map(|element| element.text().to_string())
|
.map(|element| element.text().to_string())
|
||||||
.last()
|
.last()
|
||||||
.unwrap()
|
.unwrap()
|
||||||
}
|
}
|
||||||
|
|
||||||
|
fn attr(&self, attribute: &'static str) -> Option<String> {
|
||||||
|
let html = nipper::Document::from(self.html().as_str());
|
||||||
|
match html.select("body > *").attr(attribute) {
|
||||||
|
Some(text) => Some(format!("{}", text)),
|
||||||
|
None => None,
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
#[derive(Debug)]
|
#[derive(Debug)]
|
||||||
|
|
|
@ -0,0 +1,64 @@
|
||||||
|
use http::StatusCode;
|
||||||
|
use raspa::request::{Request, RequestBase};
|
||||||
|
use raspa::selector::{Selector, SelectorBase};
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn plain_text_selector() {
|
||||||
|
let html = "
|
||||||
|
<html>
|
||||||
|
<body>
|
||||||
|
<h1>hello world</h1>
|
||||||
|
<p id='text'>good bye</p>
|
||||||
|
<a>simple text</a>
|
||||||
|
</body>
|
||||||
|
</html>
|
||||||
|
"
|
||||||
|
.to_string();
|
||||||
|
let sel = Selector::from_html(html);
|
||||||
|
assert_eq!(sel.css::<Selector>("h1")[0].html(), "<h1>hello world</h1>");
|
||||||
|
assert_eq!(sel.css::<Selector>("#text")[0].content(), "good bye");
|
||||||
|
assert_eq!(
|
||||||
|
sel.css_once::<Selector>("body > a").unwrap().content(),
|
||||||
|
"simple text"
|
||||||
|
);
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn simple_request() {
|
||||||
|
let req: Request = RequestBase::new("https://httpbin.org/").unwrap();
|
||||||
|
let resp = req.launch();
|
||||||
|
assert_eq!(resp.status_code, StatusCode::OK);
|
||||||
|
assert!(resp.css::<Selector>("h2")[0].html().contains("httpbin.org"));
|
||||||
|
}
|
||||||
|
|
||||||
|
#[test]
|
||||||
|
fn complex_selectors() {
|
||||||
|
let html = "
|
||||||
|
<html>
|
||||||
|
<body>
|
||||||
|
<p id='text'>good bye</p>
|
||||||
|
<a href='http://google.com'>simple text</a>
|
||||||
|
<ul>
|
||||||
|
<li class='item' id='item-1'>1</li>
|
||||||
|
<li class='item' id='item-2'>2</li>
|
||||||
|
<li class='item' id='item-3'>3</li>
|
||||||
|
</ul>
|
||||||
|
</body>
|
||||||
|
</html>
|
||||||
|
"
|
||||||
|
.to_string();
|
||||||
|
let sel = Selector::from_html(html);
|
||||||
|
assert_eq!(
|
||||||
|
sel.css_once::<Selector>("p").unwrap().attr("id").unwrap(),
|
||||||
|
"text"
|
||||||
|
);
|
||||||
|
assert_eq!(
|
||||||
|
sel.css::<Selector>("a")[0].attr("href").unwrap(),
|
||||||
|
"http://google.com"
|
||||||
|
);
|
||||||
|
for node in sel.css::<Selector>("ul li").iter() {
|
||||||
|
let text = node.content();
|
||||||
|
assert_eq!(node.attr("class").unwrap(), "item");
|
||||||
|
assert!(node.attr("id").unwrap().contains(&text));
|
||||||
|
}
|
||||||
|
}
|
Loading…
Reference in New Issue