scraper/
selector.rs
use std::convert::TryFrom;
use std::fmt;
use smallvec::SmallVec;
use html5ever::{LocalName, Namespace};
use selectors::{
matching,
parser::{self, ParseRelative, SelectorParseErrorKind},
};
use crate::error::SelectorErrorKind;
use crate::ElementRef;
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct Selector {
selectors: SmallVec<[parser::Selector<Simple>; 1]>,
}
impl Selector {
pub fn parse(selectors: &'_ str) -> Result<Self, SelectorErrorKind> {
let mut parser_input = cssparser::ParserInput::new(selectors);
let mut parser = cssparser::Parser::new(&mut parser_input);
parser::SelectorList::parse(&Parser, &mut parser, ParseRelative::No)
.map(|list| Selector { selectors: list.0 })
.map_err(SelectorErrorKind::from)
}
pub fn matches(&self, element: &ElementRef) -> bool {
self.matches_with_scope(element, None)
}
pub fn matches_with_scope(&self, element: &ElementRef, scope: Option<ElementRef>) -> bool {
let mut nth_index_cache = Default::default();
let mut context = matching::MatchingContext::new(
matching::MatchingMode::Normal,
None,
&mut nth_index_cache,
matching::QuirksMode::NoQuirks,
matching::NeedsSelectorFlags::No,
matching::IgnoreNthChildForInvalidation::No,
);
context.scope_element = scope.map(|x| selectors::Element::opaque(&x));
self.selectors
.iter()
.any(|s| matching::matches_selector(s, 0, None, element, &mut context))
}
}
struct Parser;
impl<'i> parser::Parser<'i> for Parser {
type Impl = Simple;
type Error = SelectorParseErrorKind<'i>;
}
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub struct Simple;
impl parser::SelectorImpl for Simple {
type AttrValue = CssString;
type Identifier = CssLocalName;
type LocalName = CssLocalName;
type NamespacePrefix = CssLocalName;
type NamespaceUrl = Namespace;
type BorrowedNamespaceUrl = Namespace;
type BorrowedLocalName = CssLocalName;
type NonTSPseudoClass = NonTSPseudoClass;
type PseudoElement = PseudoElement;
type ExtraMatchingData<'a> = ();
}
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct CssString(pub String);
impl<'a> From<&'a str> for CssString {
fn from(val: &'a str) -> Self {
Self(val.to_owned())
}
}
impl AsRef<str> for CssString {
fn as_ref(&self) -> &str {
&self.0
}
}
impl cssparser::ToCss for CssString {
fn to_css<W>(&self, dest: &mut W) -> fmt::Result
where
W: fmt::Write,
{
cssparser::serialize_string(&self.0, dest)
}
}
#[derive(Debug, Default, Clone, PartialEq, Eq)]
pub struct CssLocalName(pub LocalName);
impl<'a> From<&'a str> for CssLocalName {
fn from(val: &'a str) -> Self {
Self(val.into())
}
}
impl cssparser::ToCss for CssLocalName {
fn to_css<W>(&self, dest: &mut W) -> fmt::Result
where
W: fmt::Write,
{
dest.write_str(&self.0)
}
}
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub enum NonTSPseudoClass {}
impl parser::NonTSPseudoClass for NonTSPseudoClass {
type Impl = Simple;
fn is_active_or_hover(&self) -> bool {
false
}
fn is_user_action_state(&self) -> bool {
false
}
}
impl cssparser::ToCss for NonTSPseudoClass {
fn to_css<W>(&self, dest: &mut W) -> fmt::Result
where
W: fmt::Write,
{
dest.write_str("")
}
}
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub enum PseudoElement {}
impl parser::PseudoElement for PseudoElement {
type Impl = Simple;
}
impl cssparser::ToCss for PseudoElement {
fn to_css<W>(&self, dest: &mut W) -> fmt::Result
where
W: fmt::Write,
{
dest.write_str("")
}
}
impl<'i> TryFrom<&'i str> for Selector {
type Error = SelectorErrorKind<'i>;
fn try_from(s: &'i str) -> Result<Self, Self::Error> {
Selector::parse(s)
}
}
#[cfg(test)]
mod tests {
use super::*;
use std::convert::TryInto;
#[test]
fn selector_conversions() {
let s = "#testid.testclass";
let _sel: Selector = s.try_into().unwrap();
let s = s.to_owned();
let _sel: Selector = (*s).try_into().unwrap();
}
#[test]
#[should_panic]
fn invalid_selector_conversions() {
let s = "<failing selector>";
let _sel: Selector = s.try_into().unwrap();
}
}