mirror of
https://github.com/servo/servo.git
synced 2025-07-19 13:23:46 +01:00
script: Update name validation for attribute, element, and doctype (#37747)
A recent update in the spec (https://github.com/whatwg/dom/pull/1079) introduced new rules for name validation of attributes, elements, and doctypes. This PR implements the new name validation rules in `components/script/dom/bindings/domname.rs`. The old XML name validation rules are not fully removed because a few usages of them remain in `ProcessingInstructions` and `xpath`. Testing: Covered by WPT tests Fixes: #37746 --------- Signed-off-by: minghuaw <michael.wu1107@gmail.com> Signed-off-by: Minghua Wu <michael.wu1107@gmail.com> Co-authored-by: Xiaocheng Hu <xiaochengh.work@gmail.com>
This commit is contained in:
parent
e14556959d
commit
5b507dc871
17 changed files with 380 additions and 872 deletions
219
components/script/dom/bindings/domname.rs
Normal file
219
components/script/dom/bindings/domname.rs
Normal file
|
@ -0,0 +1,219 @@
|
|||
/* This Source Code Form is subject to the terms of the Mozilla Public
|
||||
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
||||
* file, You can obtain one at https://mozilla.org/MPL/2.0/. */
|
||||
|
||||
//! Functions for validating names as defined in the DOM Standard: <https://dom.spec.whatwg.org/#namespaces>
|
||||
|
||||
use html5ever::{LocalName, Namespace, Prefix, ns};
|
||||
use script_bindings::error::{Error, Fallible};
|
||||
use script_bindings::str::DOMString;
|
||||
|
||||
/// <https://infra.spec.whatwg.org/#xml-namespace>
|
||||
const XML_NAMESPACE: &str = "http://www.w3.org/XML/1998/namespace";
|
||||
|
||||
/// <https://infra.spec.whatwg.org/#xmlns-namespace>
|
||||
const XMLNS_NAMESPACE: &str = "http://www.w3.org/2000/xmlns/";
|
||||
|
||||
/// Reports whether `p` is a valid namespace prefix.
///
/// <https://dom.spec.whatwg.org/#valid-namespace-prefix>
fn is_valid_namespace_prefix(p: &str) -> bool {
    // Code points a prefix must not contain: ASCII whitespace,
    // U+0000 NULL, U+002F (/) and U+003E (>).
    let is_forbidden = |c: char| c.is_ascii_whitespace() || matches!(c, '\0' | '/' | '>');

    // Valid means: at least one code point, none of them forbidden.
    !p.is_empty() && !p.contains(is_forbidden)
}
|
||||
|
||||
/// Reports whether `name` is a valid attribute local name.
///
/// <https://dom.spec.whatwg.org/#valid-attribute-local-name>
pub(crate) fn is_valid_attribute_local_name(name: &str) -> bool {
    // Code points an attribute local name must not contain: ASCII whitespace,
    // U+0000 NULL, U+002F (/), U+003D (=) and U+003E (>).
    let is_forbidden =
        |c: char| c.is_ascii_whitespace() || matches!(c, '\0' | '/' | '=' | '>');

    // Valid means: at least one code point, none of them forbidden.
    !name.is_empty() && !name.contains(is_forbidden)
}
|
||||
|
||||
/// Reports whether `name` is a valid element local name.
///
/// <https://dom.spec.whatwg.org/#valid-element-local-name>
///
/// Two shapes are accepted:
/// * a name starting with an ASCII alpha, which may then contain anything
///   except ASCII whitespace, U+0000 NULL, U+002F (/) and U+003E (>);
/// * a name starting with U+003A (:), U+005F (_) or a code point in
///   U+0080..=U+10FFFF, whose remaining code points must each be an ASCII
///   alphanumeric, U+002D (-), U+002E (.), U+003A (:), U+005F (_) or in
///   U+0080..=U+10FFFF.
pub(crate) fn is_valid_element_local_name(name: &str) -> bool {
    let mut rest = name.chars();

    // Step 1. If name's length is 0, then return false.
    let Some(first) = rest.next() else {
        return false;
    };

    // Step 2. If name's 0th code point is an ASCII alpha, then:
    if first.is_ascii_alphabetic() {
        // Step 2.1 If name contains ASCII whitespace,
        // U+0000 NULL, U+002F (/), or U+003E (>), then return false.
        // (The 0th code point is an ASCII alpha, so only the rest needs checking.)
        return !rest
            .any(|c| c.is_ascii_whitespace() || matches!(c, '\u{0000}' | '\u{002F}' | '\u{003E}'));
    }

    // Step 3. If name's 0th code point is not U+003A (:), U+005F (_),
    // or in the range U+0080 to U+10FFFF, inclusive, then return false.
    if !matches!(first, '\u{003A}' | '\u{005F}' | '\u{0080}'..='\u{10FFFF}') {
        return false;
    }

    // Step 4. If name's subsequent code points, if any, are not ASCII alphas,
    // ASCII digits, U+002D (-), U+002E (.), U+003A (:), U+005F (_),
    // or in the range U+0080 to U+10FFFF, inclusive, then return false.
    rest.all(|c| {
        c.is_ascii_alphanumeric() ||
            matches!(
                c,
                '\u{002D}' | '\u{002E}' | '\u{003A}' | '\u{005F}' | '\u{0080}'..='\u{10FFFF}'
            )
    })
}
|
||||
|
||||
/// Reports whether `name` is a valid doctype name.
///
/// <https://dom.spec.whatwg.org/#valid-doctype-name>
pub(crate) fn is_valid_doctype_name(name: &str) -> bool {
    // Every code point must be something other than ASCII whitespace,
    // U+0000 NULL and U+003E (>). No minimum length is imposed here, so the
    // empty string passes.
    name.chars()
        .all(|c| !c.is_ascii_whitespace() && !matches!(c, '\0' | '>'))
}
|
||||
|
||||
/// Convert a possibly-null URL to a namespace.
|
||||
///
|
||||
/// If the URL is None, returns the empty namespace.
|
||||
pub(crate) fn namespace_from_domstring(url: Option<DOMString>) -> Namespace {
|
||||
match url {
|
||||
None => ns!(),
|
||||
Some(s) => Namespace::from(s),
|
||||
}
|
||||
}
|
||||
|
||||
/// Selects which local-name rules [`validate_and_extract`] applies to the
/// qualified name it is given.
///
/// <https://dom.spec.whatwg.org/#validate-and-extract>
#[derive(Debug, Clone, Copy)]
pub(crate) enum Context {
    /// The local name is checked with [`is_valid_attribute_local_name`].
    Attribute,
    /// The local name is checked with [`is_valid_element_local_name`].
    Element,
}
|
||||
|
||||
/// <https://dom.spec.whatwg.org/#validate-and-extract>
|
||||
pub(crate) fn validate_and_extract(
|
||||
namespace: Option<DOMString>,
|
||||
qualified_name: &str,
|
||||
context: Context,
|
||||
) -> Fallible<(Namespace, Option<Prefix>, LocalName)> {
|
||||
// Step 1. If namespace is the empty string, then set it to null.
|
||||
let namespace = namespace_from_domstring(namespace);
|
||||
|
||||
// Step 2. Let prefix be null.
|
||||
let mut prefix = None;
|
||||
// Step 3. Let localName be qualifiedName.
|
||||
let mut local_name = qualified_name;
|
||||
// Step 4. If qualifiedName contains a U+003A (:):
|
||||
if let Some(idx) = qualified_name.find(':') {
|
||||
// Step 4.1. Let splitResult be the result of running
|
||||
// strictly split given qualifiedName and U+003A (:).
|
||||
let p = &qualified_name[..idx];
|
||||
|
||||
// Step 5. If prefix is not a valid namespace prefix,
|
||||
// then throw an "InvalidCharacterError" DOMException.
|
||||
if !is_valid_namespace_prefix(p) {
|
||||
debug!("Not a valid namespace prefix");
|
||||
return Err(Error::InvalidCharacter);
|
||||
}
|
||||
|
||||
// Step 4.2. Set prefix to splitResult[0].
|
||||
prefix = Some(p);
|
||||
|
||||
// Step 4.3. Set localName to splitResult[1].
|
||||
let remaining = &qualified_name[(idx + 1).min(qualified_name.len())..];
|
||||
match remaining.find(':') {
|
||||
Some(end) => local_name = &remaining[..end],
|
||||
None => local_name = remaining,
|
||||
};
|
||||
}
|
||||
|
||||
if let Some(p) = prefix {
|
||||
// Step 5. If prefix is not a valid namespace prefix,
|
||||
// then throw an "InvalidCharacterError" DOMException.
|
||||
if !is_valid_namespace_prefix(p) {
|
||||
debug!("Not a valid namespace prefix");
|
||||
return Err(Error::InvalidCharacter);
|
||||
}
|
||||
}
|
||||
|
||||
match context {
|
||||
// Step 6. If context is "attribute" and localName
|
||||
// is not a valid attribute local name, then
|
||||
// throw an "InvalidCharacterError" DOMException.
|
||||
Context::Attribute => {
|
||||
if !is_valid_attribute_local_name(local_name) {
|
||||
debug!("Not a valid attribute name");
|
||||
return Err(Error::InvalidCharacter);
|
||||
}
|
||||
},
|
||||
// Step 7. If context is "element" and localName
|
||||
// is not a valid element local name, then
|
||||
// throw an "InvalidCharacterError" DOMException.
|
||||
Context::Element => {
|
||||
if !is_valid_element_local_name(local_name) {
|
||||
debug!("Not a valid element name");
|
||||
return Err(Error::InvalidCharacter);
|
||||
}
|
||||
},
|
||||
}
|
||||
|
||||
match prefix {
|
||||
// Step 8. If prefix is non-null and namespace is null,
|
||||
// then throw a "NamespaceError" DOMException.
|
||||
Some(_) if namespace.is_empty() => Err(Error::Namespace),
|
||||
// Step 9. If prefix is "xml" and namespace is not the XML namespace,
|
||||
// then throw a "NamespaceError" DOMException.
|
||||
Some("xml") if *namespace != *XML_NAMESPACE => Err(Error::Namespace),
|
||||
// Step 10. If either qualifiedName or prefix is "xmlns" and namespace
|
||||
// is not the XMLNS namespace, then throw a "NamespaceError" DOMException.
|
||||
p if (qualified_name == "xmlns" || p == Some("xmlns")) &&
|
||||
*namespace != *XMLNS_NAMESPACE =>
|
||||
{
|
||||
Err(Error::Namespace)
|
||||
},
|
||||
Some(_) if qualified_name == "xmlns" && *namespace != *XMLNS_NAMESPACE => {
|
||||
Err(Error::Namespace)
|
||||
},
|
||||
// Step 11. If namespace is the XMLNS namespace and neither qualifiedName
|
||||
// nor prefix is "xmlns", then throw a "NamespaceError" DOMException.
|
||||
p if *namespace == *XMLNS_NAMESPACE &&
|
||||
(qualified_name != "xmlns" && p != Some("xmlns")) =>
|
||||
{
|
||||
Err(Error::Namespace)
|
||||
},
|
||||
// Step 12. Return (namespace, prefix, localName).
|
||||
_ => Ok((
|
||||
namespace,
|
||||
prefix.map(Prefix::from),
|
||||
LocalName::from(local_name),
|
||||
)),
|
||||
}
|
||||
}
|
|
@ -139,6 +139,7 @@ pub(crate) mod buffer_source;
|
|||
pub(crate) mod cell;
|
||||
pub(crate) mod constructor;
|
||||
pub(crate) mod conversions;
|
||||
pub(crate) mod domname;
|
||||
pub(crate) mod error;
|
||||
pub(crate) mod frozenarray;
|
||||
pub(crate) mod function;
|
||||
|
|
|
@ -4,14 +4,9 @@
|
|||
|
||||
//! Functions for validating and extracting qualified XML names.
|
||||
|
||||
use html5ever::{LocalName, Namespace, Prefix, ns};
|
||||
|
||||
use crate::dom::bindings::error::{Error, Fallible};
|
||||
use crate::dom::bindings::str::DOMString;
|
||||
|
||||
/// Check if an element name is valid. See <http://www.w3.org/TR/xml/#NT-Name>
|
||||
/// for details.
|
||||
fn is_valid_start(c: char) -> bool {
|
||||
pub(crate) fn is_valid_start(c: char) -> bool {
|
||||
matches!(c, ':' |
|
||||
'A'..='Z' |
|
||||
'_' |
|
||||
|
@ -30,7 +25,7 @@ fn is_valid_start(c: char) -> bool {
|
|||
'\u{10000}'..='\u{EFFFF}')
|
||||
}
|
||||
|
||||
fn is_valid_continuation(c: char) -> bool {
|
||||
pub(crate) fn is_valid_continuation(c: char) -> bool {
|
||||
is_valid_start(c) ||
|
||||
matches!(c,
|
||||
'-' |
|
||||
|
@ -41,103 +36,6 @@ fn is_valid_continuation(c: char) -> bool {
|
|||
'\u{203F}'..='\u{2040}')
|
||||
}
|
||||
|
||||
/// Validate a qualified name. See <https://dom.spec.whatwg.org/#validate> for details.
|
||||
///
|
||||
/// On success, this returns a tuple `(prefix, local name)`.
|
||||
pub(crate) fn validate_and_extract_qualified_name(
|
||||
qualified_name: &str,
|
||||
) -> Fallible<(Option<&str>, &str)> {
|
||||
if qualified_name.is_empty() {
|
||||
// Qualified names must not be empty
|
||||
return Err(Error::InvalidCharacter);
|
||||
}
|
||||
let mut colon_offset = None;
|
||||
let mut at_start_of_name = true;
|
||||
|
||||
for (byte_position, c) in qualified_name.char_indices() {
|
||||
if c == ':' {
|
||||
if colon_offset.is_some() {
|
||||
// Qualified names must not contain more than one colon
|
||||
return Err(Error::InvalidCharacter);
|
||||
}
|
||||
colon_offset = Some(byte_position);
|
||||
at_start_of_name = true;
|
||||
continue;
|
||||
}
|
||||
|
||||
if at_start_of_name {
|
||||
if !is_valid_start(c) {
|
||||
// Name segments must begin with a valid start character
|
||||
return Err(Error::InvalidCharacter);
|
||||
}
|
||||
at_start_of_name = false;
|
||||
} else if !is_valid_continuation(c) {
|
||||
// Name segments must consist of valid characters
|
||||
return Err(Error::InvalidCharacter);
|
||||
}
|
||||
}
|
||||
|
||||
let Some(colon_offset) = colon_offset else {
|
||||
// Simple case: there is no prefix
|
||||
return Ok((None, qualified_name));
|
||||
};
|
||||
|
||||
let (prefix, local_name) = qualified_name.split_at(colon_offset);
|
||||
let local_name = &local_name[1..]; // Remove the colon
|
||||
|
||||
if prefix.is_empty() || local_name.is_empty() {
|
||||
// Neither prefix nor local name can be empty
|
||||
return Err(Error::InvalidCharacter);
|
||||
}
|
||||
|
||||
Ok((Some(prefix), local_name))
|
||||
}
|
||||
|
||||
/// Validate a namespace and qualified name and extract their parts.
|
||||
/// See <https://dom.spec.whatwg.org/#validate-and-extract> for details.
|
||||
pub(crate) fn validate_and_extract(
|
||||
namespace: Option<DOMString>,
|
||||
qualified_name: &str,
|
||||
) -> Fallible<(Namespace, Option<Prefix>, LocalName)> {
|
||||
// Step 1. If namespace is the empty string, then set it to null.
|
||||
let namespace = namespace_from_domstring(namespace);
|
||||
|
||||
// Step 2. Validate qualifiedName.
|
||||
// Step 3. Let prefix be null.
|
||||
// Step 4. Let localName be qualifiedName.
|
||||
// Step 5. If qualifiedName contains a U+003A (:):
|
||||
// NOTE: validate_and_extract_qualified_name does all of these things for us, because
|
||||
// it's easier to do them together
|
||||
let (prefix, local_name) = validate_and_extract_qualified_name(qualified_name)?;
|
||||
debug_assert!(!local_name.contains(':'));
|
||||
|
||||
match (namespace, prefix) {
|
||||
(ns!(), Some(_)) => {
|
||||
// Step 6. If prefix is non-null and namespace is null, then throw a "NamespaceError" DOMException.
|
||||
Err(Error::Namespace)
|
||||
},
|
||||
(ref ns, Some("xml")) if ns != &ns!(xml) => {
|
||||
// Step 7. If prefix is "xml" and namespace is not the XML namespace,
|
||||
// then throw a "NamespaceError" DOMException.
|
||||
Err(Error::Namespace)
|
||||
},
|
||||
(ref ns, p) if ns != &ns!(xmlns) && (qualified_name == "xmlns" || p == Some("xmlns")) => {
|
||||
// Step 8. If either qualifiedName or prefix is "xmlns" and namespace is not the XMLNS namespace,
|
||||
// then throw a "NamespaceError" DOMException.
|
||||
Err(Error::Namespace)
|
||||
},
|
||||
(ns!(xmlns), p) if qualified_name != "xmlns" && p != Some("xmlns") => {
|
||||
// Step 9. If namespace is the XMLNS namespace and neither qualifiedName nor prefix is "xmlns",
|
||||
// then throw a "NamespaceError" DOMException.
|
||||
Err(Error::Namespace)
|
||||
},
|
||||
(ns, p) => {
|
||||
// Step 10. Return namespace, prefix, and localName.
|
||||
Ok((ns, p.map(Prefix::from), LocalName::from(local_name)))
|
||||
},
|
||||
}
|
||||
}
|
||||
|
||||
pub(crate) fn matches_name_production(name: &str) -> bool {
|
||||
let mut iter = name.chars();
|
||||
|
||||
|
@ -146,13 +44,3 @@ pub(crate) fn matches_name_production(name: &str) -> bool {
|
|||
}
|
||||
iter.all(is_valid_continuation)
|
||||
}
|
||||
|
||||
/// Convert a possibly-null URL to a namespace.
|
||||
///
|
||||
/// If the URL is None, returns the empty namespace.
|
||||
pub(crate) fn namespace_from_domstring(url: Option<DOMString>) -> Namespace {
|
||||
match url {
|
||||
None => ns!(),
|
||||
Some(s) => Namespace::from(s),
|
||||
}
|
||||
}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue