diff --git a/CHANGELOG.md b/CHANGELOG.md index 2f828a27026b..f20ab59407be 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -15,6 +15,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 - _Experimental_: Add `user-valid` and `user-invalid` variants ([#12370](https://github.com/tailwindlabs/tailwindcss/pull/12370)) - _Experimental_: Add `wrap-anywhere`, `wrap-break-word`, and `wrap-normal` utilities ([#12128](https://github.com/tailwindlabs/tailwindcss/pull/12128)) - Add `col-` and `row-` utilities for `grid-column` and `grid-row` ([#15183](https://github.com/tailwindlabs/tailwindcss/pull/15183)) +- Add new candidate extractor ([#16306](https://github.com/tailwindlabs/tailwindcss/pull/16306)) ### Fixed diff --git a/Cargo.lock b/Cargo.lock index f742de3eefb0..f87a6e889b0e 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -1,6 +1,6 @@ # This file is automatically @generated by Cargo. # It is not intended for manual editing. -version = 3 +version = 4 [[package]] name = "aho-corasick" @@ -35,9 +35,9 @@ checksum = "b048fb63fd8b5923fc5aa7b340d8e156aec7ec02f0c78fa8a6ddc2613f6f71de" [[package]] name = "bstr" -version = "1.10.0" +version = "1.11.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "40723b8fb387abc38f4f4a37c09073622e41dd12327033091ef8950659e6dc0c" +checksum = "531a9155a481e2ee699d4f98f43c0ca4ff8ee1bfd55c31e9e98fb29d2b176fe0" dependencies = [ "memchr", "regex-automata 0.4.8", @@ -268,9 +268,9 @@ checksum = "68354c5c6bd36d73ff3feceb05efa59b6acb7626617f4962be322a825e61f79a" [[package]] name = "napi" -version = "2.16.11" +version = "2.16.16" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "53575dfa17f208dd1ce3a2da2da4659aae393b256a472f2738a8586a6c4107fd" +checksum = "839ae2ee5e62c6348669c50098b187c08115bd3cced658c9c0bf945fca0fec83" dependencies = [ "bitflags", "ctor", @@ -281,15 +281,15 @@ dependencies = [ [[package]] name = "napi-build" -version = "2.0.1" +version = "2.1.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "882a73d9ef23e8dc2ebbffb6a6ae2ef467c0f18ac10711e4cc59c5485d41df0e" +checksum = "db836caddef23662b94e16bf1f26c40eceb09d6aee5d5b06a7ac199320b69b19" [[package]] name = "napi-derive" -version = "2.16.12" +version = "2.16.13" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "17435f7a00bfdab20b0c27d9c56f58f6499e418252253081bfff448099da31d1" +checksum = "7cbe2585d8ac223f7d34f13701434b9d5f4eb9c332cccce8dee57ea18ab8ab0c" dependencies = [ "cfg-if", "convert_case", @@ -301,9 +301,9 @@ dependencies = [ [[package]] name = "napi-derive-backend" -version = "1.0.74" +version = "1.0.75" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "967c485e00f0bf3b1bdbe510a38a4606919cf1d34d9a37ad41f25a81aa077abe" +checksum = "1639aaa9eeb76e91c6ae66da8ce3e89e921cd3885e99ec85f4abacae72fc91bf" dependencies = [ "convert_case", "once_cell", @@ -450,9 +450,9 @@ checksum = "2b15c43186be67a4fd63bee50d0303afffcef381492ebe2c5d87f324e1b8815c" [[package]] name = "rustc-hash" -version = "2.0.0" +version = "2.1.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "583034fd73374156e66797ed8e5b0d5690409c9226b22d87cb7f19821c05d152" +checksum = "357703d41365b4b27c590e3ed91eabb1b663f07c4c084095e60cbed4362dff0d" [[package]] name = "rustix" diff --git a/crates/node/Cargo.toml b/crates/node/Cargo.toml index 0009076936ab..2222c643fd10 100644 --- a/crates/node/Cargo.toml +++ b/crates/node/Cargo.toml @@ -8,10 +8,10 @@ crate-type = ["cdylib"] [dependencies] # Default enable napi4 feature, see https://nodejs.org/api/n-api.html#node-api-version-matrix -napi = { version = "2.16.11", default-features = false, features = ["napi4"] } -napi-derive = "2.16.12" +napi = { version = "2.16.16", default-features = false, features = ["napi4"] } +napi-derive = "2.16.13" tailwindcss-oxide = { path = "../oxide" } -rayon = "1.5.3" +rayon = "1.10.0" [build-dependencies] -napi-build = "2.0.1" +napi-build = "2.1.4" diff --git a/crates/node/src/lib.rs b/crates/node/src/lib.rs index 2eff57be308d..5811698c3bdd 100644 --- a/crates/node/src/lib.rs +++ b/crates/node/src/lib.rs @@ -28,12 +28,23 @@ pub struct GlobEntry { pub pattern: String, } -impl From for tailwindcss_oxide::ChangedContent { +impl From for tailwindcss_oxide::ChangedContent<'_> { fn from(changed_content: ChangedContent) -> Self { - Self { - file: changed_content.file.map(Into::into), - content: changed_content.content, + if let Some(file) = changed_content.file { + return tailwindcss_oxide::ChangedContent::File( + file.into(), + changed_content.extension.into(), + ); + } + + if let Some(contents) = changed_content.content { + return tailwindcss_oxide::ChangedContent::Content( + contents, + changed_content.extension.into(), + ); } + + unreachable!() } } diff --git a/crates/oxide/Cargo.toml b/crates/oxide/Cargo.toml index 96d847b96e02..3964b93887bf 100644 --- a/crates/oxide/Cargo.toml +++ b/crates/oxide/Cargo.toml @@ -4,11 +4,11 @@ version = "0.1.0" edition = "2021" [dependencies] -bstr = "1.10.0" +bstr = "1.11.3" globwalk = "0.9.1" log = "0.4.22" rayon = "1.10.0" -fxhash = { package = "rustc-hash", version = "2.0.0" } +fxhash = { package = "rustc-hash", version = "2.1.1" } crossbeam = "0.8.4" tracing = { version = "0.1.40", features = [] } tracing-subscriber = { version = "0.3.18", features = ["env-filter"] } @@ -20,3 +20,4 @@ fast-glob = "0.4.3" [dev-dependencies] tempfile = "3.13.0" + diff --git a/crates/oxide/src/cursor.rs b/crates/oxide/src/cursor.rs index 0e5ad6479e61..ebda110a26ab 100644 --- a/crates/oxide/src/cursor.rs +++ b/crates/oxide/src/cursor.rs @@ -41,14 +41,34 @@ impl<'a> Cursor<'a> { cursor } - pub fn rewind_by(&mut self, amount: usize) { - self.move_to(self.pos.saturating_sub(amount)); - } - pub fn advance_by(&mut self, amount: usize) { self.move_to(self.pos.saturating_add(amount)); } + #[inline(always)] + pub fn advance(&mut self) { + self.pos += 1; + + self.prev = self.curr; + self.curr = self.next; + self.next = *self + .input + .get(self.pos.saturating_add(1)) + .unwrap_or(&0x00u8); + } + + #[inline(always)] + pub fn advance_twice(&mut self) { + self.pos += 2; + + self.prev = self.next; + self.curr = *self.input.get(self.pos).unwrap_or(&0x00u8); + self.next = *self + .input + .get(self.pos.saturating_add(1)) + .unwrap_or(&0x00u8); + } + pub fn move_to(&mut self, pos: usize) { let len = self.input.len(); let pos = pos.clamp(0, len); @@ -57,13 +77,9 @@ impl<'a> Cursor<'a> { self.at_start = pos == 0; self.at_end = pos + 1 >= len; - self.prev = if pos > 0 { self.input[pos - 1] } else { 0x00 }; - self.curr = if pos < len { self.input[pos] } else { 0x00 }; - self.next = if pos + 1 < len { - self.input[pos + 1] - } else { - 0x00 - }; + self.prev = *self.input.get(pos.wrapping_sub(1)).unwrap_or(&0x00u8); + self.curr = *self.input.get(pos).unwrap_or(&0x00u8); + self.next = *self.input.get(pos.saturating_add(1)).unwrap_or(&0x00u8); } } @@ -139,21 +155,5 @@ mod test { assert_eq!(cursor.prev, b'd'); assert_eq!(cursor.curr, 0x00); assert_eq!(cursor.next, 0x00); - - cursor.rewind_by(1); - assert_eq!(cursor.pos, 10); - assert!(!cursor.at_start); - assert!(cursor.at_end); - assert_eq!(cursor.prev, b'l'); - assert_eq!(cursor.curr, b'd'); - assert_eq!(cursor.next, 0x00); - - cursor.rewind_by(10); - assert_eq!(cursor.pos, 0); - assert!(cursor.at_start); - assert!(!cursor.at_end); - assert_eq!(cursor.prev, 0x00); - assert_eq!(cursor.curr, b'h'); - assert_eq!(cursor.next, b'e'); } } diff --git a/crates/oxide/src/extractor/arbitrary_property_machine.rs b/crates/oxide/src/extractor/arbitrary_property_machine.rs new file mode 100644 index 000000000000..4c8e7ef1eaca --- /dev/null +++ b/crates/oxide/src/extractor/arbitrary_property_machine.rs @@ -0,0 +1,427 @@ +use crate::cursor; +use crate::extractor::bracket_stack::BracketStack; +use crate::extractor::machine::{Machine, MachineState}; +use crate::extractor::string_machine::StringMachine; +use crate::extractor::CssVariableMachine; + +/// Extracts arbitrary properties from the input, including the brackets. +/// +/// E.g.: +/// +/// ```text +/// [color:red] +/// ^^^^^^^^^^^ +/// +/// [--my-color:red] +/// ^^^^^^^^^^^^^^^^ +/// ``` +#[derive(Debug, Default)] +pub struct ArbitraryPropertyMachine { + /// Start position of the arbitrary value + start_pos: usize, + + /// Track brackets to ensure they are balanced + bracket_stack: BracketStack, + + /// Current state of the machine + state: State, + + css_variable_machine: CssVariableMachine, + string_machine: StringMachine, +} + +#[derive(Debug, Default)] +enum State { + #[default] + Idle, + + /// Parsing the property, e.g.: + /// + /// ```text + /// [color:red] + /// ^^^^^ + /// + /// [--my-color:red] + /// ^^^^^^^^^^ + /// ``` + ParsingProperty, + + /// Parsing the value, e.g.: + /// + /// ```text + /// [color:red] + /// ^^^ + /// ``` + ParsingValue, +} + +impl Machine for ArbitraryPropertyMachine { + #[inline(always)] + fn reset(&mut self) { + self.start_pos = 0; + self.state = State::Idle; + self.bracket_stack.reset(); + } + + #[inline] + fn next(&mut self, cursor: &mut cursor::Cursor<'_>) -> MachineState { + let len = cursor.input.len(); + + match self.state { + State::Idle => match CLASS_TABLE[cursor.curr as usize] { + // Start of an arbitrary property + Class::OpenBracket => { + self.start_pos = cursor.pos; + self.state = State::ParsingProperty; + cursor.advance(); + self.next(cursor) + } + + // Anything else is not a valid start of an arbitrary value + _ => MachineState::Idle, + }, + + State::ParsingProperty => { + while cursor.pos < len { + match CLASS_TABLE[cursor.curr as usize] { + Class::Dash => match CLASS_TABLE[cursor.next as usize] { + // Start of a CSS variable + // + // E.g.: `[--my-color:red]` + // ^^ + Class::Dash => return self.parse_property_variable(cursor), + + // Dashes are allowed in the property name + // + // E.g.: `[background-color:red]` + // ^ + _ => cursor.advance(), + }, + + // Alpha characters are allowed in the property name + // + // E.g.: `[color:red]` + // ^^^^^ + Class::Alpha => cursor.advance(), + + // End of the property name, but there must be at least a single character + Class::Colon if cursor.pos > self.start_pos + 1 => { + self.state = State::ParsingValue; + cursor.advance(); + return self.next(cursor); + } + + // Anything else is not a valid property character + _ => return self.restart(), + } + } + + self.restart() + } + + State::ParsingValue => { + while cursor.pos < len { + match CLASS_TABLE[cursor.curr as usize] { + Class::Escape => match CLASS_TABLE[cursor.next as usize] { + // An escaped whitespace character is not allowed + // + // E.g.: `[color:var(--my-\ color)]` + // ^ + Class::Whitespace => return self.restart(), + + // An escaped character, skip the next character, resume after + // + // E.g.: `[color:var(--my-\#color)]` + // ^ + _ => cursor.advance_twice(), + }, + + Class::OpenParen | Class::OpenBracket | Class::OpenCurly => { + if !self.bracket_stack.push(cursor.curr) { + return self.restart(); + } + cursor.advance(); + } + + Class::CloseParen | Class::CloseBracket | Class::CloseCurly + if !self.bracket_stack.is_empty() => + { + if !self.bracket_stack.pop(cursor.curr) { + return self.restart(); + } + cursor.advance(); + } + + // End of an arbitrary value + // + // 1. All brackets must be balanced + // 2. There must be at least a single character inside the brackets + Class::CloseBracket + if self.start_pos + 1 != cursor.pos + && self.bracket_stack.is_empty() => + { + return self.done(self.start_pos, cursor) + } + + // Start of a string + Class::Quote => return self.parse_string(cursor), + + // Another `:` inside of an arbitrary property is only valid inside of a string or + // inside of brackets. Everywhere else, it's invalid. + // + // E.g.: `[color:red:blue]` + // ^ Not valid + // E.g.: `[background:url(https://example.com)]` + // ^ Valid + // E.g.: `[content:'a:b:c:']` + // ^ ^ ^ Valid + Class::Colon if self.bracket_stack.is_empty() => return self.restart(), + + // Any kind of whitespace is not allowed + Class::Whitespace => return self.restart(), + + // Everything else is valid + _ => cursor.advance(), + }; + } + + self.restart() + } + } + } +} + +impl ArbitraryPropertyMachine { + fn parse_property_variable(&mut self, cursor: &mut cursor::Cursor<'_>) -> MachineState { + match self.css_variable_machine.next(cursor) { + MachineState::Idle => self.restart(), + MachineState::Done(_) => match CLASS_TABLE[cursor.next as usize] { + // End of the CSS variable, must be followed by a `:` + // + // E.g.: `[--my-color:red]` + // ^ + Class::Colon => { + self.state = State::ParsingValue; + cursor.advance_twice(); + self.next(cursor) + } + + // Invalid arbitrary property + _ => self.restart(), + }, + } + } + + fn parse_string(&mut self, cursor: &mut cursor::Cursor<'_>) -> MachineState { + match self.string_machine.next(cursor) { + MachineState::Idle => self.restart(), + MachineState::Done(_) => { + cursor.advance(); + self.next(cursor) + } + } + } +} + +#[derive(Clone, Copy)] +enum Class { + /// `(` + OpenParen, + + /// `[` + OpenBracket, + + /// `{` + OpenCurly, + + /// `)` + CloseParen, + + /// `]` + CloseBracket, + + /// `}` + CloseCurly, + + /// `\` + Escape, + + /// ', ", or ` + Quote, + + /// `-` + Dash, + + /// `a`..`z` or `A`..`Z` + Alpha, + + /// `:` + Colon, + + /// Whitespace characters + Whitespace, + + /// End of the input + End, + + Other, +} + +const CLASS_TABLE: [Class; 256] = { + let mut table = [Class::Other; 256]; + + macro_rules! set { + ($class:expr, $($byte:expr),+ $(,)?) => { + $(table[$byte as usize] = $class;)+ + }; + } + + macro_rules! set_range { + ($class:expr, $start:literal ..= $end:literal) => { + let mut i = $start; + while i <= $end { + table[i as usize] = $class; + i += 1; + } + }; + } + + set!(Class::OpenParen, b'('); + set!(Class::OpenBracket, b'['); + set!(Class::OpenCurly, b'{'); + + set!(Class::CloseParen, b')'); + set!(Class::CloseBracket, b']'); + set!(Class::CloseCurly, b'}'); + + set!(Class::Escape, b'\\'); + + set!(Class::Quote, b'"', b'\'', b'`'); + + set!(Class::Dash, b'-'); + + set_range!(Class::Alpha, b'a'..=b'z'); + set_range!(Class::Alpha, b'A'..=b'Z'); + + set!(Class::Colon, b':'); + set!(Class::End, b'\0'); + + set!(Class::Whitespace, b' ', b'\t', b'\n', b'\r', b'\x0C'); + + table +}; + +#[cfg(test)] +mod tests { + use super::ArbitraryPropertyMachine; + use crate::extractor::machine::Machine; + + #[test] + #[ignore] + fn test_arbitrary_property_machine_performance() { + let input = r#"