diff --git a/' b/'
new file mode 100644
index 0000000000000..53a6359f76054
--- /dev/null
+++ b/'
@@ -0,0 +1,46 @@
+use phf::phf_set;
+
+const SYNTAX_CHARACTERS: phf::Set<char> = phf_set!['(', ')', '[', ']', '{', '}', '|', '-'];
+
+const CLASS_SET_RESERVED_DOUBLE_PUNCTUATOR_CHARACTER: phf::Set<char> = phf_set! {
+    '&' => AMPERSAND,
+    '!' => EXCLAMATION_MARK,
+    '#' => NUMBER_SIGN,
+    '$' => DOLLAR_SIGN,
+    '%' => PERCENT_SIGN,
+    '*' => ASTERISK,
+    '+' => PLUS_SIGN,
+    ',' => COMMA,
+    '.' => FULL_STOP,
+    ':' => COLON,
+    ';' => SEMICOLON,
+    '<' => LESS_THAN_SIGN,
+    '=' => EQUALS_SIGN,
+    '>' => GREATER_THAN_SIGN,
+    '?' => QUESTION_MARK,
+    '@' => COMMERCIAL_AT,
+    '^' => CIRCUMFLEX_ACCENT,
+    '`' => GRAVE_ACCENT,
+    '~' => TILDE,
+};
+
+#[inline]
+pub fn is_syntax_character(cp: char) -> bool {
+    SYNTAX_CHARACTERS.contains(&cp)
+}
+
+pub fn is_lead_surrogate(code: u32) -> bool {
+    code >= 0xd800 && code <= 0xdbff
+}
+
+pub fn is_trail_surrogate(code: u32) -> bool {
+    code >= 0xdc00 && code <= 0xdfff
+}
+
+pub fn combine_surrogate_pair(lead: u32, trail: u32) -> u32 {
+    (lead - 0xd800) * 0x400 + (trail - 0xdc00) + 0x10000
+}
+
+pub fn is_class_set_reserved_double_punctuator_character(cp: char) -> bool {
+    CLASS_SET_RESERVED_DOUBLE_PUNCTUATOR_CHARACTER.contains(&cp)
+}
diff --git a/Cargo.lock b/Cargo.lock
index 3b11ab893b40c..1d13b2a27b61d 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -1600,7 +1600,10 @@ name = "oxc_js_regex"
 version = "0.0.0"
 dependencies = [
  "oxc_allocator",
+ "oxc_diagnostics",
  "oxc_span",
+ "oxc_syntax",
+ "phf",
 ]
 
 [[package]]
diff --git a/crates/oxc_js_regex/Cargo.toml b/crates/oxc_js_regex/Cargo.toml
index 38dcac20c5f06..e473738bc7bbe 100644
--- a/crates/oxc_js_regex/Cargo.toml
+++ b/crates/oxc_js_regex/Cargo.toml
@@ -19,5 +19,8 @@ workspace = true
 doctest = false
 
 [dependencies]
-oxc_allocator = { workspace = true }
-oxc_span      = { workspace = true }
+phf             = { workspace = true }
+oxc_allocator   = { workspace = true }
+oxc_span        = { workspace = true }
+oxc_diagnostics = { workspace = true }
+oxc_syntax.workspace = true
diff --git a/crates/oxc_js_regex/src/ast.rs b/crates/oxc_js_regex/src/ast.rs
index 6690c5f7386fc..f4e5900b8da32 100644
--- a/crates/oxc_js_regex/src/ast.rs
+++ b/crates/oxc_js_regex/src/ast.rs
@@ -3,6 +3,8 @@
 use oxc_allocator::{Box, Vec};
 use oxc_span::{Atom, Span};
 
+use crate::ast_kind::AstKind;
+
 /// The type which includes all nodes.
 #[derive(Debug)]
 pub enum Node<'a> {
@@ -42,46 +44,46 @@ pub enum Leaf<'a> {
 /// The type which includes all atom nodes.
 #[derive(Debug)]
 pub enum Element<'a> {
-    Assertion(Box<'a, Assertion<'a>>),
-    QuantifiableElement(Box<'a, QuantifiableElement<'a>>),
+    Assertion(Assertion<'a>),
+    QuantifiableElement(QuantifiableElement<'a>),
     Quantifier(Box<'a, Quantifier<'a>>),
 }
 
 /// The type which includes all atom nodes that Quantifier node can have as children.
 #[derive(Debug)]
 pub enum QuantifiableElement<'a> {
-    Backreference(Box<'a, Backreference<'a>>),
-    CapturingGroup(Box<'a, CapturingGroup<'a>>),
-    Character(Box<'a, Character>),
-    CharacterClass(Box<'a, CharacterClass<'a>>),
-    CharacterSet(Box<'a, CharacterSet<'a>>),
-    ExpressionCharacterClass(Box<'a, ExpressionCharacterClass<'a>>),
-    Group(Box<'a, Group<'a>>),
-    LookaheadAssertion(Box<'a, LookaheadAssertion<'a>>),
+    Backreference(Backreference<'a>),
+    CapturingGroup(CapturingGroup<'a>),
+    Character(Character),
+    CharacterClass(CharacterClass<'a>),
+    CharacterSet(CharacterSet<'a>),
+    ExpressionCharacterClass(ExpressionCharacterClass<'a>),
+    Group(Group<'a>),
+    LookaheadAssertion(LookaheadAssertion<'a>),
 }
 
 /// The type which includes all character class atom nodes.
 #[derive(Debug)]
 pub enum CharacterClassElement<'a> {
-    ClassRangesCharacterClassElement(Box<'a, ClassRangesCharacterClassElement<'a>>),
-    UnicodeSetsCharacterClassElement(Box<'a, UnicodeSetsCharacterClassElement<'a>>),
+    ClassRangesCharacterClassElement(ClassRangesCharacterClassElement),
+    UnicodeSetsCharacterClassElement(UnicodeSetsCharacterClassElement<'a>),
 }
 #[derive(Debug)]
-pub enum ClassRangesCharacterClassElement<'a> {
-    Character(Box<'a, Character>),
-    CharacterClassRange(Box<'a, CharacterClassRange>),
-    CharacterUnicodePropertyCharacterSet(Box<'a, CharacterUnicodePropertyCharacterSet>),
-    EscapeCharacterSet(Box<'a, EscapeCharacterSet>),
+pub enum ClassRangesCharacterClassElement {
+    Character(Character),
+    CharacterClassRange(CharacterClassRange),
+    CharacterUnicodePropertyCharacterSet(CharacterUnicodePropertyCharacterSet),
+    EscapeCharacterSet(EscapeCharacterSet),
 }
 #[derive(Debug)]
 pub enum UnicodeSetsCharacterClassElement<'a> {
-    Character(Box<'a, Character>),
-    CharacterClassRange(Box<'a, CharacterClassRange>),
-    ClassStringDisjunction(Box<'a, ClassStringDisjunction<'a>>),
-    EscapeCharacterSet(Box<'a, EscapeCharacterSet>),
-    ExpressionCharacterClass(Box<'a, ExpressionCharacterClass<'a>>),
-    UnicodePropertyCharacterSet(Box<'a, UnicodePropertyCharacterSet<'a>>),
-    UnicodeSetsCharacterClass(Box<'a, UnicodeSetsCharacterClass<'a>>),
+    Character(Character),
+    CharacterClassRange(CharacterClassRange),
+    ClassStringDisjunction(ClassStringDisjunction<'a>),
+    EscapeCharacterSet(EscapeCharacterSet),
+    ExpressionCharacterClass(ExpressionCharacterClass<'a>),
+    UnicodePropertyCharacterSet(UnicodePropertyCharacterSet<'a>),
+    UnicodeSetsCharacterClass(UnicodeSetsCharacterClass<'a>),
 }
 
 /// The root node.
@@ -117,7 +119,7 @@ pub struct Group<'a> {
 
 /// The capturing group.
 /// E.g. `(ab)`, `(?<name>ab)`
-#[derive(Debug)]
+#[derive(Debug, Default)]
 pub struct CapturingGroup<'a> {
     pub span: Span,
     pub name: Option<Atom>,
@@ -155,8 +157,10 @@ pub struct LookbehindAssertion<'a> {
 #[derive(Debug)]
 pub struct Quantifier<'a> {
     pub span: Span,
-    pub min: f64,
-    pub max: f64, // can be f64::INFINITY
+    /// https://github.com/eslint-community/regexpp/blob/2e8f1af992fb12eae46a446253e8fa3f6cede92a/src/validator.ts#L384-L398
+    /// both `min` and `max` are integer
+    pub min: usize,
+    pub max: usize,
     pub greedy: bool,
     pub element: QuantifiableElement<'a>,
 }
@@ -176,7 +180,7 @@ pub enum CharacterClass<'a> {
 pub struct ClassRangesCharacterClass<'a> {
     pub span: Span,
     pub unicode_sets: bool,
-    pub elements: Vec<'a, ClassRangesCharacterClassElement<'a>>,
+    pub elements: Vec<'a, ClassRangesCharacterClassElement>,
 }
 
 /// The character class used in Unicode sets mode (`v` flag).
@@ -354,7 +358,7 @@ pub struct StringAlternative<'a> {
 #[derive(Debug)]
 pub struct Character {
     pub span: Span,
-    pub value: u16, // UTF-16 code point
+    pub value: char, // UTF-16 code point
 }
 
 #[derive(Debug)]
diff --git a/crates/oxc_js_regex/src/ast_builder.rs b/crates/oxc_js_regex/src/ast_builder.rs
new file mode 100644
index 0000000000000..c94434cdf8a06
--- /dev/null
+++ b/crates/oxc_js_regex/src/ast_builder.rs
@@ -0,0 +1,73 @@
+use oxc_allocator::{Allocator, Box, String, Vec};
+use oxc_span::{Atom, GetSpan, SourceType, Span};
+
+#[allow(clippy::wildcard_imports)]
+use crate::ast::*;
+
+/// AST builder for creating AST nodes
+pub struct AstBuilder<'a> {
+    pub allocator: &'a Allocator,
+}
+
+impl<'a> AstBuilder<'a> {
+    pub fn new(allocator: &'a Allocator) -> Self {
+        Self { allocator }
+    }
+
+    #[inline]
+    pub fn alloc<T>(&self, value: T) -> Box<'a, T> {
+        Box(self.allocator.alloc(value))
+    }
+
+    #[inline]
+    pub fn new_vec<T>(&self) -> Vec<'a, T> {
+        Vec::new_in(self.allocator)
+    }
+
+    #[inline]
+    pub fn new_vec_with_capacity<T>(&self, capacity: usize) -> Vec<'a, T> {
+        Vec::with_capacity_in(capacity, self.allocator)
+    }
+
+    #[inline]
+    pub fn new_vec_single<T>(&self, value: T) -> Vec<'a, T> {
+        let mut vec = self.new_vec_with_capacity(1);
+        vec.push(value);
+        vec
+    }
+
+    #[inline]
+    pub fn new_str(&self, value: &str) -> &'a str {
+        String::from_str_in(value, self.allocator).into_bump_str()
+    }
+
+    pub fn copy<T>(&self, src: &T) -> T {
+        // SAFETY:
+        // This should be safe as long as `src` is an reference from the allocator.
+        // But honestly, I'm not really sure if this is safe.
+        unsafe { std::mem::transmute_copy(src) }
+    }
+
+    pub fn alternative(&mut self, span: Span, elements: Vec<'a, Element<'a>>) -> Branch<'a> {
+        Branch::Alternative(self.alloc(Alternative { span, elements }))
+    }
+
+    pub fn capturing_group(
+        &mut self,
+        span: Span,
+        name: Option<Atom>,
+        alternatives: Vec<'a, Alternative<'a>>,
+        references: Vec<'a, Backreference<'a>>,
+    ) -> Branch<'a> {
+        Branch::CapturingGroup(self.alloc(CapturingGroup { span, name, alternatives, references }))
+    }
+
+    pub fn reg_exp_literal(
+        &mut self,
+        span: Span,
+        flags: Flags,
+        pattern: Pattern<'a>,
+    ) -> RegExpLiteral<'a> {
+        RegExpLiteral { span, pattern, flags }
+    }
+}
diff --git a/crates/oxc_js_regex/src/ast_kind.rs b/crates/oxc_js_regex/src/ast_kind.rs
new file mode 100644
index 0000000000000..97eb10619a408
--- /dev/null
+++ b/crates/oxc_js_regex/src/ast_kind.rs
@@ -0,0 +1,25 @@
+use super::ast::*;
+
+#[allow(unused)]
+#[derive(Debug)]
+pub enum AstKind<'a> {
+    Alternative(&'a Alternative<'a>),
+    CapturingGroup(&'a CapturingGroup<'a>),
+    CharacterClass(&'a CharacterClass<'a>),
+    CharacterClassRange(&'a CharacterClassRange),
+    ClassIntersection(&'a ClassIntersection<'a>),
+    ClassStringDisjunction(&'a ClassStringDisjunction<'a>),
+    ClassSubtraction(&'a ClassSubtraction<'a>),
+    ExpressionCharacterClass(&'a ExpressionCharacterClass<'a>),
+    Group(&'a Group<'a>),
+    LookaroundAssertion(&'a LookaroundAssertion<'a>),
+    Pattern(&'a Pattern<'a>),
+    Quantifier(&'a Quantifier<'a>),
+    RegExpLiteral(&'a RegExpLiteral<'a>),
+    StringAlternative(&'a StringAlternative<'a>),
+    Backreference(&'a Backreference<'a>),
+    BoundaryAssertion(&'a BoundaryAssertion<'a>),
+    Character(&'a Character),
+    CharacterSet(&'a CharacterSet<'a>),
+    Flags(&'a Flags),
+}
diff --git a/crates/oxc_js_regex/src/ecma_version.rs b/crates/oxc_js_regex/src/ecma_version.rs
new file mode 100644
index 0000000000000..f71e61cd125d7
--- /dev/null
+++ b/crates/oxc_js_regex/src/ecma_version.rs
@@ -0,0 +1,22 @@
+#[allow(unused)]
+#[derive(Clone, Copy, PartialEq, PartialOrd, Default)]
+pub enum EcmaVersion {
+    #[default]
+    V5,
+    V2015,
+    V2016,
+    V2017,
+    V2018,
+    V2019,
+    V2020,
+    V2021,
+    V2022,
+    V2023,
+    V2024,
+}
+#[allow(unused)]
+impl EcmaVersion {
+    pub fn latest_ecma_version() -> Self {
+        Self::V2024
+    }
+}
diff --git a/crates/oxc_js_regex/src/lib.rs b/crates/oxc_js_regex/src/lib.rs
index 6647fb03be8f5..5062aac9f87e6 100644
--- a/crates/oxc_js_regex/src/lib.rs
+++ b/crates/oxc_js_regex/src/lib.rs
@@ -1,5 +1,9 @@
 pub mod ast;
+mod ast_builder;
+mod ast_kind;
+mod ecma_version;
 mod lexer;
 pub mod parser;
+mod util;
 pub mod validator;
 pub mod visitor;
diff --git a/crates/oxc_js_regex/src/parser.rs b/crates/oxc_js_regex/src/parser.rs
index 8b137891791fe..bca2c289ec990 100644
--- a/crates/oxc_js_regex/src/parser.rs
+++ b/crates/oxc_js_regex/src/parser.rs
@@ -1 +1,1604 @@
+use std::collections::{HashSet, VecDeque};
+use std::iter::Peekable;
+use std::ops::Range;
+use std::os::unix::fs::OpenOptionsExt;
+use std::panic;
+use std::str::{CharIndices, Chars, Matches};
 
+use oxc_diagnostics::Error;
+use oxc_span::Span;
+use oxc_syntax::identifier::is_identifier_part;
+use oxc_syntax::unicode_id_start::is_id_continue;
+
+use crate::ast::{
+    Alternative, Assertion, Backreference, BackreferenceRef, BoundaryAssertion, Branch,
+    CapturingGroup, Character, CharacterClass, ClassStringDisjunction, EdgeAssertion,
+    EdgeAssertionKind, Element, LookaheadAssertion, LookaroundAssertion, LookbehindAssertion,
+    Pattern, QuantifiableElement, Quantifier, RegExpLiteral, StringAlternative,
+    WordBoundaryAssertion,
+};
+use crate::ast_builder::AstBuilder;
+use crate::ecma_version::EcmaVersion;
+use crate::util::{
+    combine_surrogate_pair, is_class_set_reserved_double_punctuator_character,
+    is_class_set_reserved_punctuator, is_class_set_syntax_character, is_lead_surrogate,
+    is_syntax_character, is_trail_surrogate,
+};
+
+pub struct Lexer<'a> {
+    source: &'a str,
+    /// Regex usually, use a collected `Vec` could reduce lookahead and other util function implementation complexity
+    chars: Vec<char>,
+
+    pub(crate) errors: Vec<Error>,
+}
+
+#[allow(clippy::unused_self)]
+impl<'a> Lexer<'a> {
+    pub fn new(source: &'a str) -> Self {
+        Self { source, errors: vec![], chars: source.chars().collect::<Vec<_>>() }
+    }
+}
+
+pub struct Parser<'a> {
+    lexer: Lexer<'a>,
+    builder: AstBuilder<'a>,
+
+    /// Source Code
+    source_text: &'a str,
+
+    /// All syntax errors from parser and lexer
+    /// Note: favor adding to `Diagnostics` instead of raising Err
+    errors: Vec<Error>,
+    context: ParserContext,
+    index: usize,
+    group_names: HashSet<String>,
+    num_capturing_parens: usize,
+    last_int_value: u32,
+    back_reference_names: HashSet<String>,
+    last_assertion_is_quantifiable: bool,
+    last_range: Range<usize>,
+    last_str_value: Stirng,
+}
+
+#[derive(Default, Copy, Clone)]
+struct ParserContext {
+    source_kind: SourceKind,
+    unicode_mode: bool,
+    nflag: bool,
+    unicode_sets_mode: bool,
+    ecma_version: EcmaVersion,
+    strict: bool,
+}
+
+impl<'a> Parser<'a> {
+    /// Create a new parser
+    pub fn new(allocator: &'a oxc_allocator::Allocator, source_text: &'a str) -> Self {
+        Self {
+            lexer: Lexer::new(source_text),
+            source_text,
+            errors: vec![],
+            context: ParserContext::default(),
+            index: 0,
+            group_names: HashSet::new(),
+            num_capturing_parens: 0,
+            back_reference_names: HashSet::new(),
+            last_int_value: 0,
+            last_range: 0..0,
+            last_assertion_is_quantifiable: false,
+            builder: AstBuilder::new(allocator),
+            last_str_value: String::default(),
+        }
+    }
+
+    pub fn is(&self, ch: char) -> bool {
+        self.lexer.chars.get(self.index) == Some(&ch)
+    }
+
+    pub fn eat(&mut self, ch: char) -> bool {
+        if self.is(ch) {
+            self.index += 1;
+            true
+        } else {
+            false
+        }
+    }
+    pub fn span_with_start(&self, start: u32) -> Span {
+        Span::new(start, self.index as u32)
+    }
+
+    pub fn eat2(&mut self, first: char, second: char) -> bool {
+        if self.is(first) && self.nth(1) == Some(&second) {
+            self.index += 2;
+            true
+        } else {
+            false
+        }
+    }
+
+    pub fn eof(&self) -> bool {
+        self.index < self.lexer.chars.len()
+    }
+
+    pub fn nth(&self, n: usize) -> Option<&char> {
+        self.lexer.chars.get(self.index + n)
+    }
+
+    /// by default next means `nth(1)`
+    pub fn next(&self) -> Option<&char> {
+        self.lexer.chars.get(self.index + 1).copied()
+    }
+
+    /// get a range chars relative from current cursor
+    pub fn nrange(&self, range: Range<usize>) -> Option<&[char]> {
+        self.lexer.chars.get(self.index + range.start..(self.index + range.end))
+    }
+
+    pub fn current(&self) -> Option<char> {
+        self.lexer.chars.get(self.index).copied()
+    }
+
+    pub fn advance(&mut self) -> bool {
+        if self.index < self.lexer.chars.len() {
+            self.index += 1;
+            return true;
+        } else {
+            false
+        }
+    }
+
+    pub fn rewind<'a>(&mut self, start: usize) {
+        self.index = start;
+    }
+
+    fn eat3(&self, first: char, second: char, third: char) -> bool {
+        if self.is(first) && self.nth(1) == Some(&second) && self.nth(2) == Some(&third) {
+            self.index += 3;
+            true
+        } else {
+            false
+        }
+    }
+}
+
+#[derive(Default, Clone, Copy)]
+pub enum SourceKind {
+    Flags,
+    #[default]
+    Literal,
+    Pattern,
+}
+
+pub fn parse_literal<'a>(parser: &mut Parser<'a>) -> RegExpLiteral<'a> {
+    if parser.is('/') {
+        parser.advance();
+        let pattern = parse_pattern(parser);
+        todo!()
+    } else if parser.source_text.is_empty() {
+        panic!("Empty")
+    } else {
+        match parser.current() {
+            Some(ch) => {
+                panic!("unexpected character {ch}")
+            }
+            None => {
+                panic!("unexpected eof")
+            }
+        };
+    }
+}
+
+fn parse_pattern<'a>(parser: &mut Parser<'a>) -> Pattern<'a> {
+    let start = parser.index;
+    if let Some(pattern) = parse_pattern_internal(parser) {
+        return pattern;
+    } else if !parser.context.nflag
+        && parser.context.ecma_version >= EcmaVersion::V2018
+        && parser.group_names.len() > 0
+    {
+        parser.rewind(start);
+        parser.context.nflag = true;
+        return parse_pattern_internal(parser).expect("should have pattern");
+    }
+    panic!("Invalid pattern")
+}
+
+fn parse_pattern_internal<'a>(parser: &mut Parser<'a>) -> Option<Pattern<'a>> {
+    let start = parser.index;
+    parser.num_capturing_parens = count_capturing_parens(parser);
+    parser.group_names.clear();
+    parser.back_reference_names.clear();
+    todo!()
+}
+
+fn parse_disjunction<'a>(parser: &mut Parser<'a>) -> oxc_allocator::Vec<'a, Alternative<'a>> {
+    let start = parser.index;
+    let mut alternatives = parser.builder.new_vec();
+    loop {
+        alternatives.push(parse_alternative(parser));
+        if !parser.eat('|') {
+            break;
+        }
+    }
+    // Only consume the ast when `no_consume` is false
+    if parse_quantifier(parser, Some(true)).0 {
+        panic!("Nothing to repeat");
+    }
+    if parser.eat('{') {
+        panic!("Lone quantifier brackets")
+    }
+    alternatives
+}
+
+/// Validate the next characters as a RegExp `Alternative` production.
+/// ```
+///  Alternative[UnicodeMode, UnicodeSetsMode, N]::
+///      [empty]
+///  Alternative[?UnicodeMode, ?UnicodeSetsMode, ?N] Term[?UnicodeMode, ?UnicodeSetsMode, ?N]
+/// ```
+fn parse_alternative<'a>(parser: &mut Parser<'a>) -> Alternative<'a> {
+    let start = parser.index;
+    let mut elements = parser.builder.new_vec();
+    while !parser.eof() {
+        let (flag, node) = parse_term(parser);
+        if let Some(node) = node {
+            elements.push(node);
+        }
+        if !flag {
+            break;
+        }
+    }
+    Alternative { span: Span::new(start as u32, parser.index as u32), elements }
+}
+
+fn parse_term<'a>(parser: &mut Parser<'a>) -> (bool, Option<Element<'a>>) {
+    if parser.context.unicode_mode || parser.context.strict {}
+    todo!()
+}
+
+fn parse_optional_quantifier<'a>(parser: &mut Parser<'a>) -> (bool, Option<Element<'a>>) {
+    let (_, node) = parse_quantifier(parser, None);
+    (true, node)
+}
+
+fn parse_assertion<'a>(parser: &mut Parser<'a>) -> (bool, Option<Assertion<'a>>) {
+    let start = parser.index;
+    parser.last_assertion_is_quantifiable = false;
+
+    if parser.eat('^') {
+        return (
+            true,
+            Some(Assertion::BoundaryAssertion(parser.builder.alloc(
+                BoundaryAssertion::EdgeAssertion(parser.builder.alloc(EdgeAssertion {
+                    span: Span::new(start as u32, parser.index as u32),
+                    kind: EdgeAssertionKind::Start,
+                })),
+            ))),
+        );
+    }
+
+    if parser.eat('$') {
+        return (
+            true,
+            Some(Assertion::BoundaryAssertion(parser.builder.alloc(
+                BoundaryAssertion::EdgeAssertion(parser.builder.alloc(EdgeAssertion {
+                    span: Span::new(start as u32, parser.index as u32),
+                    kind: EdgeAssertionKind::End,
+                })),
+            ))),
+        );
+    }
+
+    if parser.eat2('\\', 'B') {
+        return (
+            true,
+            Some(Assertion::BoundaryAssertion(parser.builder.alloc(
+                BoundaryAssertion::WordBoundaryAssertion(parser.builder.alloc(
+                    WordBoundaryAssertion {
+                        span: Span::new(start as u32, parser.index as u32),
+                        negate: true,
+                    },
+                )),
+            ))),
+        );
+    }
+
+    if parser.eat2('\\', 'b') {
+        return (
+            true,
+            Some(Assertion::BoundaryAssertion(parser.builder.alloc(
+                BoundaryAssertion::WordBoundaryAssertion(parser.builder.alloc(
+                    WordBoundaryAssertion {
+                        span: Span::new(start as u32, parser.index as u32),
+                        negate: false,
+                    },
+                )),
+            ))),
+        );
+    }
+
+    // Lookahead / Lookbehind
+    if parser.eat2('(', '?') {
+        let lookbeind = parser.context.ecma_version >= EcmaVersion::V2018 && parser.eat('<');
+        let mut eq_sign = parser.eat('=');
+        let mut negate = if eq_sign { false } else { parser.eat('!') };
+        if eq_sign || negate {
+            let span = Span::new(start as u32, parser.index as u32);
+            let alternatives = parse_disjunction(parser);
+            let look_around_assertion =
+                if lookbeind {
+                    LookaroundAssertion::LookbehindAssertion(
+                        parser.builder.alloc(LookbehindAssertion { span, negate, alternatives }),
+                    )
+                } else {
+                    LookaroundAssertion::LookaheadAssertion(
+                        parser.builder.alloc(LookaheadAssertion { span, negate, alternatives }),
+                    )
+                };
+            let node = Assertion::LookaroundAssertion(parser.builder.alloc(look_around_assertion));
+            if !parser.eat(')') {
+                panic!("Unterminated group")
+            }
+            parser.last_assertion_is_quantifiable = !lookbeind && !parser.context.strict;
+        }
+        parser.rewind(start);
+    }
+    (false, None)
+}
+
+/// Validate the next characters as a RegExp `Quantifier` production if possible.
+/// ```
+///  Quantifier::
+///        QuantifierPrefix
+///        QuantifierPrefix `?`
+///   QuantifierPrefix::
+///        `*`
+///        `+`
+///        `?`
+///        `{` DecimalDigits `}`
+///        `{` DecimalDigits `,}`
+///        `{` DecimalDigits `,` DecimalDigits `}`
+///   ```
+/// returns `true` if it consumed the next characters successfully.
+fn parse_quantifier<'a>(
+    parser: &mut Parser<'a>,
+    no_consume: Option<bool>,
+) -> (bool, Option<Element<'a>>) {
+    let mut no_consume = no_consume.unwrap_or_default();
+    let start = parser.index;
+    let mut min = 0;
+    let mut max = 0;
+    let mut greedy = false;
+    let mut element = None;
+    match parser.current().cloned() {
+        Some('*') => {
+            min = 0;
+            max = usize::MAX;
+            parser.advance();
+        }
+        Some('+') => {
+            min = 1;
+            max = usize::MAX;
+            parser.advance();
+        }
+        Some('?') => {
+            min = 0;
+            max = 1;
+            parser.advance();
+        }
+        Some(_) => {
+            if parse_braced_quantifier(parser, no_consume) {
+                min = parser.last_range.start;
+                max = parser.last_range.end;
+            }
+        }
+        None => return (false, None),
+    }
+    greedy = !parser.eat('?');
+
+    if !no_consume {
+        let quantifier = parser.builder.alloc(Quantifier {
+            span: Span { start: start as u32, end: parser.index as u32 },
+            min,
+            max,
+            greedy,
+            // https://github.com/eslint-community/regexpp/blob/2e8f1af992fb12eae46a446253e8fa3f6cede92a/src/parser.ts#L269-L275
+            // it can't be null, or the program will panic, so we put a dummy element, and parent
+            // should replace it
+            element: QuantifiableElement::Character(Character {
+                span: Span::default(),
+                value: ' ',
+            }),
+        });
+
+        element = Some(Element::Quantifier(quantifier))
+    }
+    (true, element)
+}
+
+fn parse_braced_quantifier<'a>(parser: &mut Parser<'a>, no_error: bool) -> bool {
+    let start = parser.index;
+    if eat_decimal_digits(parser) {
+        let min = parser.last_int_value;
+        let mut max = min;
+        if parser.eat(',') {
+            max = if eat_decimal_digits(parser) { parser.last_int_value } else { usize::MAX };
+        }
+        if parser.eat('}') {
+            if !no_error && max < min {
+                panic!("numbers out of order in {{}} quantifier");
+            }
+            parser.last_range = min..max;
+            return true;
+        }
+    }
+    if !no_error && (parser.context.unicode_mode || parser.context.strict) {
+        panic!("Incomplete quantifier");
+    }
+    parser.rewind(start);
+    false
+}
+
+fn parse_atom<'a>(parser: &mut Parser<'a>) {
+    todo!()
+}
+
+fn parse_dot<'a>(parser: &mut Parser<'a>) -> (bool, Option<Character>) {
+    let start = parser.index;
+    if parser.eat('.') {
+        (true, Some(Character { span: Span::new(start as u32, parser.index as u32), value: '.' }))
+    } else {
+        (false, None)
+    }
+}
+
+fn parse_reverse_solidus_atom_escape<'a>(parser: &mut Parser<'a>) -> bool {
+    let start = parser.index;
+    if parser.eat('\\') {
+        if parse_atom_escape(parser) {
+            return true;
+        }
+        parser.rewind(start);
+    }
+    false
+}
+
+fn parse_atom_escape<'a>(parser: &mut Parser<'a>) -> bool {
+    if parse_backreference(parser)
+        || parser.consume_character_class_escape()
+        || parser.consume_character_escape()
+        || (parser.context.nflag && parser.consume_k_group_name())
+    {
+        true
+    } else {
+        if parser.strict || parser._unicode_mode {
+            parser.raise("Invalid escape");
+        }
+        false
+    }
+}
+
+/// TODO: resolve when pattern leave
+fn parse_backreference<'a>(parser: &mut Parser<'a>) -> Option<Backreference<'a>> {
+    let start = parser.index;
+    if parser.eat_decimal_escape() {
+        let n = parser.last_int_value;
+        if n <= parser.num_capturing_parens {
+            Some(Backreference {
+                span: Span::new(start as u32, parser.index as u32),
+                reference: BackreferenceRef::Number(n as usize),
+                resolved: CapturingGroup::default(),
+            })
+        } else {
+            if parser.context.strict || parser.context.unicode_mode {
+                panic!("Invalid escape");
+            }
+            parser.rewind(start);
+            None
+        }
+    } else {
+        None
+    }
+}
+
+struct UnicodeSetsConsumeResult {
+    may_contain_strings: Option<bool>,
+}
+
+fn consume_character_class_escape<'a>(parser: &mut Parser<'a>) -> Option<UnicodeSetsConsumeResult> {
+    let start = parser.index;
+
+    if parser.eat(LATIN_SMALL_LETTER_D) {
+        parser.last_int_value = -1;
+        parser.on_escape_character_set(start - 1, parser.index, "digit", false);
+        return Some(UnicodeSetsConsumeResult { may_contain_strings: None });
+    }
+
+    if parser.eat(LATIN_CAPITAL_LETTER_D) {
+        parser.last_int_value = -1;
+        parser.on_escape_character_set(start - 1, parser.index, "digit", true);
+        return Some(UnicodeSetsConsumeResult { may_contain_strings: None });
+    }
+
+    if parser.eat(LATIN_SMALL_LETTER_S) {
+        parser.last_int_value = -1;
+        parser.on_escape_character_set(start - 1, parser.index, "space", false);
+        return Some(UnicodeSetsConsumeResult { may_contain_strings: None });
+    }
+
+    if parser.eat(LATIN_CAPITAL_LETTER_S) {
+        parser.last_int_value = -1;
+        parser.on_escape_character_set(start - 1, parser.index, "space", true);
+        return Some(UnicodeSetsConsumeResult { may_contain_strings: None });
+    }
+
+    if parser.eat(LATIN_SMALL_LETTER_W) {
+        parser.last_int_value = -1;
+        parser.on_escape_character_set(start - 1, parser.index, "word", false);
+        return Some(UnicodeSetsConsumeResult { may_contain_strings: None });
+    }
+
+    if parser.eat(LATIN_CAPITAL_LETTER_W) {
+        parser.last_int_value = -1;
+        parser.on_escape_character_set(start - 1, parser.index, "word", true);
+        return Some(UnicodeSetsConsumeResult { may_contain_strings: None });
+    }
+
+    let mut negate = false;
+    if parser._unicode_mode
+        && parser.ecma_version >= 2018
+        && (parser.eat(LATIN_SMALL_LETTER_P) || (negate = parser.eat(LATIN_CAPITAL_LETTER_P)))
+    {
+        parser.last_int_value = -1;
+        if parser.eat(LEFT_CURLY_BRACKET) {
+            if let Some(result) = parser.eat_unicode_property_value_expression() {
+                if parser.eat(RIGHT_CURLY_BRACKET) {
+                    if negate && result.strings.is_some() {
+                        parser.raise("Invalid property name");
+                    }
+
+                    parser.on_unicode_property_character_set(
+                        start - 1,
+                        parser.index,
+                        "property",
+                        &result.key,
+                        &result.value,
+                        negate,
+                        result.strings.unwrap_or(false),
+                    );
+
+                    return Some(UnicodeSetsConsumeResult {
+                        may_contain_strings: result.strings.unwrap_or(false),
+                    });
+                }
+            }
+        }
+        panic!("Invalid property name");
+    }
+
+    None
+}
+
+fn consume_k_group_name<'a>(parser: &mut Parser<'a>) -> Option<Backreference<'a>> {
+    let start = parser.index;
+
+    if parser.eat('k') {
+        if parser.eat_group_name() {
+            let group_name: String = parser.last_str_value.clone();
+            parser.back_reference_names.insert(group_name.clone());
+            return Some(Backreference {
+                span: parser.span_with_start(start),
+                reference: BackreferenceRef::Atom(group_name.as_str().into()),
+                // dummy resolved
+                resolved: CapturingGroup::default(),
+            });
+        }
+        panic!("Invalid named reference");
+    }
+
+    None
+}
+
+fn consume_character_class<'a>(parser: &mut Parser<'a>) -> Option<UnicodeSetsConsumeResult> {
+    let start = parser.index;
+
+    if parser.eat(LEFT_SQUARE_BRACKET) {
+        let negate = parser.eat(CIRCUMFLEX_ACCENT);
+        parser.on_character_class_enter(start, negate, parser._unicode_sets_mode);
+        let result = consume_class_contents(parser);
+        if !parser.eat(RIGHT_SQUARE_BRACKET) {
+            if parser.current_code_point == -1 {
+                parser.raise("Unterminated character class");
+            }
+            parser.raise("Invalid character in character class");
+        }
+        if negate && result.may_contain_strings {
+            parser.raise("Negated character class may contain strings");
+        }
+
+        parser.on_character_class_leave(start, parser.index, negate);
+
+        // * Static Semantics: MayContainStrings
+        // CharacterClass[UnicodeMode, UnicodeSetsMode] ::
+        //         [ ^ ClassContents[?UnicodeMode, ?UnicodeSetsMode] ]
+        //     1. Return false.
+        // CharacterClass :: [ ClassContents ]
+        //     1. Return MayContainStrings of the ClassContents.
+        Some(result)
+    } else {
+        None
+    }
+}
+
+/// * Consume ClassContents in a character class.
+///  * @returns `UnicodeSetsConsumeResult`.
+fn consume_class_contents<'a>(parser: &mut Parser<'a>) -> UnicodeSetsConsumeResult {
+    if parser._unicode_sets_mode {
+        if parser.current_code_point == RIGHT_SQUARE_BRACKET {
+            // [empty]
+
+            // * Static Semantics: MayContainStrings
+            // ClassContents[UnicodeMode, UnicodeSetsMode] ::
+            //         [empty]
+            //     1. Return false.
+            return UnicodeSetsConsumeResult { may_contain_strings: None };
+        }
+        let result = parser.consume_class_set_expression();
+
+        // * Static Semantics: MayContainStrings
+        // ClassContents :: ClassSetExpression
+        //     1. Return MayContainStrings of the ClassSetExpression.
+        return result;
+    }
+
+    let strict = parser.strict || parser._unicode_mode;
+    loop {
+        // Consume the first ClassAtom
+        let range_start = parser.index;
+        if !parser.consume_class_atom() {
+            break;
+        }
+        let min = parser._last_int_value;
+
+        // Consume `-`
+        if !parser.eat(HYPHEN_MINUS) {
+            continue;
+        }
+        parser.on_character(range_start - 1, parser.index, HYPHEN_MINUS);
+
+        // Consume the second ClassAtom
+        if !parser.consume_class_atom() {
+            break;
+        }
+        let max = parser._last_int_value;
+
+        // Validate
+        if min == -1 || max == -1 {
+            if strict {
+                parser.raise("Invalid character class");
+            }
+            continue;
+        }
+        if min > max {
+            parser.raise("Range out of order in character class");
+        }
+
+        parser.on_character_class_range(range_start, self.index, min, max);
+    }
+
+    // * Static Semantics: MayContainStrings
+    // ClassContents[UnicodeMode, UnicodeSetsMode] ::
+    //         NonemptyClassRanges[?UnicodeMode]
+    //     1. Return false.
+    return UnicodeSetsConsumeResult { may_contain_strings: false };
+}
+
+/**
+ * Consume ClassAtom in a character class.
+ * @returns `true` if it consumed the next characters successfully.
+ */
+fn consume_class_atom<'a>(parser: &mut Parser<'a>) -> bool {
+    let start = self.index;
+    let cp = self.current_code_point;
+
+    if cp != -1 && cp != REVERSE_SOLIDUS && cp != RIGHT_SQUARE_BRACKET {
+        self.advance();
+        self._last_int_value = cp;
+        self.on_character(start, self.index, self._last_int_value);
+        return true;
+    }
+
+    if self.eat(REVERSE_SOLIDUS) {
+        if consume_class_escape(parser) {
+            return true;
+        }
+        if !self.strict && self.current_code_point == LATIN_SMALL_LETTER_C {
+            self._last_int_value = REVERSE_SOLIDUS;
+            self.on_character(start, self.index, self._last_int_value);
+            return true;
+        }
+        if self.strict || self._unicode_mode {
+            self.raise("Invalid escape");
+        }
+        self.rewind(start);
+    }
+
+    return false;
+}
+
+/**
+ * Consume ClassEscape in a character class.
+ * @returns `true` if it consumed the next characters successfully.
+ */
+fn consume_class_escape<'a>(parser: &mut Parser<'a>) -> bool {
+    let start = self.index;
+
+    // `b`
+    if self.eat(LATIN_SMALL_LETTER_B) {
+        self._last_int_value = BACKSPACE;
+        self.on_character(start - 1, self.index, self._last_int_value);
+        return true;
+    }
+
+    // [+UnicodeMode] `-`
+    if self._unicode_mode && self.eat(HYPHEN_MINUS) {
+        self._last_int_value = HYPHEN_MINUS;
+        self.on_character(start - 1, self.index, self._last_int_value);
+        return true;
+    }
+
+    // [annexB][~UnicodeMode] `c` ClassControlLetter
+    let cp = 0;
+    if !self.strict
+        && !self._unicode_mode
+        && self.current_code_point == LATIN_SMALL_LETTER_C
+        && (is_decimal_digit((cp = self.next_code_point)) || cp == LOW_LINE)
+    {
+        self.advance();
+        self.advance();
+        self._last_int_value = cp % 0x20;
+        self.on_character(start - 1, self.index, self._last_int_value);
+        return true;
+    }
+
+    return consume_character_class_escape(parser) || consume_character_escape(parser);
+}
+
+/**
+ * Consume ClassSetExpression in a character class.
+ * @returns `UnicodeSetsConsumeResult`.
+ */
+fn consume_class_set_expression<'a>(parser: &mut Parser<'a>) -> UnicodeSetsConsumeResult {
+    let start = self.index;
+    let mut may_contain_strings: Option<bool> = None;
+    let mut result: Option<UnicodeSetsConsumeResult> = None;
+
+    if self.consume_class_set_character() {
+        if self.consume_class_set_range_from_operator(start) {
+            // ClassUnion
+            self.consume_class_union_right(UnicodeSetsConsumeResult { may_contain_strings: None });
+            return UnicodeSetsConsumeResult { may_contain_strings: false };
+        }
+        // ClassSetOperand
+
+        // * Static Semantics: MayContainStrings
+        // ClassSetOperand ::
+        //         ClassSetCharacter
+        //     1. Return false.
+        may_contain_strings = Some(false);
+    } else if let Some(res) = self.consume_class_set_operand() {
+        may_contain_strings = Some(res.may_contain_strings);
+    } else {
+        let cp = self.current_code_point;
+        if cp == REVERSE_SOLIDUS {
+            self.advance();
+            self.raise("Invalid escape");
+        }
+        if cp == self.next_code_point && is_class_set_reserved_double_punctuator_character(cp) {
+            self.raise("Invalid set operation in character class");
+        }
+        self.raise("Invalid character in character class");
+    }
+
+    if self.eat2(AMPERSAND, AMPERSAND) {
+        // ClassIntersection
+        while self.current_code_point != AMPERSAND
+            && (result = self.consume_class_set_operand()).is_some()
+        {
+            self.on_class_intersection(start, self.index);
+            if !result.as_ref().unwrap().may_contain_strings.unwrap_or(false) {
+                may_contain_strings = Some(false);
+            }
+            if self.eat2(AMPERSAND, AMPERSAND) {
+                continue;
+            }
+
+            // * Static Semantics: MayContainStrings
+            // ClassSetExpression :: ClassIntersection
+            //     1. Return MayContainStrings of the ClassIntersection.
+            // ClassIntersection :: ClassSetOperand && ClassSetOperand
+            //     1. If MayContainStrings of the first ClassSetOperand is false, return false.
+            //     2. If MayContainStrings of the second ClassSetOperand is false, return false.
+            //     3. Return true.
+            // ClassIntersection :: ClassIntersection && ClassSetOperand
+            //     1. If MayContainStrings of the ClassIntersection is false, return false.
+            //     2. If MayContainStrings of the ClassSetOperand is false, return false.
+            //     3. Return true.
+            return UnicodeSetsConsumeResult { may_contain_strings };
+        }
+
+        self.raise("Invalid character in character class");
+    }
+    if self.eat2(HYPHEN_MINUS, HYPHEN_MINUS) {
+        // ClassSubtraction
+        while self.consume_class_set_operand() {
+            self.on_class_subtraction(start, self.index);
+            if self.eat2(HYPHEN_MINUS, HYPHEN_MINUS) {
+                continue;
+            }
+            // * Static Semantics: MayContainStrings
+            // ClassSetExpression :: ClassSubtraction
+            //     1. Return MayContainStrings of the ClassSubtraction.
+            // ClassSubtraction :: ClassSetOperand -- ClassSetOperand
+            //     1. Return MayContainStrings of the first ClassSetOperand.
+            // ClassSubtraction :: ClassSubtraction -- ClassSetOperand
+            //     1. Return MayContainStrings of the ClassSubtraction.
+            return UnicodeSetsConsumeResult { may_contain_strings };
+        }
+
+        self.raise("Invalid character in character class");
+    }
+    // ClassUnion
+    return self.consume_class_union_right(UnicodeSetsConsumeResult { may_contain_strings });
+}
+
+/**
+ * Consume the right operand of a ClassUnion in a character class.
+ * @param left_result The result information for the left ClassSetRange or ClassSetOperand.
+ * @returns `UnicodeSetsConsumeResult`.
+ */
+fn consume_class_union_right<'a>(
+    parser: &mut Parser<'a>,
+    left_result: UnicodeSetsConsumeResult,
+) -> UnicodeSetsConsumeResult {
+    // ClassUnion
+    let mut may_contain_strings = left_result.may_contain_strings.unwrap_or(false);
+    loop {
+        let start = self.index;
+        if self.consume_class_set_character() {
+            self.consume_class_set_range_from_operator(start);
+            continue;
+        }
+        if let Some(result) = self.consume_class_set_operand() {
+            if result.may_contain_strings.unwrap_or(false) {
+                may_contain_strings = true;
+            }
+            continue;
+        }
+        break;
+    }
+
+    // * Static Semantics: MayContainStrings
+    // ClassSetExpression :: ClassUnion
+    //     1. Return MayContainStrings of the ClassUnion.
+    // ClassUnion :: ClassSetRange ClassUnion(opt)
+    //     1. If the ClassUnion is present, return MayContainStrings of the ClassUnion.
+    //     2. Return false.
+    // ClassUnion :: ClassSetOperand ClassUnion(opt)
+    //     1. If MayContainStrings of the ClassSetOperand is true, return true.
+    //     2. If ClassUnion is present, return MayContainStrings of the ClassUnion.
+    //     3. Return false.
+    return UnicodeSetsConsumeResult { may_contain_strings: Some(may_contain_strings) };
+}
+
+fn eat_decimal_digits<'a>(parser: &mut Parser<'a>) -> bool {
+    let start = parser.index;
+    parser.last_int_value = 0;
+    while let Some(ch) = parser.current() {
+        let Some(d) = ch.to_digit(10) else {
+            break;
+        };
+        parser.last_int_value = 10 * parser.last_int_value + d;
+        parser.advance();
+    }
+    parser.index != start
+}
+
+fn eat_hex_digits(parser: &mut Parser<'a>) -> bool {
+    let start = parser.index;
+    parser.last_int_value = 0;
+
+    while let Some(ch) = parser.current() {
+        if !ch.is_ascii_hexdigit() {
+            break;
+        }
+        parser.last_int_value =
+            16 * parser.last_int_value + ch.to_digit(16).expect("should convert successfully");
+        parser.advance();
+    }
+
+    parser.index != start
+}
+
+fn count_capturing_parens<'a>(parser: &mut Parser<'a>) -> usize {
+    let start = parser.index;
+    let mut in_class = false;
+    let mut escaped = false;
+    let mut count = 0;
+    while let Some(ch) = parser.current() {
+        if escaped {
+            escaped = false;
+        }
+        match ch {
+            '\\' => {
+                escaped = true;
+            }
+            '[' | ']' => {
+                in_class = false;
+            }
+            '(' if !in_class => {
+                if parser.nth(1) != Some(&'?')
+                    || (parser.nth(2) == Some(&'<')
+                        && !matches!(parser.nth(3), Some(&'=') | Some(&'!')))
+                {
+                    count += 1;
+                }
+            }
+            _ => {}
+        }
+        parser.advance();
+    }
+    parser.rewind(start);
+    count
+}
+
+/// * Consume NestedClass in a character class.
+///  * @returns `UnicodeSetsConsumeResult`.
+///  TODO:
+fn consume_nested_class<'a>(parser: &mut Parser<'a>) -> Option<CharacterClass> {
+    let start = self.index;
+    if self.eat(LEFT_SQUARE_BRACKET) {
+        let negate = self.eat(CIRCUMFLEX_ACCENT);
+        self.on_character_class_enter(start, negate, true);
+        let result = consume_class_contents(parser);
+        if !self.eat(RIGHT_SQUARE_BRACKET) {
+            self.raise("Unterminated character class");
+        }
+        if negate && result.may_contain_strings.unwrap_or(false) {
+            self.raise("Negated character class may contain strings");
+        }
+        self.on_character_class_leave(start, self.index, negate);
+
+        // * Static Semantics: MayContainStrings
+        // NestedClass ::
+        //         [ ^ ClassContents[+UnicodeMode, +UnicodeSetsMode] ]
+        //     1. Return false.
+        // NestedClass :: [ ClassContents ]
+        //     1. Return MayContainStrings of the ClassContents.
+        return Some(result);
+    }
+    if self.eat(REVERSE_SOLIDUS) {
+        if let Some(result) = self.consume_character_class_escape() {
+            // * Static Semantics: MayContainStrings
+            // NestedClass :: \ CharacterClassEscape
+            //     1. Return MayContainStrings of the CharacterClassEscape.
+            return Some(result);
+        }
+        self.rewind(start);
+    }
+    None
+}
+
+/**
+ * Consume ClassStringDisjunction in a character class.
+ * @returns `UnicodeSetsConsumeResult`.
+ */
+fn consume_class_string_disjunction<'a>(
+    parser: &mut Parser<'a>,
+) -> (Option<UnicodeSetsConsumeResult>, Option<ClassStringDisjunction<'a>>) {
+    let start = parser.index;
+    if parser.eat3('\\', 'q', '{') {
+        let mut i = 0;
+        let mut may_contain_strings = false;
+        let mut alternatives = parser.builder.new_vec();
+        loop {
+            let (consume_res, node) = consume_class_string(parser, i);
+            if consume_res.may_contain_strings.unwrap_or_default() {
+                may_contain_strings = true;
+            }
+            if let Some(node) = node {
+                alternatives.push(node);
+            }
+            i += 1;
+            if !parser.eat('|') {
+                break;
+            }
+        }
+
+        if parser.eat('}') {
+            // * Static Semantics: MayContainStrings
+            // ClassStringDisjunction :: \q{ ClassStringDisjunctionContents }
+            //     1. Return MayContainStrings of the ClassStringDisjunctionContents.
+            // ClassStringDisjunctionContents :: ClassString
+            //     1. Return MayContainStrings of the ClassString.
+            // ClassStringDisjunctionContents :: ClassString | ClassStringDisjunctionContents
+            //     1. If MayContainStrings of the ClassString is true, return true.
+            //     2. Return MayContainStrings of the ClassStringDisjunctionContents.
+            return (
+                Some(UnicodeSetsConsumeResult { may_contain_strings: Some(may_contain_strings) }),
+                Some(ClassStringDisjunction { span: parser.span_with_start(start), alternatives }),
+            );
+        }
+        panic!("Unterminated class string disjunction");
+    }
+    None
+}
+
+/**
+ * Consume ClassString in a character class.
+ * @param i - The index of the string alternative.
+ * @returns `UnicodeSetsConsumeResult`.
+ */
+fn consume_class_string<'a>(
+    parser: &mut Parser<'a>,
+    i: usize,
+) -> (UnicodeSetsConsumeResult, Option<StringAlternative<'a>>) {
+    let start = parser.index;
+
+    let mut count = 0;
+    let mut arr = parser.builder.new_vec();
+    while !parser.eof() {
+        if let Some(character) = consume_class_set_character(parser) {
+            arr.push(character);
+            count += 1;
+        } else {
+            break;
+        }
+    }
+
+    // * Static Semantics: MayContainStrings
+    // ClassString :: [empty]
+    //     1. Return true.
+    // ClassString :: NonEmptyClassString
+    //     1. Return MayContainStrings of the NonEmptyClassString.
+    // NonEmptyClassString :: ClassSetCharacter NonEmptyClassString(opt)
+    //     1. If NonEmptyClassString is present, return true.
+    //     2. Return false.
+    (
+        UnicodeSetsConsumeResult { may_contain_strings: Some(count != 1) },
+        Some(StringAlternative { span: parser.span_with_start(start), elements: arr }),
+    )
+}
+
+/**
+ * Consume ClassSetCharacter in a character class.
+ * Set `self._last_int_value` if it consumed the next characters successfully.
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn consume_class_set_character<'a>(parser: &mut Parser<'a>) -> Option<Character> {
+    let start = parser.index;
+    let cp = parser.current()?;
+
+    if Some(cp) != parser.next() || !is_class_set_reserved_double_punctuator_character(cp) {
+        if !is_class_set_syntax_character(cp) {
+            parser.last_int_value = cp as u32;
+            parser.advance();
+            Some(Character { span: parser.span_with_start(start), value: cp })
+        }
+    }
+
+    if parser.eat('\\') {
+        if consume_character_escape(parser) {
+            return true;
+        }
+        if let Some(ch) = parser.current()
+            && is_class_set_reserved_punctuator(ch)
+        {
+            parser.last_int_value = parser.current()? as u32;
+            parser.advance();
+
+            Some(Character {
+                span: parser.span_with_start(start),
+                value: parser.last_int_value as char,
+            })
+        }
+        if parser.eat('b') {
+            parser.last_int_value = 8;
+            Some(Character {
+                span: parser.span_with_start(start),
+                value: parser.last_int_value as char,
+            })
+        }
+        parser.rewind(start);
+    }
+
+    None
+}
+
+fn consume_character_escape<'a>(parser: &mut Parser<'a>) -> Option<Character> {
+    let start = parser.index;
+    if eat_control_escape(parser)
+        || eat_c_control_letter(parser)
+        || eat_zero(parser).is_some()
+        || eat_hex_escape_sequence(parser)
+        || eat_reg_exp_unicode_escape_sequence(parser, false)
+        || (!parser.context.strict
+            && !parser.context.unicode_mode
+            && eat_legacy_octal_escape_sequence(parser))
+        || eat_identity_escape(parser).is_some()
+    {
+        Some(Character {
+            span: parser.span_with_start(start - 1),
+            value: parser.last_int_value as char,
+        })
+    }
+    None
+}
+
+fn eat_hex_escape_sequence<'a>(parser: &mut Parser<'a>) -> bool {
+    let start = parser.index;
+    if parser.eat('x') {
+        if eat_fixed_hex_digits(parser, 2) {
+            return true;
+        }
+        if parser.context.unicode_mode || parser.context.strict {
+            panic!("Invalid escape");
+        }
+        parser.rewind(start);
+    }
+    false
+}
+
+fn eat_legacy_octal_escape_sequence<'a>(parser: &mut Parser<'a>) -> bool {
+    if eat_octal_digit(parser).is_some() {
+        let n1 = parser.last_int_value;
+        if eat_octal_digit(parser).is_some() {
+            let n2 = parser.last_int_value;
+            if n1 <= 3 && eat_octal_digit(parser).is_some() {
+                parser.last_int_value = n1 * 64 + n2 * 8 + parser.last_int_value;
+            } else {
+                parser.last_int_value = n1 * 8 + n2;
+            }
+        } else {
+            parser.last_int_value = n1;
+        }
+        return true;
+    }
+    false
+}
+
+/**
+ * Eat the next characters as a RegExp `GroupName` production if possible.
+ * Set `self._last_str_value` if the group name existed.
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_group_name<'a>(parser: &mut Parser<'a>) -> bool {
+    if parser.eat('<') {
+        if eat_reg_exp_identifier_name(parser) && parser.eat('>') {
+            return true;
+        }
+        panic!("Invalid capture group name");
+    }
+    false
+}
+
+/**
+ * Eat the next characters as a RegExp `RegExpIdentifierName` production if
+ * possible.
+ * Set `self._last_str_value` if the identifier name existed.
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_reg_exp_identifier_name<'a>(parser: &mut Parser<'a>) -> bool {
+    if eat_reg_exp_identifier_start(parser).is_some() {
+        parser.last_str_value = (parser.last_int_value as char).to_string();
+
+        while eat_reg_exp_identifier_part(parser) {
+            parser.last_str_value.push(parser.last_int_value as char);
+        }
+
+        return true;
+    }
+    false
+}
+
+/**
+ * Eat the next characters as a RegExp `RegExpIdentifierStart` production if
+ * possible.
+ * Set `self._last_int_value` if the identifier start existed.
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_reg_exp_identifier_start<'a>(parser: &mut Parser<'a>) -> Option<()> {
+    let start = parser.index;
+    let force_u_flag =
+        !parser.context.unicode_mode && parser.context.ecma_version >= EcmaVersion::V2020;
+    let mut cp = parser.current()?;
+    parser.advance();
+
+    if cp == '\\' && eat_reg_exp_unicode_escape_sequence(parser, force_u_flag) {
+        cp = char::from_u32(parser.last_int_value).expect("should convert to char");
+    } else if force_u_flag && is_lead_surrogate(cp) && is_trail_surrogate(parser.current()? as u32)
+    {
+        cp = combine_surrogate_pair(cp, parser.current().expect("should convert to u32") as u32);
+        parser.advance();
+    }
+
+    if is_identifier_start_char(cp) {
+        parser.last_int_value = cp as u32;
+        return Some(());
+    }
+
+    if parser.index != start {
+        parser.rewind(start);
+    }
+    false
+}
+
+/**
+ * Eat the next characters as a RegExp `RegExpIdentifierPart` production if possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ * RegExpIdentifierPart[UnicodeMode]::
+ *      RegExpIdentifierStart[?UnicodeMode]
+ *      DecimalDigit
+ *      \ UnicodeEscapeSequence[+UnicodeMode]
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_reg_exp_identifier_part<'a>(parser: &mut Parser<'a>) -> Option<()> {
+    let start = parser.index;
+    let force_u_flag =
+        !parser.context.unicode_mode && parser.context.ecma_version >= EcmaVersion::V2020;
+    let mut cp = parser.current()?;
+    parser.advance();
+
+    if cp == '\\' && eat_reg_exp_unicode_escape_sequence(parser, force_u_flag) {
+        cp = char::from_u32(parser.last_int_value).expect("should convert to char");
+    } else if force_u_flag
+        && is_lead_surrogate(cp as u32)
+        && is_trail_surrogate(parser.current()? as u32)
+    {
+        cp = combine_surrogate_pair(cp as u32, parser.current()? as u32);
+        parser.advance();
+    }
+
+    if is_identifier_part(cp) {
+        parser.last_int_value = cp as u32;
+        return Some(());
+    }
+
+    if parser.index != start {
+        parser.rewind(start);
+    }
+    None
+}
+
+/**
+ * Eat the next characters as the following alternatives if possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ *      `c` ControlLetter
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_c_control_letter<'a>(parser: &mut Parser<'a>) -> bool {
+    let start = parser.index;
+    if parser.eat('c') {
+        if eat_control_letter(parser).is_some() {
+            return true;
+        }
+        parser.rewind(start);
+    }
+    false
+}
+
+/**
+ * Eat the next characters as the following alternatives if possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ *      `0` [lookahead ∉ DecimalDigit]
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_zero<'a>(parser: &mut Parser<'a>) -> Option<()> {
+    if parser.current()? == '0' && parser.nth(1).map(|ch| ch.is_ascii_digit()) == Some(false) {
+        parser.last_int_value = 0;
+        parser.advance();
+        return Some(());
+    }
+    None
+}
+
+/**
+ * Eat the next characters as a RegExp `ControlEscape` production if
+ * possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ * ControlEscape:: one of
+ *      f n r t v
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_control_escape<'a>(parser: &mut Parser<'a>) -> bool {
+    if parser.eat('f') {
+        parser.last_int_value = 12;
+        return true;
+    }
+    if parser.eat('n') {
+        parser.last_int_value = 10;
+        return true;
+    }
+    if parser.eat('r') {
+        parser.last_int_value = 13;
+        return true;
+    }
+    if parser.eat('t') {
+        parser.last_int_value = 9;
+        return true;
+    }
+    if parser.eat('v') {
+        parser.last_int_value = 11;
+        return true;
+    }
+    false
+}
+
+/**
+ * Eat the next characters as the following alternatives if possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ *      `{` CodePoint `}`
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_reg_exp_unicode_code_point_escape<'a>(parser: &mut Parser<'a>) -> bool {
+    let start = parser.index;
+
+    if parser.eat('{')
+        && eat_hex_digits(parser)
+        && parser.eat('}')
+        && is_valid_unicode(parser.last_int_value as u32)
+    {
+        return true;
+    }
+
+    parser.rewind(start);
+    false
+}
+
+/**
+ * Eat the next characters as a RegExp `DecimalEscape` production if
+ * possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ * DecimalEscape::
+ *      NonZeroDigit DecimalDigits(opt) [lookahead ∉ DecimalDigit]
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_decimal_escape<'a>(parser: &mut Parser<'a>) -> Option<()> {
+    parser.last_int_value = 0;
+    let mut cp = parser.current()?;
+    if cp >= '1' && cp <= '9' {
+        while cp >= '1' && cp <= '9' {
+            parser.last_int_value =
+                10 * parser.last_int_value + cp.to_digit(10).expect("should convert successfully");
+            parser.advance();
+            cp = match parser.current() {
+                Some(ch) => ch,
+                None => break,
+            };
+        }
+        return Some(());
+    }
+    None
+}
+
+/**
+ * Eat the next characters as a RegExp `ControlLetter` production if
+ * possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ * ControlLetter:: one of
+ *      a b c d e f g h i j k l m n o p q r s t u v w x y z
+ *      A B C D E F G H I J K L M N O P Q R S T U V W X Y Z
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_control_letter<'a>(parser: &mut Parser<'a>) -> Option<()> {
+    let cp = parser.current()?;
+    if cp.is_ascii_alphabetic() {
+        parser.advance();
+        parser.last_int_value = (cp as u32) % 0x20;
+        return Some(());
+    }
+    None
+}
+
+/**
+ * Eat the next characters as a RegExp `RegExpUnicodeEscapeSequence`
+ * production if possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ * RegExpUnicodeEscapeSequence[UnicodeMode]::
+ *      [+UnicodeMode] `u` HexLeadSurrogate `\u` HexTrailSurrogate
+ *      [+UnicodeMode] `u` HexLeadSurrogate
+ *      [+UnicodeMode] `u` HexTrailSurrogate
+ *      [+UnicodeMode] `u` HexNonSurrogate
+ *      [~UnicodeMode] `u` Hex4Digits
+ *      [+UnicodeMode] `u{` CodePoint `}`
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_reg_exp_unicode_escape_sequence<'a>(parser: &mut Parser<'a>, force_u_flag: bool) -> bool {
+    let start = parser.index;
+    let u_flag = force_u_flag || parser.context.unicode_mode;
+
+    if parser.eat('u') {
+        if (u_flag && eat_reg_exp_unicode_surrogate_pair_escape(parser))
+            || eat_fixed_hex_digits(parser, 4).is_some()
+            || (u_flag && eat_reg_exp_unicode_code_point_escape(parser))
+        {
+            return true;
+        }
+        if parser.context.strict || u_flag {
+            panic!("Invalid unicode escape");
+        }
+        parser.rewind(start);
+    }
+
+    false
+}
+
+/**
+ * Eat the next characters as the following alternatives if possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ *      HexLeadSurrogate `\u` HexTrailSurrogate
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_reg_exp_unicode_surrogate_pair_escape<'a>(parser: &mut Parser<'a>) -> bool {
+    let start = parser.index;
+
+    if eat_fixed_hex_digits(parser, 4).is_some() {
+        let lead = parser.last_int_value;
+        if is_lead_surrogate(lead)
+            && parser.eat('\\')
+            && parser.eat('u')
+            && eat_fixed_hex_digits(parser, 4).is_some()
+        {
+            let trail = parser.last_int_value;
+            if is_trail_surrogate(trail) {
+                parser.last_int_value = combine_surrogate_pair(lead, trail);
+                return true;
+            }
+        }
+
+        parser.rewind(start);
+    }
+
+    false
+}
+
+/**
+ * Eat the next characters as a RegExp `IdentityEscape` production if
+ * possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ * IdentityEscape[UnicodeMode, N]::
+ *      [+UnicodeMode] SyntaxCharacter
+ *      [+UnicodeMode] `/`
+ *      [strict][~UnicodeMode] SourceCharacter but not UnicodeIDContinue
+ *      [annexB][~UnicodeMode] SourceCharacterIdentityEscape[?N]
+ * SourceCharacterIdentityEscape[N]::
+ *      [~N] SourceCharacter but not c
+ *      [+N] SourceCharacter but not one of c k
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_identity_escape<'a>(parser: &mut Parser<'a>) -> Option<()> {
+    let cp = parser.current();
+    if is_valid_identity_escape(parser, cp) {
+        parser.last_int_value = cp.unwrap() as u32;
+        parser.advance();
+        return Some(());
+    }
+    None
+}
+
+fn is_valid_identity_escape(parser: &mut Parser<'a>, cp: Option<char>) -> bool {
+    if cp.is_none() {
+        return false;
+    }
+    let cp = cp.unwrap();
+    if parser.context.unicode_mode {
+        return is_syntax_character(cp) || cp == '/';
+    }
+    if parser.context.strict {
+        return !is_id_continue(cp);
+    }
+    if parser.context.nflag {
+        return !(cp == 'c' || cp == 'k');
+    }
+    cp != 'c'
+}
+
+/**
+ * Eat the next characters as a RegExp `DecimalEscape` production if
+ * possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ * DecimalEscape::
+ *      NonZeroDigit DecimalDigits(opt) [lookahead ∉ DecimalDigit]
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_decimal_escape<'a>(parser: &mut Parser<'a>) -> Option<()> {
+    parser.last_int_value = 0;
+    let mut cp = parser.current()?;
+    if cp.is_ascii_digit() {
+        while cp.is_ascii_digit() {
+            parser.last_int_value = 10 * parser.last_int_value + cp.to_digit(10)?;
+            parser.advance();
+            cp = match parser.current() {
+                Some(char) => char,
+                None => break,
+            };
+        }
+        return Some(());
+    }
+    None
+}
+
+/**
+ * Eat the next characters as a `OctalDigit` production if possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ * OctalDigit:: one of
+ *      0 1 2 3 4 5 6 7
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_octal_digit<'a>(parser: &mut Parser<'a>) -> Option<()> {
+    let cp = parser.current()?;
+    if cp.is_digit(8) {
+        parser.advance();
+        parser.last_int_value = cp.to_digit(8)?;
+        Some(())
+    } else {
+        parser.last_int_value = 0;
+        None
+    }
+}
+
+/**
+ * Eat the next characters as the given number of `HexDigit` productions if
+ * possible.
+ * Set `self._last_int_value` if it ate the next characters successfully.
+ * ```
+ * HexDigit:: one of
+ *      0 1 2 3 4 5 6 7 8 9 a b c d e f A B C D E F
+ * ```
+ * @returns `true` if it ate the next characters successfully.
+ */
+fn eat_fixed_hex_digits<'a>(parser: &mut Parser<'a>, length: usize) -> Option<()> {
+    let start = parser.index;
+    parser.last_int_value = 0;
+    for _ in 0..length {
+        let cp = parser.current()?;
+        if !cp.is_ascii_hexdigit() {
+            parser.rewind(start);
+            return None;
+        }
+        parser.last_int_value = 16 * parser.last_int_value + cp.to_digit(16)?;
+        parser.advance();
+    }
+    Some(())
+}
+
+const MIN_CODE_POINT: u32 = 0;
+const MAX_CODE_POINT: u32 = 0x10FFFF;
+
+fn is_valid_unicode(code: u32) -> bool {
+    code >= MIN_CODE_POINT && code <= MAX_CODE_POINT
+}
diff --git a/crates/oxc_js_regex/src/util.rs b/crates/oxc_js_regex/src/util.rs
new file mode 100644
index 0000000000000..454ea5fb88bc9
--- /dev/null
+++ b/crates/oxc_js_regex/src/util.rs
@@ -0,0 +1,84 @@
+use phf::phf_set;
+
+const SYNTAX_CHARACTERS: phf::Set<char> = phf_set!['(', ')', '[', ']', '{', '}', '|', '-'];
+
+const CLASS_SET_RESERVED_DOUBLE_PUNCTUATOR_CHARACTER: phf::Set<char> = phf_set! {
+    '&' => AMPERSAND,
+    '!' => EXCLAMATION_MARK,
+    '#' => NUMBER_SIGN,
+    '$' => DOLLAR_SIGN,
+    '%' => PERCENT_SIGN,
+    '*' => ASTERISK,
+    '+' => PLUS_SIGN,
+    ',' => COMMA,
+    '.' => FULL_STOP,
+    ':' => COLON,
+    ';' => SEMICOLON,
+    '<' => LESS_THAN_SIGN,
+    '=' => EQUALS_SIGN,
+    '>' => GREATER_THAN_SIGN,
+    '?' => QUESTION_MARK,
+    '@' => COMMERCIAL_AT,
+    '^' => CIRCUMFLEX_ACCENT,
+    '`' => GRAVE_ACCENT,
+    '~' => TILDE,
+};
+
+const CLASS_SET_SYNTAX_CHARACTER: phf::Set<char> = phf_set! {
+    '(' => LEFT_PARENTHESIS,
+    ')' => RIGHT_PARENTHESIS,
+    '[' => LEFT_SQUARE_BRACKET,
+    ']' => RIGHT_SQUARE_BRACKET,
+    '{' => LEFT_CURLY_BRACKET,
+    '}' => RIGHT_CURLY_BRACKET,
+    '/' => SOLIDUS,
+    '-' => HYPHEN_MINUS,
+    '\\' => REVERSE_SOLIDUS,
+    '|' => VERTICAL_LINE,
+};
+
+const CLASS_SET_RESERVED_PUNCTUATOR: phf::Set<char> = phf_set! {
+    '&' => AMPERSAND,
+    '-' => HYPHEN_MINUS,
+    '!' => EXCLAMATION_MARK,
+    '#' => NUMBER_SIGN,
+    '%' => PERCENT_SIGN,
+    ',' => COMMA,
+    ':' => COLON,
+    ';' => SEMICOLON,
+    '<' => LESS_THAN_SIGN,
+    '=' => EQUALS_SIGN,
+    '>' => GREATER_THAN_SIGN,
+    '@' => COMMERCIAL_AT,
+    '`' => GRAVE_ACCENT,
+    '~' => TILDE,
+};
+
+#[inline]
+pub fn is_syntax_character(cp: char) -> bool {
+    SYNTAX_CHARACTERS.contains(&cp)
+}
+
+pub fn is_lead_surrogate(code: u32) -> bool {
+    code >= 0xd800 && code <= 0xdbff
+}
+
+pub fn is_trail_surrogate(code: u32) -> bool {
+    code >= 0xdc00 && code <= 0xdfff
+}
+
+pub fn combine_surrogate_pair(lead: u32, trail: u32) -> u32 {
+    (lead - 0xd800) * 0x400 + (trail - 0xdc00) + 0x10000
+}
+
+pub fn is_class_set_reserved_double_punctuator_character(cp: char) -> bool {
+    CLASS_SET_RESERVED_DOUBLE_PUNCTUATOR_CHARACTER.contains(&cp)
+}
+
+pub fn is_class_set_syntax_character(cp: char) -> bool {
+    CLASS_SET_SYNTAX_CHARACTER.contains(&cp)
+}
+
+pub fn is_class_set_reserved_punctuator(cp: char) -> bool {
+    CLASS_SET_RESERVED_PUNCTUATOR.contains(&cp)
+}