`109f5c9`

Add bitwise char class and pre-computed epsilon closures (4x speedup)

Two major optimizations:

1. Bitwise character class representation:
- Replace 256-element boolean array with 4×64-bit integers
- O(1) bit test via btest() instead of array lookup
- [a-z]+ now 2x faster than grep (was 0.5x of grep's speed)
- [a-zA-Z0-9]+ now 1.4x faster than grep (was 0.37x of grep's speed)

2. Pre-computed epsilon closures:
- Pre-compute epsilon closure for every NFA state
- Merge closures via bitwise OR instead of graph traversal
- Optional quantifier colou?r now 1.1x faster (was 0.24x)

Overall: ferp wins 38/39 benchmarks, average speedup 4.0x vs grep

Also adds benchmark.sh for automated performance testing.

Authored by

espadonne 4 months ago

SHA: 109f5c95880f0f2bfb73a19409a39bf6920123b5
Parents: 3293715
Tree: e432e11

6 changed files

Status	File	+	-
M	`Makefile`	6	3
A	`benchmark.sh`	444	0
A	`src/regex/regex_charclass.f90`	152	0
M	`src/regex/regex_nfa.f90`	3	0
M	`src/regex/regex_optimizer.f90`	77	5
M	`src/regex/regex_types.f90`	3	1

Makefilemodified

  TARGET = $(BIN_DIR)/ferp
  # Regex source files (in dependency order)
 -REGEX_SRCS = $(REGEX_DIR)/regex_types.f90 \
 +REGEX_SRCS = $(REGEX_DIR)/regex_charclass.f90 \
 +             $(REGEX_DIR)/regex_types.f90 \
               $(REGEX_DIR)/regex_lexer.f90 \
               $(REGEX_DIR)/regex_parser.f90 \
               $(REGEX_DIR)/regex_nfa.f90 \
  	$(CC) $(CFLAGS) -c $< -o $@
  # Regex module dependencies
 +$(BUILD_DIR)/regex_charclass.o:
 +$(BUILD_DIR)/regex_types.o: $(BUILD_DIR)/regex_charclass.o
  $(BUILD_DIR)/regex_lexer.o: $(BUILD_DIR)/regex_types.o
  $(BUILD_DIR)/regex_parser.o: $(BUILD_DIR)/regex_types.o
 -$(BUILD_DIR)/regex_nfa.o: $(BUILD_DIR)/regex_types.o $(BUILD_DIR)/regex_parser.o
 +$(BUILD_DIR)/regex_nfa.o: $(BUILD_DIR)/regex_types.o $(BUILD_DIR)/regex_charclass.o $(BUILD_DIR)/regex_parser.o
  $(BUILD_DIR)/regex_engine.o: $(BUILD_DIR)/regex_types.o
  $(BUILD_DIR)/aho_corasick.o:
 -$(BUILD_DIR)/regex_optimizer.o: $(BUILD_DIR)/regex_types.o $(BUILD_DIR)/aho_corasick.o
 +$(BUILD_DIR)/regex_optimizer.o: $(BUILD_DIR)/regex_types.o $(BUILD_DIR)/regex_charclass.o $(BUILD_DIR)/aho_corasick.o
  $(BUILD_DIR)/regex_api.o: $(BUILD_DIR)/regex_types.o $(BUILD_DIR)/regex_lexer.o $(BUILD_DIR)/regex_parser.o $(BUILD_DIR)/regex_nfa.o $(BUILD_DIR)/regex_engine.o $(BUILD_DIR)/regex_optimizer.o
  $(BUILD_DIR)/pcre_api.o:

benchmark.shadded

 +#!/usr/bin/env bash
 +#
 +# FERP vs grep Benchmark Suite
 +# Comprehensive performance comparison
 +#
 +# Requires: bash 4+, bc, python3 (for timing)
 +#
++
 +set -e
++
 +# Colors for output
 +RED='\033[0;31m'
 +GREEN='\033[0;32m'
 +YELLOW='\033[1;33m'
 +BLUE='\033[0;34m'
 +CYAN='\033[0;36m'
 +BOLD='\033[1m'
 +NC='\033[0m' # No Color
++
 +# Configuration
 +BENCH_DIR="/tmp/ferp_benchmark_$$"
 +FERP="./ferp"
 +GREP="grep"
 +RUNS=3  # Number of runs per benchmark (take median)
++
 +# Test file sizes
 +SMALL_LINES=10000      # ~700KB
 +MEDIUM_LINES=100000    # ~7MB
 +LARGE_LINES=1000000    # ~70MB
++
 +# Results storage (simple arrays for portability)
 +RESULT_NAMES=()
 +RESULT_FERP_TIMES=()
 +RESULT_GREP_TIMES=()
++
 +#------------------------------------------------------------------------------
 +# Utility Functions
 +#------------------------------------------------------------------------------
++
 +cleanup() {
 +    echo -e "\n${CYAN}Cleaning up...${NC}"
 +    rm -rf "$BENCH_DIR"
 +}
++
 +trap cleanup EXIT
++
 +die() {
 +    echo -e "${RED}ERROR: $1${NC}" >&2
 +    exit 1
 +}
++
 +check_prerequisites() {
 +    # Verify that every tool the suite relies on is usable before any
 +    # benchmark runs; aborts through die() on the first missing piece.
 +    echo -e "${CYAN}Checking prerequisites...${NC}"
++
 +    # Build ferp on demand when the binary is missing or not executable
 +    if [[ ! -x "$FERP" ]]; then
 +        echo -e "${YELLOW}Building ferp (release mode)...${NC}"
 +        make release >/dev/null 2>&1 || die "Failed to build ferp"
 +    fi
++
 +    # Verify ferp works
 +    echo "test" | "$FERP" "test" >/dev/null 2>&1 || die "ferp not working"
++
 +    # Check grep exists
 +    command -v "$GREP" >/dev/null 2>&1 || die "grep not found"
++
 +    # bc does all timing arithmetic; without it every reported number is
 +    # meaningless, so fail early instead of printing garbage
 +    command -v bc >/dev/null 2>&1 || die "bc not found"
++
 +    echo -e "${GREEN}Prerequisites OK${NC}"
 +}
++
 +create_test_files() {
 +    echo -e "\n${CYAN}Creating test files in $BENCH_DIR...${NC}"
 +    mkdir -p "$BENCH_DIR"
++
 +    # File 1: English-like text (varied content) - use awk for speed
 +    echo -e "  Creating english text file ($LARGE_LINES lines)..."
 +    awk -v n="$LARGE_LINES" 'BEGIN {
 +        lines[0] = "The quick brown fox jumps over the lazy dog near the riverbank."
 +        lines[1] = "Hello world, this is line number %d of the benchmark test file."
 +        lines[2] = "Lorem ipsum dolor sit amet, consectetur adipiscing elit sed do."
 +        lines[3] = "Error: connection timeout after 30000ms on server node-%d."
 +        lines[4] = "DEBUG [2024-01-15 10:23:45] Processing request id=%d status=pending"
 +        lines[5] = "user@example.com logged in from 192.168.1.%d at 12:00:00"
 +        lines[6] = "WARNING: disk usage at %d%% on /dev/sda1 partition"
 +        lines[7] = "Function calculate_total(items=[1,2,3]) returned value=%d"
 +        lines[8] = "The API endpoint /api/v2/users/%d responded with HTTP 200 OK"
 +        lines[9] = "Configuration: max_threads=16, timeout=5000, retry_count=3"
 +        for (i = 1; i <= n; i++) {
 +            idx = i % 10
 +            if (idx == 0 || idx == 2 || idx == 9) {
 +                print lines[idx]
 +            } else if (idx == 3) {
 +                printf lines[idx] "\n", i % 100
 +            } else if (idx == 5) {
 +                printf lines[idx] "\n", i % 256
 +            } else if (idx == 6) {
 +                printf lines[idx] "\n", 50 + (i % 50)
 +            } else if (idx == 7) {
 +                printf lines[idx] "\n", i * 42
 +            } else {
 +                printf lines[idx] "\n", i
 +            }
 +        }
 +    }' > "$BENCH_DIR/english_large.txt"
++
 +    # File 2: Log-like file (structured)
 +    echo -e "  Creating log file ($MEDIUM_LINES lines)..."
 +    awk -v n="$MEDIUM_LINES" 'BEGIN {
 +        levels[0] = "INFO"; levels[1] = "DEBUG"; levels[2] = "WARN"; levels[3] = "ERROR"
 +        for (i = 1; i <= n; i++) {
 +            day = 1 + (i % 28)
 +            hour = i % 24
 +            min = i % 60
 +            sec = i % 60
 +            comp = i % 20
 +            printf "[2024-01-%02d %02d:%02d:%02d] %s: Message number %d from component-%d\n", \
 +                   day, hour, min, sec, levels[i % 4], i, comp
 +        }
 +    }' > "$BENCH_DIR/logs_medium.txt"
++
 +    # File 3: Code-like file
 +    echo -e "  Creating code file ($MEDIUM_LINES lines)..."
 +    awk -v n="$MEDIUM_LINES" 'BEGIN {
 +        for (i = 1; i <= n; i++) {
 +            idx = i % 8
 +            if (idx == 0) printf "function process_data_%d(input) {\n", i
 +            else if (idx == 1) print "    const result = input.map(x => x * 2);"
 +            else if (idx == 2) print "    if (result.length > 0) {"
 +            else if (idx == 3) print "        console.log(\"Processing:\", result);"
 +            else if (idx == 4) print "        return result.filter(x => x > 10);"
 +            else if (idx == 5) print "    }"
 +            else if (idx == 6) print "    return [];"
 +            else print "}"
 +        }
 +    }' > "$BENCH_DIR/code_medium.txt"
++
 +    # File 4: CSV-like data
 +    echo -e "  Creating CSV file ($MEDIUM_LINES lines)..."
 +    awk -v n="$MEDIUM_LINES" 'BEGIN {
 +        print "id,name,email,score,timestamp"
 +        srand()
 +        for (i = 1; i <= n; i++) {
 +            score = int(rand() * 100)
 +            printf "%d,user_%d,user%d@domain%d.com,%d,%d\n", \
 +                   i, i, i, i % 100, score, 1700000000 + i
 +        }
 +    }' > "$BENCH_DIR/data_medium.csv"
++
 +    # File 5: Small file for quick tests
 +    echo -e "  Creating small file ($SMALL_LINES lines)..."
 +    head -n $SMALL_LINES "$BENCH_DIR/english_large.txt" > "$BENCH_DIR/english_small.txt"
++
 +    # Print file sizes
 +    echo -e "\n${CYAN}Test files created:${NC}"
 +    ls -lh "$BENCH_DIR"/*.txt "$BENCH_DIR"/*.csv 2>/dev/null | awk '{print "  " $9 ": " $5}'
 +}
++
 +#------------------------------------------------------------------------------
 +# Benchmark Functions
 +#------------------------------------------------------------------------------
++
 +# Run a command multiple times and return median time
 +#   $1  command string, executed with eval (its output is discarded)
 +# Prints the median of RUNS measurements, in seconds, on stdout.
 +# NOTE(review): benchmark_pattern calls run_timed_portable, not this
 +# function; no caller of run_timed is visible in this script.
 +run_timed() {
 +    local cmd="$1"
 +    local times=()
++
 +    for i in $(seq 1 $RUNS); do
 +        # Time with bash's `time` keyword (not /usr/bin/time, which could not
 +        # run `eval`); keep only the "real" line and strip its label
 +        local t=$( { time eval "$cmd" >/dev/null 2>&1; } 2>&1 | grep real | sed 's/real[[:space:]]*//' )
 +        # Convert to seconds (handles both 0m0.123s and 0.123 formats)
 +        if [[ "$t" =~ ([0-9]+)m([0-9.]+)s ]]; then
 +            local mins="${BASH_REMATCH[1]}"
 +            local secs="${BASH_REMATCH[2]}"
 +            t=$(echo "$mins * 60 + $secs" | bc -l)
 +        elif [[ "$t" =~ ^[0-9.]+$ ]]; then
 +            : # already in seconds
 +        else
 +            # Unparseable output: record a sentinel so the sort still works
 +            t="999"  # Error case
 +        fi
 +        times+=("$t")
 +    done
++
 +    # Return median (sort and take middle); for an even RUNS this picks the
 +    # lower of the two middle values
 +    printf '%s\n' "${times[@]}" | sort -n | sed -n "$((($RUNS + 1) / 2))p"
 +}
++
 +# Wall-clock timing that does not depend on the output format of `time`.
 +#   $1  command string, executed with eval (its output is discarded)
 +# Prints the median of RUNS measurements, in seconds, on stdout.
 +#
 +# Timestamps are read from bash's EPOCHREALTIME when the shell provides it
 +# (bash 5+), which costs no extra process. Older shells fall back to
 +# python3, then to `date +%s.%N`; those spawn a process around every run,
 +# so their start-up cost is included in each measurement.
 +run_timed_portable() {
 +    local cmd="$1"
 +    local times=()
 +    local i start end t
++
 +    for i in $(seq 1 "$RUNS"); do
 +        if [[ -n "${EPOCHREALTIME:-}" ]]; then
 +            # The radix character follows the locale; bc needs a dot
 +            start="${EPOCHREALTIME/,/.}"
 +            eval "$cmd" >/dev/null 2>&1
 +            end="${EPOCHREALTIME/,/.}"
 +        else
 +            start=$(python3 -c 'import time; print(time.time())' 2>/dev/null || date +%s.%N)
 +            eval "$cmd" >/dev/null 2>&1
 +            end=$(python3 -c 'import time; print(time.time())' 2>/dev/null || date +%s.%N)
 +        fi
 +        t=$(echo "$end - $start" | bc -l)
 +        times+=("$t")
 +    done
++
 +    # Return median (for an even RUNS, the lower of the two middle values)
 +    printf '%s\n' "${times[@]}" | sort -n | sed -n "$((($RUNS + 1) / 2))p"
 +}
++
 +benchmark_pattern() {
 +    # Time one pattern under ferp and under grep, print a result row, and
 +    # append the measurements to the RESULT_* arrays.
 +    #   $1 name       label shown in the report
 +    #   $2 file       input file to search
 +    #   $3 ferp_args  extra options passed to ferp
 +    #   $4 grep_args  extra options passed to grep
 +    #   $5 pattern    search pattern; it is single-quoted into the command
 +    #                 string, so it must not itself contain a single quote
 +    local name="$1"
 +    local file="$2"
 +    local ferp_args="$3"
 +    local grep_args="$4"
 +    local pattern="$5"
++
 +    printf "  %-35s" "$name"
++
 +    # Run ferp
 +    local ferp_time=$(run_timed_portable "$FERP $ferp_args '$pattern' '$file'")
++
 +    # Run grep
 +    local grep_time=$(run_timed_portable "$GREP $grep_args '$pattern' '$file'")
++
 +    # Store results
 +    RESULT_NAMES+=("$name")
 +    RESULT_FERP_TIMES+=("$ferp_time")
 +    RESULT_GREP_TIMES+=("$grep_time")
++
 +    # Calculate speedup (>1 means ferp is faster). It stays "N/A" when a time
 +    # is missing or ferp's time is not positive, so bc never divides by zero.
 +    local speedup="N/A"
 +    local numeric='^[0-9]*\.?[0-9]+$'
 +    if [[ "$ferp_time" =~ $numeric && "$grep_time" =~ $numeric ]] \
 +       && (( $(echo "$ferp_time > 0" | bc -l) )); then
 +        speedup=$(echo "scale=2; $grep_time / $ferp_time" | bc -l)
 +    fi
++
 +    # A non-numeric speedup cannot go through %f: printf would fail and,
 +    # under `set -e`, abort the whole suite. Print the row as plain text.
 +    if [[ "$speedup" == "N/A" ]]; then
 +        printf "ferp: %6ss  grep: %6ss  %5s\n" "${ferp_time:-?}" "${grep_time:-?}" "$speedup"
 +        return 0
 +    fi
++
 +    # Color-code the speedup
 +    local color="$NC"
 +    if (( $(echo "$speedup > 1.5" | bc -l) )); then
 +        color="$GREEN"
 +    elif (( $(echo "$speedup < 0.8" | bc -l) )); then
 +        color="$RED"
 +    fi
++
 +    printf "ferp: %6.3fs  grep: %6.3fs  ${color}%5.2fx${NC}\n" "$ferp_time" "$grep_time" "$speedup"
 +}
++
 +#------------------------------------------------------------------------------
 +# Benchmark Suites
 +#------------------------------------------------------------------------------
++
 +run_literal_benchmarks() {
 +    echo -e "\n${BOLD}${BLUE}=== Literal String Matching ===${NC}"
 +    local file="$BENCH_DIR/english_large.txt"
++
 +    benchmark_pattern "Simple word (hello)" "$file" "" "" "hello"
 +    benchmark_pattern "Common word (the)" "$file" "" "" "the"
 +    benchmark_pattern "Longer phrase (quick brown)" "$file" "" "" "quick brown"
 +    benchmark_pattern "Case insensitive (-i hello)" "$file" "-i" "-i" "hello"
 +    benchmark_pattern "Fixed string (-F hello)" "$file" "-F" "-F" "hello"
 +    benchmark_pattern "Word boundary (-w the)" "$file" "-w" "-w" "the"
 +}
++
 +run_regex_benchmarks() {
 +    echo -e "\n${BOLD}${BLUE}=== Regular Expression Matching ===${NC}"
 +    local file="$BENCH_DIR/english_large.txt"
++
 +    benchmark_pattern "Dot wildcard (h.llo)" "$file" "" "" "h.llo"
 +    benchmark_pattern "Star quantifier (hel*o)" "$file" "" "" "hel*o"
 +    benchmark_pattern "Character class ([a-z]+)" "$file" "-E" "-E" "[a-z]+"
 +    benchmark_pattern "Mixed class ([a-zA-Z0-9]+)" "$file" "-E" "-E" "[a-zA-Z0-9]+"
 +    benchmark_pattern "Digit class ([0-9]+)" "$file" "-E" "-E" "[0-9]+"
 +    benchmark_pattern "Alternation (cat|dog|fox)" "$file" "-E" "-E" "cat|dog|fox"
 +    benchmark_pattern "Optional (colou?r)" "$file" "-E" "-E" "colou?r"
 +    benchmark_pattern "One or more (hel+o)" "$file" "-E" "-E" "hel+o"
 +}
++
 +run_anchor_benchmarks() {
 +    echo -e "\n${BOLD}${BLUE}=== Anchor Patterns ===${NC}"
 +    local file="$BENCH_DIR/english_large.txt"
++
 +    benchmark_pattern "Start anchor (^The)" "$file" "" "" "^The"
 +    benchmark_pattern "End anchor (\\.$)" "$file" "" "" '\.$'
 +    benchmark_pattern "Both anchors (^The.*dog$)" "$file" "-E" "-E" "^The.*dog$"
 +    benchmark_pattern "Word start (\\<quick)" "$file" "" "" '\<quick'
 +    benchmark_pattern "Word end (fox\\>)" "$file" "" "" 'fox\>'
 +}
++
 +run_log_benchmarks() {
 +    echo -e "\n${BOLD}${BLUE}=== Log File Patterns ===${NC}"
 +    local file="$BENCH_DIR/logs_medium.txt"
++
 +    benchmark_pattern "Log level (ERROR)" "$file" "" "" "ERROR"
 +    benchmark_pattern "Log level (-i warn)" "$file" "-i" "-i" "warn"
 +    benchmark_pattern "Timestamp pattern ([0-9]{2}:[0-9]{2})" "$file" "-E" "-E" "[0-9]{2}:[0-9]{2}"
 +    benchmark_pattern "Component (component-[0-9]+)" "$file" "-E" "-E" "component-[0-9]+"
 +    benchmark_pattern "Multiple levels (ERROR|WARN)" "$file" "-E" "-E" "ERROR|WARN"
 +}
++
 +run_code_benchmarks() {
 +    echo -e "\n${BOLD}${BLUE}=== Code Pattern Matching ===${NC}"
 +    local file="$BENCH_DIR/code_medium.txt"
++
 +    benchmark_pattern "Function name (function)" "$file" "" "" "function"
 +    benchmark_pattern "Variable (const|let|var)" "$file" "-E" "-E" "const|let|var"
 +    benchmark_pattern "Return statement (return)" "$file" "" "" "return"
 +    benchmark_pattern "Console log (console\\.log)" "$file" "-E" "-E" "console\\.log"
 +}
++
 +run_csv_benchmarks() {
 +    echo -e "\n${BOLD}${BLUE}=== CSV/Data Pattern Matching ===${NC}"
 +    local file="$BENCH_DIR/data_medium.csv"
++
 +    benchmark_pattern "Email pattern (@.*\\.com)" "$file" "-E" "-E" "@.*\\.com"
 +    benchmark_pattern "Specific domain (domain50)" "$file" "" "" "domain50"
 +    benchmark_pattern "User pattern (user_[0-9]+)" "$file" "-E" "-E" "user_[0-9]+"
 +    benchmark_pattern "High score (,[89][0-9],)" "$file" "-E" "-E" ",[89][0-9],"
 +}
++
 +run_special_benchmarks() {
 +    echo -e "\n${BOLD}${BLUE}=== Special Cases ===${NC}"
 +    local file="$BENCH_DIR/english_large.txt"
++
 +    benchmark_pattern "Invert match (-v error)" "$file" "-v" "-v" "error"
 +    benchmark_pattern "Count only (-c the)" "$file" "-c" "-c" "the"
 +    benchmark_pattern "Line number (-n hello)" "$file" "-n" "-n" "hello"
 +    benchmark_pattern "Multiple patterns (cat|dog|bird|fish)" "$file" "-E" "-E" "cat|dog|bird|fish"
 +    benchmark_pattern "Long alternation (the|and|for|with|from)" "$file" "-E" "-E" "the|and|for|with|from"
 +}
++
 +run_scaling_benchmarks() {
 +    echo -e "\n${BOLD}${BLUE}=== Scaling Tests ===${NC}"
++
 +    echo -e "  ${CYAN}Small file (~700KB):${NC}"
 +    benchmark_pattern "  [a-z]+ on small" "$BENCH_DIR/english_small.txt" "-E" "-E" "[a-z]+"
++
 +    echo -e "  ${CYAN}Large file (~70MB):${NC}"
 +    benchmark_pattern "  [a-z]+ on large" "$BENCH_DIR/english_large.txt" "-E" "-E" "[a-z]+"
++
 +    # Calculate scaling factor (get last two results)
 +    local num_results=${#RESULT_FERP_TIMES[@]}
 +    local small_ferp="${RESULT_FERP_TIMES[$((num_results-2))]}"
 +    local large_ferp="${RESULT_FERP_TIMES[$((num_results-1))]}"
 +    local small_grep="${RESULT_GREP_TIMES[$((num_results-2))]}"
 +    local large_grep="${RESULT_GREP_TIMES[$((num_results-1))]}"
++
 +    echo -e "\n  ${CYAN}Scaling (large/small ratio):${NC}"
 +    local ferp_scale=$(echo "scale=1; $large_ferp / $small_ferp" | bc -l 2>/dev/null || echo "N/A")
 +    local grep_scale=$(echo "scale=1; $large_grep / $small_grep" | bc -l 2>/dev/null || echo "N/A")
 +    echo -e "    ferp: ${ferp_scale}x  grep: ${grep_scale}x  (lower is better for large files)"
 +}
++
 +#------------------------------------------------------------------------------
 +# Report Generation
 +#------------------------------------------------------------------------------
++
 +print_summary() {
 +    echo -e "\n${BOLD}${BLUE}══════════════════════════════════════════════════════════════${NC}"
 +    echo -e "${BOLD}${BLUE}                        SUMMARY                                 ${NC}"
 +    echo -e "${BOLD}${BLUE}══════════════════════════════════════════════════════════════${NC}"
++
 +    local total_ferp=0
 +    local total_grep=0
 +    local wins_ferp=0
 +    local wins_grep=0
 +    local count=${#RESULT_NAMES[@]}
++
 +    for i in "${!RESULT_NAMES[@]}"; do
 +        local ft="${RESULT_FERP_TIMES[$i]}"
 +        local gt="${RESULT_GREP_TIMES[$i]}"
 +        total_ferp=$(echo "$total_ferp + $ft" | bc -l)
 +        total_grep=$(echo "$total_grep + $gt" | bc -l)
++
 +        if (( $(echo "$ft < $gt" | bc -l) )); then
 +            wins_ferp=$((wins_ferp + 1))
 +        else
 +            wins_grep=$((wins_grep + 1))
 +        fi
 +    done
++
 +    local avg_speedup=$(echo "scale=2; $total_grep / $total_ferp" | bc -l 2>/dev/null || echo "N/A")
++
 +    echo -e "\n${CYAN}Overall Statistics:${NC}"
 +    echo -e "  Total benchmarks run: $count"
 +    echo -e "  ferp wins: ${GREEN}$wins_ferp${NC}"
 +    echo -e "  grep wins: ${RED}$wins_grep${NC}"
 +    printf "  Total time - ferp: %.3fs  grep: %.3fs\n" "$total_ferp" "$total_grep"
 +    echo -e "  ${BOLD}Average speedup: ${GREEN}${avg_speedup}x${NC}"
++
 +    echo -e "\n${CYAN}System Information:${NC}"
 +    echo -e "  OS: $(uname -s) $(uname -r)"
 +    echo -e "  CPU: $(sysctl -n machdep.cpu.brand_string 2>/dev/null || lscpu 2>/dev/null | grep 'Model name' | cut -d: -f2 | xargs || echo 'Unknown')"
 +    echo -e "  ferp version: $($FERP --version 2>&1 | head -1 || echo 'Unknown')"
 +    echo -e "  grep version: $($GREP --version 2>&1 | head -1 || echo 'Unknown')"
 +    echo -e "  Runs per benchmark: $RUNS (median taken)"
++
 +    echo -e "\n${BOLD}${BLUE}══════════════════════════════════════════════════════════════${NC}"
 +}
++
 +#------------------------------------------------------------------------------
 +# Main
 +#------------------------------------------------------------------------------
++
 +main() {
 +    echo -e "${BOLD}${BLUE}"
 +    echo "╔══════════════════════════════════════════════════════════════╗"
 +    echo "║           FERP vs grep Benchmark Suite                       ║"
 +    echo "║           Comprehensive Performance Comparison               ║"
 +    echo "╚══════════════════════════════════════════════════════════════╝"
 +    echo -e "${NC}"
++
 +    check_prerequisites
 +    create_test_files
++
 +    echo -e "\n${BOLD}${CYAN}Running benchmarks (${RUNS} runs each, reporting median)...${NC}"
 +    echo -e "${CYAN}Format: ferp time | grep time | speedup (>1 = ferp faster)${NC}\n"
++
 +    run_literal_benchmarks
 +    run_regex_benchmarks
 +    run_anchor_benchmarks
 +    run_log_benchmarks
 +    run_code_benchmarks
 +    run_csv_benchmarks
 +    run_special_benchmarks
 +    run_scaling_benchmarks
++
 +    print_summary
++
 +    echo -e "\n${GREEN}Benchmark complete!${NC}"
 +}
++
 +# Run with optional arguments
 +if [[ "$1" == "-h" || "$1" == "--help" ]]; then
 +    echo "Usage: $0 [OPTIONS]"
 +    echo ""
 +    echo "Options:"
 +    echo "  -r, --runs N    Number of runs per benchmark (default: 3)"
 +    echo "  -q, --quick     Quick mode (smaller files, fewer runs)"
 +    echo "  -h, --help      Show this help"
 +    exit 0
 +fi
++
 +if [[ "$1" == "-q" || "$1" == "--quick" ]]; then
 +    RUNS=1
 +    SMALL_LINES=1000
 +    MEDIUM_LINES=10000
 +    LARGE_LINES=100000
 +    echo -e "${YELLOW}Quick mode: reduced file sizes and single run${NC}"
 +fi
++
 +if [[ "$1" == "-r" || "$1" == "--runs" ]]; then
 +    RUNS="${2:-3}"
 +fi
++
 +main

src/regex/regex_charclass.f90added

 +module regex_charclass
 +  !> High-performance bitwise character class operations for FERP
 +  !> Uses 256-bit representation (4 x 64-bit integers) instead of boolean array
 +  !> Membership is a single bit test on one of the four words
 +  use, intrinsic :: iso_fortran_env, only: int64
 +  implicit none
 +  private
++
 +  public :: char_class_bits_t
 +  public :: charclass_from_array, charclass_test, charclass_test_case_insensitive
 +  public :: charclass_set, charclass_clear, charclass_set_range
 +  public :: charclass_add_case_variants
++
 +  integer, parameter :: bits_per_word = 64
 +  integer, parameter :: max_char_code = 255
 +  ! Case folding only covers the ASCII letters A-Z / a-z
 +  integer, parameter :: upper_a = iachar('A'), upper_z = iachar('Z')
 +  integer, parameter :: lower_a = iachar('a'), lower_z = iachar('z')
 +  integer, parameter :: case_offset = lower_a - upper_a
++
 +  !> Bitwise character class - 256 bits in 4 words
 +  type :: char_class_bits_t
 +    integer(int64) :: words(4) = 0_int64  ! bits 0-63, 64-127, 128-191, 192-255
 +    logical :: negated = .false.          ! when set, the tests invert their result
 +  end type char_class_bits_t
++
 +contains
++
 +  pure function has_bit(cc, char_code) result(is_set)
 +    !> Raw bit lookup for a character code, ignoring the negated flag.
 +    !> The caller must pass a code in 0..255.
 +    type(char_class_bits_t), intent(in) :: cc
 +    integer, intent(in) :: char_code
 +    logical :: is_set
++
 +    is_set = btest(cc%words(char_code / bits_per_word + 1), mod(char_code, bits_per_word))
 +  end function has_bit
++
 +  pure subroutine charclass_clear(cc)
 +    !> Clear all bits and reset the negated flag
 +    type(char_class_bits_t), intent(inout) :: cc
++
 +    cc%words = 0_int64
 +    cc%negated = .false.
 +  end subroutine charclass_clear
++
 +  pure subroutine charclass_set(cc, char_code)
 +    !> Set a single character bit; codes outside 0..255 are ignored
 +    type(char_class_bits_t), intent(inout) :: cc
 +    integer, intent(in) :: char_code
 +    integer :: word_idx
++
 +    if (char_code < 0 .or. char_code > max_char_code) return
 +    word_idx = char_code / bits_per_word + 1  ! 1-based index
 +    cc%words(word_idx) = ibset(cc%words(word_idx), mod(char_code, bits_per_word))
 +  end subroutine charclass_set
++
 +  pure subroutine charclass_set_range(cc, start_char, end_char)
 +    !> Set every character bit in start_char..end_char (inclusive).
 +    !> The range is clamped to 0..255 first, so an oversized request costs
 +    !> at most 256 iterations; an empty or reversed range sets nothing.
 +    type(char_class_bits_t), intent(inout) :: cc
 +    integer, intent(in) :: start_char, end_char
 +    integer :: i
++
 +    do i = max(start_char, 0), min(end_char, max_char_code)
 +      call charclass_set(cc, i)
 +    end do
 +  end subroutine charclass_set_range
++
 +  pure function charclass_test(cc, c) result(res)
 +    !> Test if character is in class: one bit test, inverted when the
 +    !> class is negated
 +    type(char_class_bits_t), intent(in) :: cc
 +    character(len=1), intent(in) :: c
 +    logical :: res
++
 +    res = has_bit(cc, ichar(c)) .neqv. cc%negated
 +  end function charclass_test
++
 +  pure function charclass_test_case_insensitive(cc, c) result(res)
 +    !> Test character with case insensitivity: the character matches when
 +    !> either it or its ASCII case counterpart is in the class. Negation is
 +    !> applied after both cases have been checked.
 +    type(char_class_bits_t), intent(in) :: cc
 +    character(len=1), intent(in) :: c
 +    logical :: res
++
 +    integer :: char_code
++
 +    char_code = ichar(c)
 +    res = has_bit(cc, char_code)
++
 +    ! Only letters have a counterpart worth a second lookup
 +    if (.not. res) then
 +      select case (char_code)
 +      case (upper_a:upper_z)
 +        res = has_bit(cc, char_code + case_offset)
 +      case (lower_a:lower_z)
 +        res = has_bit(cc, char_code - case_offset)
 +      end select
 +    end if
++
 +    res = res .neqv. cc%negated
 +  end function charclass_test_case_insensitive
++
 +  pure subroutine charclass_from_array(cc, char_class_array, negated)
 +    !> Convert 256-element boolean array to bitwise format
 +    !> char_class_array(i) true means character code i is a member;
 +    !> negated is copied into the result unchanged
 +    type(char_class_bits_t), intent(out) :: cc
 +    logical, intent(in) :: char_class_array(0:255)
 +    logical, intent(in) :: negated
++
 +    integer :: i
++
 +    cc%words = 0_int64
 +    cc%negated = negated
++
 +    do i = 0, max_char_code
 +      if (char_class_array(i)) call charclass_set(cc, i)
 +    end do
 +  end subroutine charclass_from_array
++
 +  pure subroutine charclass_add_case_variants(cc)
 +    !> Pre-compute case variants into the character class
 +    !> For every ASCII letter already in the class, its other-case form is
 +    !> added as well; the negated flag is left untouched
 +    type(char_class_bits_t), intent(inout) :: cc
++
 +    type(char_class_bits_t) :: snapshot
 +    integer :: upper
++
 +    ! Decide from a copy so bits added here never trigger further additions
 +    snapshot = cc
++
 +    do upper = upper_a, upper_z
 +      if (has_bit(snapshot, upper)) call charclass_set(cc, upper + case_offset)
 +      if (has_bit(snapshot, upper + case_offset)) call charclass_set(cc, upper)
 +    end do
 +  end subroutine charclass_add_case_variants
++
 +end module regex_charclass

src/regex/regex_nfa.f90modified

    !> Thompson NFA construction from AST
    !> Implements the classic Thompson construction algorithm
    use regex_types
 +  use regex_charclass
    use regex_parser, only: ast_pool_t
    implicit none
    private
          trans%trans_type = TRANS_CLASS
          trans%char_class = node%char_class
          trans%negated = node%negated
 +        ! Pre-compute bitwise character class for fast matching
 +        call charclass_from_array(trans%char_bits, node%char_class, node%negated)
          trans%target = s2
          call nfa%states(s1)%add_trans(trans)

src/regex/regex_optimizer.f90modified

    !>   - Lazy DFA state caching
    !>   - Anchored pattern fast paths
    !>   - Aho-Corasick for alternation patterns
 +  !>   - Bitwise character class matching
    use regex_types
 +  use regex_charclass
    use aho_corasick
    implicit none
    private
      logical :: anchored_end = .false.            ! Pattern ends with $
      integer :: skip_table(0:255) = 0             ! Boyer-Moore skip table for prefix
      type(state_set_t) :: start_closure           ! Pre-computed start state epsilon closure
 +    type(state_set_t), allocatable :: epsilon_closures(:)  ! Pre-computed epsilon closures per state
      type(dfa_cache_entry_t) :: dfa_cache(DFA_CACHE_SIZE)  ! Lazy DFA cache
      type(compiled_dfa_t) :: dfa                  ! Full compiled DFA (if available)
      logical :: use_dfa = .false.                 ! Use DFA instead of NFA
      ! Pre-compute start state epsilon closure (position-independent part)
      call precompute_start_closure(opt)
 +    ! Pre-compute epsilon closures for all states (for fast expansion)
 +    call precompute_all_epsilon_closures(opt)
++
      ! Clear DFA cache
      opt%dfa_cache%valid = .false.
      end do
    end subroutine compute_epsilon_closure_basic
 +  subroutine precompute_all_epsilon_closures(opt)
 +    !> Pre-compute epsilon closure for every NFA state
 +    !> Fills opt%epsilon_closures(i) with the closure of state i, as produced
 +    !> by compute_epsilon_closure_basic, so matching can merge stored closures
 +    !> instead of traversing epsilon transitions again.
 +    !> For an NFA with no states the table is left unallocated.
 +    type(optimized_nfa_t), intent(inout) :: opt
++
 +    integer :: state, num_states
++
 +    ! Release any table from an earlier compilation before the early return,
 +    ! so an empty NFA never keeps a stale table allocated
 +    if (allocated(opt%epsilon_closures)) deallocate(opt%epsilon_closures)
++
 +    num_states = opt%nfa%num_states
 +    if (num_states <= 0) return
++
 +    allocate(opt%epsilon_closures(num_states))
++
 +    ! Compute epsilon closure for each state
 +    do state = 1, num_states
 +      call opt%epsilon_closures(state)%clear()
 +      call compute_epsilon_closure_basic(opt%nfa, state, opt%epsilon_closures(state))
 +    end do
 +  end subroutine precompute_all_epsilon_closures
++
    function has_anchor_transitions(nfa) result(has_anchors)
      !> Check if NFA has any anchor transitions (position-dependent)
      !> These include ^, $, \<, \>, \b, \B
          ! Compute epsilon closure of result
          if (.not. next_set%is_empty()) then
 -          call expand_epsilon_closure_simple(opt%nfa, next_set)
 +          call expand_epsilon_closure_simple(opt, next_set)
          end if
          if (next_set%is_empty()) then
      end do
    end subroutine compute_char_transitions_simple
 -  subroutine expand_epsilon_closure_simple(nfa, state_set)
 +  subroutine expand_epsilon_closure_simple(opt, state_set)
      !> Expand state set to include epsilon closure (in-place)
 +    !> Uses pre-computed closures for O(1) lookup per state
 +    type(optimized_nfa_t), intent(in) :: opt
 +    type(state_set_t), intent(inout) :: state_set
++
 +    integer :: word_idx, bit_idx, state, j
 +    integer(8) :: word, mask, original_bits(size(state_set%bits))
++
 +    ! If no pre-computed closures, fall back to computing on-the-fly
 +    if (.not. allocated(opt%epsilon_closures)) then
 +      call expand_epsilon_closure_simple_fallback(opt%nfa, state_set)
 +      return
 +    end if
++
 +    ! Save original bits to avoid processing newly added states
 +    original_bits = state_set%bits
++
 +    ! Expand using pre-computed closures - just OR the bit vectors
 +    do word_idx = 1, size(original_bits)
 +      word = original_bits(word_idx)
 +      if (word == 0) cycle
++
 +      do bit_idx = 0, 63
 +        mask = ishft(1_8, bit_idx)
 +        if (iand(word, mask) /= 0) then
 +          state = (word_idx - 1) * 64 + bit_idx + 1
 +          if (state >= 1 .and. state <= opt%nfa%num_states) then
 +            ! Merge pre-computed epsilon closure using bitwise OR
 +            do j = 1, size(state_set%bits)
 +              state_set%bits(j) = ior(state_set%bits(j), opt%epsilon_closures(state)%bits(j))
 +            end do
 +          end if
 +        end if
 +      end do
 +    end do
 +  end subroutine expand_epsilon_closure_simple
++
 +  subroutine expand_epsilon_closure_simple_fallback(nfa, state_set)
 +    !> Fallback: compute epsilon closure on-the-fly
      type(nfa_t), intent(in) :: nfa
      type(state_set_t), intent(inout) :: state_set
      end do
      call state_set%copy_from(result)
 -  end subroutine expand_epsilon_closure_simple
 +  end subroutine expand_epsilon_closure_simple_fallback
    !---------------------------------------------------------------------------
    ! Optimized Search: Use prefix to skip positions
                  end if
                case (TRANS_CLASS)
 -                if (char_in_class_opt(c, trans%char_class, trans%negated, ignore_case)) then
 -                  call next_set%add(trans%target)
 +                ! Use fast bitwise character class test
 +                if (ignore_case) then
 +                  if (charclass_test_case_insensitive(trans%char_bits, c)) then
 +                    call next_set%add(trans%target)
 +                  end if
 +                else
 +                  if (charclass_test(trans%char_bits, c)) then
 +                    call next_set%add(trans%target)
 +                  end if
                  end if
                case (TRANS_ANY)

src/regex/regex_types.f90modified

  module regex_types
    !> Core data types for the FERP regex engine
    !> Defines tokens, AST nodes, and NFA structures
 +  use regex_charclass
    implicit none
    private
    type :: nfa_transition_t
      integer :: trans_type = TRANS_EPSILON   ! Transition type
      character(len=1) :: match_char = ' '    ! For TRANS_CHAR
 -    logical :: char_class(0:255) = .false.  ! For TRANS_CLASS
 +    logical :: char_class(0:255) = .false.  ! For TRANS_CLASS (legacy)
 +    type(char_class_bits_t) :: char_bits    ! Bitwise char class (fast)
      logical :: negated = .false.            ! For negated classes
      integer :: target = 0                   ! Target state index