#!/bin/ksh
#
# Generate a tree of dummy "site_N" directories in the current working
# directory. Each directory receives an index.html made of random ASCII
# filler followed by a small HTML skeleton containing a per-site keyword.
#
# Usage: run from the directory that should hold the site_* directories.
# Exit status: 0 on success, 1 if a directory or file cannot be written.

# Treat use of an unset variable as an error instead of expanding to "".
set -u

# Number of site directories (and index.html files) to create.
TOTAL=500

# Number of 1 KiB blocks read from /dev/urandom per file. The resulting file
# is smaller than this, because tr discards every byte outside its allowed
# character set.
BLOCK_SIZE=16

# Print a message on stderr and abort the script.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Plain arithmetic loop instead of `seq`, which is not part of POSIX and is
# not installed on every system that ships ksh.
i=1
while [ "$i" -le "$TOTAL" ]; do
  # Unique directory name for this site.
  DIR="site_$i"
  mkdir -p "$DIR" || die "cannot create directory $DIR"

  {
    # 1. Random filler restricted to letters, digits, spaces and newlines,
    #    i.e. plain ASCII (which is also valid UTF-8). LC_ALL=C makes tr work
    #    on raw bytes; in a multibyte locale some tr implementations reject
    #    the random input with "Illegal byte sequence".
    dd if=/dev/urandom bs=1024 count="$BLOCK_SIZE" 2>/dev/null |
      LC_ALL=C tr -dc 'a-zA-Z0-9 \n'

    # 2. HTML skeleton placed after the filler. Per the original note, a
    #    separate script matches the title and <main> tags with regexes, so
    #    every tag is emitted and closed here.
    #    NOTE(review): confirm the exact markup that consumer expects.
    cat <<EOF
<html><head><title>Site $i</title></head><body><main>

Searchable content here for keyword_$i. Lorem ipsum text follows.

</main></body></html>
EOF
  } > "$DIR/index.html" || die "cannot write $DIR/index.html"

  # Progress report every 100 files.
  if [ $((i % 100)) -eq 0 ]; then
    printf 'Created %s files...\n' "$i"
  fi

  i=$((i + 1))
done

# Report the real count rather than a hard-coded number.
printf 'Done! %s directories created with valid text.\n' "$TOTAL"