summary refs log tree commit diff stats
path: root/_site/cgi-bin/seed.sh
diff options
context:
space:
mode:
Diffstat (limited to '_site/cgi-bin/seed.sh')
-rwxr-xr-x _site/cgi-bin/seed.sh 28
1 files changed, 28 insertions, 0 deletions
diff --git a/_site/cgi-bin/seed.sh b/_site/cgi-bin/seed.sh
new file mode 100755
index 0000000..9d85108
--- /dev/null
+++ b/_site/cgi-bin/seed.sh
@@ -0,0 +1,28 @@
+#!/bin/ksh
+# Seed the current directory with test pages site_1/index.html .. site_TOTAL/index.html.
+
+# Number of site_N directories (one index.html each) to create.
+TOTAL=10000
+# 1024-byte blocks read from /dev/urandom per page, before tr filters them.
+BLOCK_SIZE=16
+
+# Count with shell arithmetic instead of seq(1), which POSIX does not specify.
+i=1
+while [ "$i" -le "$TOTAL" ]; do
+  DIR="site_$i"
+  mkdir -p "$DIR" || exit 1 # stop if the directory cannot be created
+
+  # Random filler: tr keeps only letters, digits, spaces and newlines, so the
+  # page is plain ASCII and ends up smaller than what was read from urandom.
+  dd if=/dev/urandom bs=1024 count="$BLOCK_SIZE" 2>/dev/null | tr -dc 'a-zA-Z0-9 \n' > "$DIR/index.html"
+
+  # Append the <title> and <main> markup that the Perl script's regexes look for.
+  echo "<html><head><title>Site $i</title></head><body><main><p>Searchable content here for keyword_$i. Lorem ipsum text follows.</p></main></body></html>" >> "$DIR/index.html"
+
+  # Report progress after every 100th page.
+  if [ $((i % 100)) -eq 0 ]; then
+    echo "Created $i files..."
+  fi
+  i=$((i + 1))
+done
+echo "Done! $TOTAL directories created with valid text."