Move all awk functions to separate files

2026-03-07 19:42:37 +01:00
parent 3258616282
commit f580ed9cab
17 changed files with 838 additions and 777 deletions
@@ -0,0 +1,14 @@
+BEGIN { in_bq = 0 }
+/^>[[:space:]]?/ {
+    if (!in_bq) { print "<blockquote>"; in_bq = 1 }
+    sub(/^>[[:space:]]?/, "", $0)
+    print $0
+    next
+}
+{
+    if (in_bq) { print "</blockquote>"; in_bq = 0 }
+    print
+}
+END {
+    if (in_bq) print "</blockquote>"
+}
@@ -0,0 +1,46 @@
+function cap(s) { return toupper(substr(s, 1, 1)) tolower(substr(s, 2)) }
+BEGIN { count = 0 }
+{ lines[++count] = $0 }
+END {
+    i = 1
+    while (i <= count) {
+        if (lines[i] == "<blockquote>") {
+            j = i + 1
+            while (j <= count && lines[j] != "</blockquote>") j++
+            if (j <= count) {
+                first = ""
+                first_idx = 0
+                for (k = i + 1; k < j; k++) {
+                    if (lines[k] != "") {
+                        first = lines[k]
+                        first_idx = k
+                        break
+                    }
+                }
+                if (first ~ /^\[![A-Za-z]+\]$/) {
+                    kind = first
+                    sub(/^\[!/, "", kind)
+                    sub(/\]$/, "", kind)
+                    lkind = tolower(kind)
+                    if (lkind == "note" || lkind == "tip" || lkind == "important" || lkind == "warning" || lkind == "caution") {
+                        print "<div class=\"admonition admonition-" lkind "\">"
+                        print "<p class=\"admonition-title\">" cap(lkind) "</p>"
+                        has_body = 0
+                        for (k = first_idx + 1; k < j; k++) {
+                            if (lines[k] != "") {
+                                print "<p>" lines[k] "</p>"
+                                has_body = 1
+                            }
+                        }
+                        if (!has_body) print "<p></p>"
+                        print "</div>"
+                        i = j + 1
+                        continue
+                    }
+                }
+            }
+        }
+        print lines[i]
+        i++
+    }
+}
@@ -0,0 +1,5 @@
+{
+    if ($0 == "" && prev == "") print "<br />"
+    else print $0
+    prev = $0
+}
@@ -0,0 +1,27 @@
+BEGIN { in_fence = 0; first_line = 0 }
+{
+    if (!in_fence && $0 ~ /^```/) {
+        in_fence = 1
+        first_line = 1
+        next
+    }
+    if (in_fence && $0 ~ /^```[[:space:]]*$/) {
+        print "</code></pre>"
+        in_fence = 0
+        next
+    }
+    if (in_fence) {
+        if (first_line) {
+            first_line = 0
+            if ($0 == "") next
+            print "<pre><code>" $0
+        } else {
+            print
+        }
+    } else {
+        print
+    }
+}
+END {
+    if (in_fence) print "</code></pre>"
+}
@@ -4,6 +4,34 @@ function title_from_name(name) {
    return name
 }

+function compare_paths(p1, p2,    parts1, parts2, n1, n2, i, name1, name2, lname1, lname2, w1, w2) {
+    n1 = split(p1, parts1, "/")
+    n2 = split(p2, parts2, "/")
+    for (i = 1; i <= n1 && i <= n2; i++) {
+        name1 = parts1[i]
+        name2 = parts2[i]
+        if (i == n1) gsub(/\.md$/, "", name1)
+        if (i == n2) gsub(/\.md$/, "", name2)
+        lname1 = tolower(name1)
+        lname2 = tolower(name2)
+
+        if (lname1 == "index" && i == n1 && lname2 != "index") return -1
+        if (lname2 == "index" && i == n2 && lname1 != "index") return 1
+
+        w1 = (lname1 in custom_order ? custom_order[lname1] : 999999)
+        w2 = (lname2 in custom_order ? custom_order[lname2] : 999999)
+
+        if (w1 < w2) return -1
+        if (w1 > w2) return 1
+
+        if (lname1 < lname2) return -1
+        if (lname1 > lname2) return 1
+    }
+    if (n1 < n2) return -1
+    if (n1 > n2) return 1
+    return 0
+}
+
 BEGIN {
    n_dlines = split(dinfo, dlines, "\n")
    for (i = 1; i <= n_dlines; i++) {
@@ -39,33 +67,6 @@ BEGIN {
        has_index[dir] = 1
    }
 }
-function compare_paths(p1, p2,    parts1, parts2, n1, n2, i, name1, name2, lname1, lname2, w1, w2) {
-    n1 = split(p1, parts1, "/")
-    n2 = split(p2, parts2, "/")
-    for (i = 1; i <= n1 && i <= n2; i++) {
-        name1 = parts1[i]
-        name2 = parts2[i]
-        if (i == n1) gsub(/\.md$/, "", name1)
-        if (i == n2) gsub(/\.md$/, "", name2)
-        lname1 = tolower(name1)
-        lname2 = tolower(name2)
-
-        if (lname1 == "index" && i == n1 && lname2 != "index") return -1
-        if (lname2 == "index" && i == n2 && lname1 != "index") return 1
-
-        w1 = (lname1 in custom_order ? custom_order[lname1] : 999999)
-        w2 = (lname2 in custom_order ? custom_order[lname2] : 999999)
-
-        if (w1 < w2) return -1
-        if (w1 > w2) return 1
-
-        if (lname1 < lname2) return -1
-        if (lname1 > lname2) return 1
-    }
-    if (n1 < n2) return -1
-    if (n1 > n2) return 1
-    return 0
-}

 END {
    for (i = 0; i < count - 1; i++) {
@@ -78,7 +79,6 @@ END {
        }
    }

-
    print "<ul>"
    if ("index.md" in all_paths) {
        print "<li><a href=\"/index.html\">Home</a></li>"
@@ -0,0 +1,65 @@
+function strip_markdown(s) {
+    gsub(/<[^>]+>/, "", s)
+    gsub(/[*_`~]/, "", s)
+    gsub(/[\[\]]/, "", s)
+    gsub(/\([^\)]*\)/, "", s)
+    sub(/^[[:space:]]*/, "", s)
+    sub(/[[:space:]]*$/, "", s)
+    return s
+}
+BEGIN {
+    has_prev = 0
+    in_pre = 0
+}
+{
+    if ($0 ~ /^<pre><code>/) {
+        in_pre = 1
+        if (has_prev && prev != "") { print prev; has_prev = 0 }
+        print
+        next
+    }
+    if (in_pre) {
+        if ($0 ~ /<\/code><\/pre>/) in_pre = 0
+        print
+        next
+    }
+
+    if ($0 ~ /^=+$/ && has_prev && prev != "" && prev !~ /^<[a-z]/) {
+        print "<h1 id=\"" strip_markdown(prev) "\">" prev "</h1>"
+        has_prev = 0
+    } else if ($0 ~ /^-+$/ && has_prev && prev != "" && prev !~ /^<[a-z]/) {
+        print "<h2 id=\"" strip_markdown(prev) "\">" prev "</h2>"
+        has_prev = 0
+    } else {
+        if (has_prev) {
+            line = prev
+            if (line ~ /^# /) {
+                sub(/^# /, "", line); print "<h1 id=\"" strip_markdown(line) "\">" line "</h1>"
+            } else if (line ~ /^## /) {
+                sub(/^## /, "", line); print "<h2 id=\"" strip_markdown(line) "\">" line "</h2>"
+            } else if (line ~ /^### /) {
+                sub(/^### /, "", line); print "<h3 id=\"" strip_markdown(line) "\">" line "</h3>"
+            } else if (line ~ /^#### /) {
+                sub(/^#### /, "", line); print "<h4 id=\"" strip_markdown(line) "\">" line "</h4>"
+            } else if (line ~ /^##### /) {
+                sub(/^##### /, "", line); print "<h5 id=\"" strip_markdown(line) "\">" line "</h5>"
+            } else if (line ~ /^###### /) {
+                sub(/^###### /, "", line); print "<h6 id=\"" strip_markdown(line) "\">" line "</h6>"
+            } else {
+                print prev
+            }
+        }
+        prev = $0
+        has_prev = 1
+    }
+}
+END {
+    if (has_prev) {
+        line = prev
+        if (line ~ /^# /) {
+            sub(/^# /, "", line); print "<h1 id=\"" strip_markdown(line) "\">" line "</h1>"
+        } else {
+            print prev
+        }
+    }
+}
@@ -0,0 +1,9 @@
+BEGIN { in_code = 0 }
+/^	|    / {
+    if (!in_code) { print "<pre><code>"; in_code = 1 }
+    sub(/^	|    /, "", $0)
+    gsub(/&/, "&amp;"); gsub(/</, "&lt;"); gsub(/>/, "&gt;")
+    print; next
+}
+{ if (in_code) { print "</code></pre>"; in_code = 0 } print }
+END { if (in_code) print "</code></pre>" }
@@ -0,0 +1,66 @@
+BEGIN {
+    depth = 0
+    in_pre = 0
+}
+
+{
+    if ($0 ~ /^<pre>/) in_pre = 1
+    if (in_pre) {
+        while (depth > 0) { print "</" cur_type[depth] ">"; depth-- }
+        print
+        if ($0 ~ /<\/pre>/) in_pre = 0
+        next
+    }
+
+    line = $0
+    type = ""
+    # match list marker and its preceding spaces
+    if (line ~ /^[ \t]*[*+-] /) {
+        type = "ul"
+        match(line, /^[ \t]*[*+-] /)
+        marker_len = RLENGTH
+    } else if (line ~ /^[ \t]*[0-9]+\. /) {
+        type = "ol"
+        match(line, /^[ \t]*[0-9]+\. /)
+        marker_len = RLENGTH
+    }
+
+    if (type != "") {
+        content = substr(line, marker_len + 1)
+        # get indentation level
+        match(line, /^[ \t]*/)
+        indent = RLENGTH
+        
+        if (depth == 0 || indent > cur_indent[depth]) {
+            depth++
+            cur_indent[depth] = indent
+            cur_type[depth] = type
+            print "<" type ">"
+        } else {
+            while (depth > 1 && indent < cur_indent[depth]) {
+                print "</" cur_type[depth] ">"
+                depth--
+            }
+            if (type != cur_type[depth]) {
+                print "</" cur_type[depth] ">"
+                cur_type[depth] = type
+                print "<" type ">"
+            }
+        }
+
+        print "<li>" content "</li>"
+    } else {
+        while (depth > 0) {
+            print "</" cur_type[depth] ">"
+            depth--
+        }
+        print line
+    }
+}
+
+END {
+    while (depth > 0) {
+        print "</" cur_type[depth] ">"
+        depth--
+    }
+}
@@ -119,11 +119,35 @@ function css_highlight_line(line,    m, prop, val) {
        return "<span class=\"tok-punc\">}</span>"
    }

-    if (match(line, /^([[:space:]]*)(--?[A-Za-z0-9_-]+)([[:space:]]*:[[:space:]]*)([^;]*)(;?[[:space:]]*)$/, m)) {
-        prop = "<span class=\"tok-prop\">" m[2] "</span>"
-        gsub(/var\(--[A-Za-z0-9_-]+\)/, "<span class=\"tok-var\">&</span>", m[4])
-        val = "<span class=\"tok-val\">" m[4] "</span>"
-        return m[1] prop m[3] val m[5]
+    if (line ~ /^[[:space:]]*--?[A-Za-z0-9_-]+[[:space:]]*:[[:space:]]*[^;]*;?[[:space:]]*$/) {
+        match(line, /:[[:space:]]*/)
+        sep_pos = RSTART
+        sep_len = RLENGTH
+        
+        pre_sep = substr(line, 1, sep_pos - 1)
+        sep = substr(line, sep_pos, sep_len)
+        post_sep = substr(line, sep_pos + sep_len)
+        
+        match(pre_sep, /--?[A-Za-z0-9_-]+/)
+        prop_pos = RSTART
+        prop_len = RLENGTH
+        
+        indent = substr(pre_sep, 1, prop_pos - 1)
+        prop_name = substr(pre_sep, prop_pos, prop_len)
+        
+        if (match(post_sep, /;[[:space:]]*$/)) {
+            val_part = substr(post_sep, 1, RSTART - 1)
+            suffix = substr(post_sep, RSTART)
+        } else {
+            val_part = post_sep
+            suffix = ""
+        }
+        
+        prop = "<span class=\"tok-prop\">" prop_name "</span>"
+        gsub(/var\(--[A-Za-z0-9_-]+\)/, "<span class=\"tok-var\">&</span>", val_part)
+        val = "<span class=\"tok-val\">" val_part "</span>"
+        
+        return indent prop sep val suffix
    }

    return line
@@ -0,0 +1,173 @@
+BEGIN {
+    in_pre = 0
+}
+
+{
+    if ($0 ~ /<pre>/) {
+        in_pre = 1
+    }
+    
+    if (in_pre) {
+        print
+        if ($0 ~ /<\/pre>/) {
+            in_pre = 0
+        }
+        next
+    }
+
+    line = $0
+
+    # automatic links
+    while (match(line, /<https?:\/\/[^>]+>/)) {
+        start = RSTART; len = RLENGTH
+        url = substr(line, start + 1, len - 2)
+        repl = "<a href=\"" url "\">" url "</a>"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+
+    # automatic email address links
+    while (match(line, /<[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Za-z]{2,}>/)) {
+        start = RSTART; len = RLENGTH
+        email = substr(line, start + 1, len - 2)
+        repl = "<a href=\"mailto:" email "\">" email "</a>"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+
+    # force-inline image syntax (double bang)
+    while (match(line, /!!\[[^\]]*\]\([^\)]+ "[^"]*"\)/)) {
+        start = RSTART; len = RLENGTH
+        token = substr(line, start, len)
+        match(token, /\[[^\]]*\]/); alt = substr(token, RSTART + 1, RLENGTH - 2)
+        match(token, /"[^"]*"/); title = substr(token, RSTART + 1, RLENGTH - 2)
+        match(token, /\([^\)]+/); inner = substr(token, RSTART + 1, RLENGTH - 1)
+        sub(/[[:space:]]*"[^"]*"/, "", inner); src = inner
+        repl = "<img data-force-inline=\"1\" alt=\"" alt "\" src=\"" src "\" title=\"" title "\" />"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+    while (match(line, /!!\[[^\]]*\]\([^\)]+\)/)) {
+        start = RSTART; len = RLENGTH
+        token = substr(line, start, len)
+        match(token, /\[[^\]]*\]/); alt = substr(token, RSTART + 1, RLENGTH - 2)
+        match(token, /\([^\)]+/); src = substr(token, RSTART + 1, RLENGTH - 1)
+        repl = "<img data-force-inline=\"1\" alt=\"" alt "\" src=\"" src "\" />"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+
+    # inline image
+    while (match(line, /!\[[^\]]*\]\([^\)]+ "[^"]*"\)/)) {
+        start = RSTART; len = RLENGTH
+        if (start > 1 && substr(line, start - 1, 1) == "\\") break
+        token = substr(line, start, len)
+        match(token, /\[[^\]]*\]/); alt = substr(token, RSTART + 1, RLENGTH - 2)
+        match(token, /"[^"]*"/); title = substr(token, RSTART + 1, RLENGTH - 2)
+        match(token, /\([^\)]+/); inner = substr(token, RSTART + 1, RLENGTH - 1)
+        sub(/[[:space:]]*"[^"]*"/, "", inner); src = inner
+        repl = "<img alt=\"" alt "\" src=\"" src "\" title=\"" title "\" />"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+    while (match(line, /!\[[^\]]*\]\([^\)]+\)/)) {
+        start = RSTART; len = RLENGTH
+        if (start > 1 && substr(line, start - 1, 1) == "\\") break
+        token = substr(line, start, len)
+        match(token, /\[[^\]]*\]/); alt = substr(token, RSTART + 1, RLENGTH - 2)
+        match(token, /\([^\)]+/); src = substr(token, RSTART + 1, RLENGTH - 1)
+        repl = "<img alt=\"" alt "\" src=\"" src "\" />"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+
+    # inline link
+    while (match(line, /\[[^\]]*\]\([^\)]+ "[^"]*"\)/)) {
+        start = RSTART; len = RLENGTH
+        if (start > 1 && (substr(line, start - 1, 1) == "\\" || substr(line, start - 1, 1) == "!")) break
+        token = substr(line, start, len)
+        match(token, /\[[^\]]*\]/); text = substr(token, RSTART + 1, RLENGTH - 2)
+        match(token, /"[^"]*"/); title = substr(token, RSTART + 1, RLENGTH - 2)
+        match(token, /\([^\)]+/); inner = substr(token, RSTART + 1, RLENGTH - 1)
+        sub(/[[:space:]]*"[^"]*"/, "", inner); href = inner
+        repl = "<a href=\"" href "\" title=\"" title "\">" text "</a>"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+    while (match(line, /\[[^\]]*\]\([^\)]+\)/)) {
+        start = RSTART; len = RLENGTH
+        if (start > 1 && (substr(line, start - 1, 1) == "\\" || substr(line, start - 1, 1) == "!")) break
+        token = substr(line, start, len)
+        match(token, /\[[^\]]*\]/); text = substr(token, RSTART + 1, RLENGTH - 2)
+        match(token, /\([^\)]+/); href = substr(token, RSTART + 1, RLENGTH - 1)
+        repl = "<a href=\"" href "\">" text "</a>"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+
+    # MFM font syntax
+    while (match(line, /\$\[font\.serif [^\]]+\]/)) {
+        start = RSTART; len = RLENGTH
+        content = substr(line, start + 13, len - 14)
+        line = substr(line, 1, start - 1) "<span style=\"font-family: serif;\">" content "</span>" substr(line, start + len)
+    }
+    while (match(line, /\$\[font\.monospace [^\]]+\]/)) {
+        start = RSTART; len = RLENGTH
+        content = substr(line, start + 17, len - 18)
+        line = substr(line, 1, start - 1) "<span style=\"font-family: monospace;\">" content "</span>" substr(line, start + len)
+    }
+    while (match(line, /\$\[font\.sans [^\]]+\]/)) {
+        start = RSTART; len = RLENGTH
+        content = substr(line, start + 12, len - 13)
+        line = substr(line, 1, start - 1) "<span style=\"font-family: sans-serif;\">" content "</span>" substr(line, start + len)
+    }
+
+    # Bold, Italic, Strikethrough (BRE-like logic in AWK)
+    # Strong Bold **
+    while (match(line, /\*\*[^*]+\*\*/)) {
+        start = RSTART; len = RLENGTH
+        content = substr(line, start + 2, len - 4)
+        repl = "<strong>" content "</strong>"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+    # Strong Bold __
+    while (match(line, /__[^_]+__/)) {
+        start = RSTART; len = RLENGTH
+        content = substr(line, start + 2, len - 4)
+        repl = "<strong>" content "</strong>"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+    # Italic *
+    while (match(line, /\*[^*]+\*/)) {
+        start = RSTART; len = RLENGTH
+        content = substr(line, start + 1, len - 2)
+        repl = "<em>" content "</em>"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+    # Italic _
+    while (match(line, /_[^_]+_/)) {
+        start = RSTART; len = RLENGTH
+        if (start > 1 && substr(line, start - 1, 1) == "\\") break
+        content = substr(line, start + 1, len - 2)
+        repl = "<em>" content "</em>"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+    # Strikethrough ~~
+    while (match(line, /~~[^~]+~~/)) {
+        start = RSTART; len = RLENGTH
+        content = substr(line, start + 2, len - 4)
+        repl = "<strike>" content "</strike>"
+        line = substr(line, 1, start - 1) repl substr(line, start + len)
+    }
+
+    # special characters
+    if (line !~ /&[A-Za-z0-9#]+;/) {
+        gsub(/&/, "&amp;", line)
+    }
+    
+    p = 1
+    while (match(substr(line, p), /</)) {
+        start = p + RSTART - 1
+        next_char = substr(line, start + 1, 1)
+        if (next_char !~ /^[\/A-Za-z]/) {
+            line = substr(line, 1, start - 1) "&lt;" substr(line, start + 1)
+            p = start + 4
+        } else {
+            p = start + 1
+        }
+    }
+
+    print line
+}
@@ -0,0 +1,85 @@
+function mask(s,    t) {
+    t = s
+    gsub(/\*/, "\034P0\034", t)
+    gsub(/_/, "\034P1\034", t)
+    gsub(/`/, "\034P2\034", t)
+    gsub(/\[/, "\034P3\034", t)
+    gsub(/\]/, "\034P4\034", t)
+    gsub(/\(/, "\034P5\034", t)
+    gsub(/\)/, "\034P6\034", t)
+    gsub(/!/, "\034P7\034", t)
+    gsub(/\$/, "\034P8\034", t)
+    gsub(/#/, "\034P9\034", t)
+    gsub(/\+/, "\034P10\034", t)
+    gsub(/-/, "\034P11\034", t)
+    gsub(/\\/, "\034P12\034", t)
+    gsub(/</, "\034P13\034", t)
+    gsub(/>/, "\034P14\034", t)
+    return t
+}
+{
+    # backslash escapes
+    gsub(/\\\*/, "\034P0\034")
+    gsub(/\\_/, "\034P1\034")
+    gsub(/\\`/, "\034P2\034")
+    gsub(/\\\[/, "\034P3\034")
+    gsub(/\\\]/, "\034P4\034")
+    gsub(/\\\(/, "\034P5\034")
+    gsub(/\\\)/, "\034P6\034")
+    gsub(/\\!/, "\034P7\034")
+    gsub(/\\\$/, "\034P8\034")
+    gsub(/\\#/, "\034P9\034")
+    gsub(/\\\+/, "\034P10\034")
+    gsub(/\\\-/, "\034P11\034")
+    gsub(/\\\\/, "\034P12\034")
+    gsub(/\\</, "\034P13\034")
+    gsub(/\\>/, "\034P14\034")
+
+    # inline code (1 or 2 backticks)
+    line = $0
+    if (line ~ /^```/) {
+        print line
+        next
+    }
+    out = ""
+    p = 1
+    while (match(substr(line, p), /`+/)) {
+        pstart = p + RSTART - 1
+        plen = RLENGTH
+        if (plen >= 3) {
+            out = out substr(line, p, pstart - p + plen)
+            p = pstart + plen
+            continue
+        }
+
+        # Found 1 or 2 backticks at pstart
+        # Search for closing marker
+        marker = substr(line, pstart, plen)
+        tail = substr(line, pstart + plen)
+        mpos = index(tail, marker)
+        if (mpos > 0) {
+            # Check if it is followed by more backticks
+            if (substr(tail, mpos + plen, 1) == "`") {
+                # Not a match, treat as literal
+                out = out substr(line, p, pstart - p + plen)
+                p = pstart + plen
+                continue
+            }
+            
+            # Found match!
+            content = substr(tail, 1, mpos - 1)
+            out = out substr(line, p, pstart - p)
+            if (plen == 2 && substr(content, 1, 1) == " " && substr(content, length(content), 1) == " ") {
+                content = substr(content, 2, length(content) - 2)
+            }
+            out = out "<code>" mask(content) "</code>"
+            p = pstart + plen + mpos + plen - 1
+        } else {
+            # No closing marker, treat as literal
+            out = out substr(line, p, pstart - p + plen)
+            p = pstart + plen
+        }
+    }
+    out = out substr(line, p)
+    print out
+}
@@ -0,0 +1,52 @@
+function find_unescaped_tag(s, tag,    p, off, pos) {
+    p = 1
+    while (1) {
+        off = index(substr(s, p), tag)
+        if (off == 0) return 0
+        pos = p + off - 1
+        if (pos == 1 || substr(s, pos - 1, 1) != "\\") return pos
+        p = pos + 1
+    }
+}
+
+function mask_plain(s,    t) {
+    t = s
+    gsub(/\*/, "\034P0\034", t)
+    gsub(/_/, "\034P1\034", t)
+    gsub(/`/, "\034P2\034", t)
+    gsub(/\[/, "\034P3\034", t)
+    gsub(/\]/, "\034P4\034", t)
+    gsub(/\(/, "\034P5\034", t)
+    gsub(/\)/, "\034P6\034", t)
+    gsub(/!/, "\034P7\034", t)
+    gsub(/\$/, "\034P8\034", t)
+    return t
+}
+BEGIN { in_plain = 0 }
+{
+    line = $0
+    out = ""
+    while (1) {
+        if (!in_plain) {
+            pos = find_unescaped_tag(line, "<plain>")
+            if (pos == 0) {
+                out = out line
+                break
+            }
+            out = out substr(line, 1, pos - 1) "<mfmplain>"
+            line = substr(line, pos + 7)
+            in_plain = 1
+        } else {
+            pos = find_unescaped_tag(line, "</plain>")
+            if (pos == 0) {
+                out = out mask_plain(line)
+                line = ""
+                break
+            }
+            out = out mask_plain(substr(line, 1, pos - 1)) "</mfmplain>"
+            line = substr(line, pos + 8)
+            in_plain = 0
+        }
+    }
+    print out
+}
@@ -0,0 +1,43 @@
+BEGIN {
+    in_p = 0
+    in_pre = 0
+}
+
+{
+    if ($0 ~ /^<pre>/) in_pre = 1
+    
+    if (in_pre) {
+        if (in_p) { print "</p>"; in_p = 0 }
+        print
+        if ($0 ~ /<\/pre>/) in_pre = 0
+        next
+    }
+
+    if ($0 ~ /^<\/?(div|table|p|[ou]l|h[1-6]|[bh]r|blockquote|li)/) {
+        if (in_p) {
+            print "</p>"
+            in_p = 0
+        }
+        print
+        next
+    }
+
+    if ($0 == "") {
+        if (in_p) {
+            print "</p>"
+            in_p = 0
+        }
+        print
+        next
+    }
+
+    if (!in_p) {
+        print "<p>"
+        in_p = 1
+    }
+    print
+}
+
+END {
+    if (in_p) print "</p>"
+}
@@ -0,0 +1,143 @@
+function trim(s) {
+    sub(/^[[:space:]]+/, "", s)
+    sub(/[[:space:]]+$/, "", s)
+    return s
+}
+
+function is_table_row(line, t) {
+    t = line
+    return (t ~ /^[[:space:]]*\|/ && t ~ /\|[[:space:]]*$/)
+}
+
+function is_table_sep(line, t) {
+    if (!is_table_row(line)) return 0
+    t = line
+    gsub(/[|:\-[:space:]]/, "", t)
+    return (t == "" && line ~ /-/)
+}
+
+function split_row(line, out, n, i, raw) {
+    raw = line
+    sub(/^[[:space:]]*\|/, "", raw)
+    sub(/\|[[:space:]]*$/, "", raw)
+    n = split(raw, out, /\|/)
+    for (i = 1; i <= n; i++) out[i] = trim(out[i])
+    return n
+}
+
+function align_for(sep, t) {
+    t = trim(sep)
+    if (t ~ /^:-+:$/) return "center"
+    if (t ~ /^:-+$/) return "left"
+    if (t ~ /^-+:$/) return "right"
+    return ""
+}
+
+function render_cell(cell, inner) {
+    inner = trim(cell)
+    if (inner ~ /^```.*```$/) {
+        sub(/^```[[:space:]]*/, "", inner)
+        sub(/[[:space:]]*```$/, "", inner)
+        return "<pre><code>" inner "</code></pre>"
+    }
+    return inner
+}
+
+BEGIN { count = 0 }
+{ lines[++count] = $0 }
+
+END {
+    in_pre = 0
+    i = 1
+    while (i <= count) {
+        if (lines[i] ~ /^<pre><code>/) {
+            in_pre = 1
+            print lines[i]
+            i++
+            continue
+        }
+        if (in_pre) {
+            print lines[i]
+            if (lines[i] ~ /^<\/code><\/pre>/) in_pre = 0
+            i++
+            continue
+        }
+
+        if (i < count && is_table_row(lines[i]) && is_table_sep(lines[i + 1])) {
+            n_header = split_row(lines[i], header)
+            n_sep = split_row(lines[i + 1], sep)
+            n_cols = (n_header > n_sep ? n_header : n_sep)
+
+            print "<table>"
+            print "<thead>"
+            print "<tr>"
+            for (c = 1; c <= n_cols; c++) {
+                cell = (c <= n_header ? render_cell(header[c]) : "")
+                a = (c <= n_sep ? align_for(sep[c]) : "")
+                if (a != "") print "<th style=\"text-align: " a ";\">" cell "</th>"
+                else print "<th>" cell "</th>"
+            }
+            print "</tr>"
+            print "</thead>"
+
+            j = i + 2
+            print "<tbody>"
+            while (j <= count && is_table_row(lines[j])) {
+                n_body = split_row(lines[j], body)
+                print "<tr>"
+                for (c = 1; c <= n_cols; c++) {
+                    cell = (c <= n_body ? render_cell(body[c]) : "")
+                    a = (c <= n_sep ? align_for(sep[c]) : "")
+                    if (a != "") print "<td style=\"text-align: " a ";\">" cell "</td>"
+                    else print "<td>" cell "</td>"
+                }
+                print "</tr>"
+                j++
+            }
+            print "</tbody>"
+            print "</table>"
+
+            i = j
+            continue
+        }
+
+        if (is_table_sep(lines[i]) && i < count && is_table_row(lines[i + 1])) {
+            n_sep = split_row(lines[i], sep)
+            n_cols = n_sep
+
+            print "<table>"
+            print "<thead>"
+            print "<tr>"
+            for (c = 1; c <= n_cols; c++) {
+                a = align_for(sep[c])
+                if (a != "") print "<th style=\"text-align: " a ";\"></th>"
+                else print "<th></th>"
+            }
+            print "</tr>"
+            print "</thead>"
+
+            j = i + 1
+            print "<tbody>"
+            while (j <= count && is_table_row(lines[j])) {
+                n_body = split_row(lines[j], body)
+                print "<tr>"
+                for (c = 1; c <= n_cols; c++) {
+                    cell = (c <= n_body ? render_cell(body[c]) : "")
+                    a = (c <= n_sep ? align_for(sep[c]) : "")
+                    if (a != "") print "<td style=\"text-align: " a ";\">" cell "</td>"
+                    else print "<td>" cell "</td>"
+                }
+                print "</tr>"
+                j++
+            }
+            print "</tbody>"
+            print "</table>"
+
+            i = j
+            continue
+        }
+
+        print lines[i]
+        i++
+    }
+}
@@ -0,0 +1,10 @@
+BEGIN { done = 0 }
+/^title[[:space:]]*=/ {
+    print "title = \"" new_title "\""
+    done = 1
+    next
+}
+{ print }
+END {
+    if (!done) print "title = \"" new_title "\""
+}
@@ -82,18 +82,7 @@ create_new_site() {
    printf "# _kewt_ website\n" > "$new_dir/index.md"

    if [ -n "$new_title" ]; then
-        awk -v new_title="$new_title" '
-            BEGIN { done = 0 }
-            /^title[[:space:]]*=/ {
-                print "title = \"" new_title "\""
-                done = 1
-                next
-            }
-            { print }
-            END {
-                if (!done) print "title = \"" new_title "\""
-            }
-        ' "$new_dir/site.conf" > "$new_dir/site.conf.tmp" && mv "$new_dir/site.conf.tmp" "$new_dir/site.conf"
+        awk -v new_title="$new_title" -f "$awk_dir/update_site_conf.awk" "$new_dir/site.conf" > "$new_dir/site.conf.tmp" && mv "$new_dir/site.conf.tmp" "$new_dir/site.conf"
    fi

    echo "Created new site at '$new_dir'."
@@ -101,7 +90,7 @@ create_new_site() {
 }

 generate_nav() {
-    dinfo=$(find "$1" -not -path '*/.*' | sort | awk -v src="$1" -f "$awk_dir/collect_dir_info.awk")
+    dinfo=$(find "$1" ! -path '*/.*' | sort | awk -v src="$1" -f "$awk_dir/collect_dir_info.awk")
    find "$1" -name "*.md" | sort | awk -v src="$1" -v single_file_index="$single_file_index" -v flatten="$flatten" -v order="$order" -v dinfo="$dinfo" -f "$awk_dir/generate_sidebar.awk"
 }

@@ -314,9 +303,9 @@ find "$src" -type d | sort | while read -r dir; do

    if [ ! -f "$dir/index.md" ]; then
        if [ "$single_file_index" = "true" ]; then
-            md_count=$(find "$dir" -maxdepth 1 -name "*.md" | wc -l)
+            md_count=$(find "$dir" ! -name "$(basename "$dir")" -prune -name "*.md" | wc -l)
            if [ "$md_count" -eq 1 ]; then
-                md_file=$(find "$dir" -maxdepth 1 -name "*.md")
+                md_file=$(find "$dir" ! -name "$(basename "$dir")" -prune -name "*.md")
                render_markdown "$md_file" > "$out_dir/index.html"
                continue
            fi
@@ -327,7 +316,7 @@ find "$src" -type d | sort | while read -r dir; do
        [ -z "$display_dir" ] && display_dir="/"
        echo "# Index of $display_dir" > "$temp_index"
        echo "" >> "$temp_index"
-        find "$dir" -maxdepth 1 -not -path '*/.*' -not -path "$dir" | sort | while read -r entry; do
+        find "$dir" ! -name "$(basename "$dir")" -prune ! -path '*/.*' | sort | while read -r entry; do
            name="${entry##*/}"
            case "$name" in
                template.html|site.conf|style.css|index.md) continue ;;
@@ -359,7 +348,7 @@ find "$src" -type f | sort | while IFS= read -r file; do
    esac

    if [ "$single_file_index" = "true" ] && [ "${file%.md}" != "$file" ] && [ ! -f "$(dirname "$file")/index.md" ]; then
-        md_count=$(find "$(dirname "$file")" -maxdepth 1 -name "*.md" | wc -l)
+        md_count=$(find "$(dirname "$file")" ! -name "$(basename "$(dirname "$file")")" -prune -name "*.md" | wc -l)
        [ "$md_count" -eq 1 ] && continue
    fi

@@ -3,34 +3,6 @@
 script_dir=$(CDPATH= cd -- "$(dirname -- "$0")" && pwd)
 awk_dir="$script_dir/awk"

-sed_ere() {
-    if sed -E '' </dev/null >/dev/null 2>&1; then
-        sed -E "$@"
-    else
-        sed -r "$@"
-    fi
-}
-
-sed_ere_inplace() {
-    script="$1"
-    file="$2"
-    tmp="${file}.tmp.$$"
-    sed_ere "$script" "$file" > "$tmp" && mv "$tmp" "$file" || {
-        rm -f "$tmp"
-        return 1
-    }
-}
-
-sed_ere_inplace_n() {
-    script="$1"
-    file="$2"
-    tmp="${file}.tmp.$$"
-    sed_ere -n "$script" "$file" > "$tmp" && mv "$tmp" "$file" || {
-        rm -f "$tmp"
-        return 1
-    }
-}
-
 sed_inplace() {
    script="$1"
    file="$2"
@@ -44,711 +16,49 @@ sed_inplace() {
 temp_file="/tmp/markdown.$$"
 cat "$@" > "$temp_file"

-# backslash escapes for literal characters and inline code masking
-awk '
-function mask(s,    t) {
-    t = s
-    gsub(/\*/, "\034P0\034", t)
-    gsub(/_/, "\034P1\034", t)
-    gsub(/`/, "\034P2\034", t)
-    gsub(/\[/, "\034P3\034", t)
-    gsub(/\]/, "\034P4\034", t)
-    gsub(/\(/, "\034P5\034", t)
-    gsub(/\)/, "\034P6\034", t)
-    gsub(/!/, "\034P7\034", t)
-    gsub(/\$/, "\034P8\034", t)
-    gsub(/#/, "\034P9\034", t)
-    gsub(/\+/, "\034P10\034", t)
-    gsub(/-/, "\034P11\034", t)
-    gsub(/\\/, "\034P12\034", t)
-    gsub(/</, "\034P13\034", t)
-    gsub(/>/, "\034P14\034", t)
-    return t
-}
-{
-    # backslash escapes
-    gsub(/\\\*/, "\034P0\034")
-    gsub(/\\_/, "\034P1\034")
-    gsub(/\\`/, "\034P2\034")
-    gsub(/\\\[/, "\034P3\034")
-    gsub(/\\\]/, "\034P4\034")
-    gsub(/\\\(/, "\034P5\034")
-    gsub(/\\\)/, "\034P6\034")
-    gsub(/\\!/, "\034P7\034")
-    gsub(/\\\$/, "\034P8\034")
-    gsub(/\\#/, "\034P9\034")
-    gsub(/\\\+/, "\034P10\034")
-    gsub(/\\\-/, "\034P11\034")
-    gsub(/\\\\/, "\034P12\034")
-    gsub(/\\</, "\034P13\034")
-    gsub(/\\>/, "\034P14\034")
-
-    # inline code (1 or 2 backticks)
-    line = $0
-    if (line ~ /^```/) {
-        print line
-        next
-    }
-    out = ""
-    p = 1
-    while (match(substr(line, p), /`+/)) {
-        pstart = p + RSTART - 1
-        plen = RLENGTH
-        if (plen >= 3) {
-            out = out substr(line, p, pstart - p + plen)
-            p = pstart + plen
-            continue
-        }
-
-        # Found 1 or 2 backticks at pstart
-        # Search for closing marker
-        marker = substr(line, pstart, plen)
-        tail = substr(line, pstart + plen)
-        mpos = index(tail, marker)
-        if (mpos > 0) {
-            # Check if it is followed by more backticks
-            if (substr(tail, mpos + plen, 1) == "`") {
-                # Not a match, treat as literal
-                out = out substr(line, p, pstart - p + plen)
-                p = pstart + plen
-                continue
-            }
-            
-            # Found match!
-            content = substr(tail, 1, mpos - 1)
-            out = out substr(line, p, pstart - p)
-            if (plen == 2 && substr(content, 1, 1) == " " && substr(content, length(content), 1) == " ") {
-                content = substr(content, 2, length(content) - 2)
-            }
-            out = out "<code>" mask(content) "</code>"
-            p = pstart + plen + mpos + plen - 1
-        } else {
-            # No closing marker, treat as literal
-            out = out substr(line, p, pstart - p + plen)
-            p = pstart + plen
-        }
-    }
-    out = out substr(line, p)
-    print out
-}' "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
-
-awk '
-
-function find_unescaped_tag(s, tag,    p, off, pos) {
-    p = 1
-    while (1) {
-        off = index(substr(s, p), tag)
-        if (off == 0) return 0
-        pos = p + off - 1
-        if (pos == 1 || substr(s, pos - 1, 1) != "\\") return pos
-        p = pos + 1
-    }
-}
-
-function mask_plain(s,    t) {
-    t = s
-    gsub(/\*/, "\034P0\034", t)
-    gsub(/_/, "\034P1\034", t)
-    gsub(/`/, "\034P2\034", t)
-    gsub(/\[/, "\034P3\034", t)
-    gsub(/\]/, "\034P4\034", t)
-    gsub(/\(/, "\034P5\034", t)
-    gsub(/\)/, "\034P6\034", t)
-    gsub(/!/, "\034P7\034", t)
-    gsub(/\$/, "\034P8\034", t)
-    return t
-}
-BEGIN { in_plain = 0 }
-{
-    line = $0
-    out = ""
-    while (1) {
-        if (!in_plain) {
-            pos = find_unescaped_tag(line, "<plain>")
-            if (pos == 0) {
-                out = out line
-                break
-            }
-            out = out substr(line, 1, pos - 1) "<mfmplain>"
-            line = substr(line, pos + 7)
-            in_plain = 1
-        } else {
-            pos = find_unescaped_tag(line, "</plain>")
-            if (pos == 0) {
-                out = out mask_plain(line)
-                line = ""
-                break
-            }
-            out = out mask_plain(substr(line, 1, pos - 1)) "</mfmplain>"
-            line = substr(line, pos + 8)
-            in_plain = 0
-        }
-    }
-    print out
-}
-' "$temp_file" > "$temp_file.plain.$$" && mv "$temp_file.plain.$$" "$temp_file"
+# Mask
+awk -f "$awk_dir/mask_inline_code.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
+awk -f "$awk_dir/mask_plain.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"

+# Reference links
+refs=$(cat "$@" | awk '/^\[[^\]]+\]: +/')
 IFS='
 '
-refs=$(sed_ere -n "/^\[.+\]: +/p" "$@")
-for ref in $refs
-do
-    ref_id=$(printf %s "$ref" | sed_ere -n "s/^\[(.+)\]: .*/\1/p" | tr -d '\n')
-    ref_url=$(printf %s "$ref" | sed_ere -n "s/^\[.+\]: (.+)/\1/p" | cut -d' ' -f1 | tr -d '\n')
-    ref_title=$(printf %s "$ref" | sed_ere -n "s/^\[.+\]: (.+) \"(.+)\"/\2/p" | sed 's@|@!@g' | tr -d '\n')
+for ref in $refs; do
+    ref_id=$(echo "$ref" | sed 's/^\[\(.*\)\]: .*/\1/')
+    ref_url=$(echo "$ref" | sed 's/^\[.*\]: \([^ ]*\).*/\1/')
+    ref_title=$(echo "$ref" | sed -n 's/^\[.*\]: [^ ]* "\(.*\)"/\1/p' | sed 's@|@!@g')
+    sed_inplace "s|!\[\([^]]*\)\]\[$ref_id\]|<img src=\"$ref_url\" title=\"$ref_title\" alt=\"\1\" />|g" "$temp_file"
+    sed_inplace "s|\[\([^]]*\)\]\[$ref_id\]|<a href=\"$ref_url\" title=\"$ref_title\">\1</a>|g" "$temp_file"
+    sed_inplace "s|!\[$ref_id\]\[\]|<img src=\"$ref_url\" title=\"$ref_title\" alt=\"$ref_id\" />|g" "$temp_file"
+    sed_inplace "s|\[$ref_id\]\[\]|<a href=\"$ref_url\" title=\"$ref_title\">$ref_id</a>|g" "$temp_file"
+done
+sed_inplace "/^\[[^\]]*\]: +/d" "$temp_file"

-    # reference-style image using the label
-    sed_ere_inplace "s|!\[([^]]+)\]\[($ref_id)\]|<img src=\"$ref_url\" title=\"$ref_title\" alt=\"\1\" />|g" "$temp_file"
-    # reference-style link using the label
-    sed_ere_inplace "s|\[([^]]+)\]\[($ref_id)\]|<a href=\"$ref_url\" title=\"$ref_title\">\1</a>|g" "$temp_file"
+# Blocks
+sed_inplace "s/^>!\[/> [!/g" "$temp_file"
+sed_inplace "s/^>\[!/> [!/g" "$temp_file"

-    # implicit reference-style
-    sed_ere_inplace "s|!\[($ref_id)\]\[\]|<img src=\"$ref_url\" title=\"$ref_title\" alt=\"\1\" />|g" "$temp_file"
-    # implicit reference-style
-    sed_ere_inplace "s|\[($ref_id)\]\[\]|<a href=\"$ref_url\" title=\"$ref_title\">\1</a>|g" "$temp_file"
+while grep '^>' "$temp_file" >/dev/null; do
+    awk -f "$awk_dir/blockquote.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
 done

-# delete the reference lines
-sed_ere_inplace "/^\[.+\]: +/d" "$temp_file"
-
-# normalize GitHub admonition shorthand in blockquotes
-sed_ere_inplace '
-/^>!\[/s/^>!\[/> [!/
-/^>\[!/s/^>\[!/> [!/
-s/^>([^[:space:]>])/> \1/
-' "$temp_file"
-
-# blockquotes
-# use grep to find all the nested blockquotes
-while grep '^> ' "$temp_file" >/dev/null
-do
-    sed_ere_inplace_n '
-/^$/b blockquote
-
-H
-$ b blockquote
-b
-
-:blockquote
-x
-s/(\n+)(> .*)/\1<blockquote>\n\2\n<\/blockquote>/ # wrap the tags in a blockquote
-p
-' "$temp_file"
-
-    sed_inplace '1 d' "$temp_file" # cleanup superfluous first line
-
-    # cleanup blank lines and remove subsequent blockquote characters
-    sed_ere_inplace '
-/^> /s/^> (.*)/\1/
-' "$temp_file"
-done
-
-# convert [!TYPE] blockquotes into admonition blocks
-awk '
-function cap(s) { return toupper(substr(s, 1, 1)) tolower(substr(s, 2)) }
-BEGIN { count = 0 }
-{ lines[++count] = $0 }
-END {
-    i = 1
-    while (i <= count) {
-        if (lines[i] == "<blockquote>") {
-            j = i + 1
-            while (j <= count && lines[j] != "</blockquote>") j++
-            if (j <= count) {
-                first = ""
-                first_idx = 0
-                for (k = i + 1; k < j; k++) {
-                    if (lines[k] != "") {
-                        first = lines[k]
-                        first_idx = k
-                        break
-                    }
-                }
-                if (first ~ /^\[![A-Za-z]+\]$/) {
-                    kind = first
-                    sub(/^\[!/, "", kind)
-                    sub(/\]$/, "", kind)
-                    lkind = tolower(kind)
-                    if (lkind == "note" || lkind == "tip" || lkind == "important" || lkind == "warning" || lkind == "caution") {
-                        print "<div class=\"admonition admonition-" lkind "\">"
-                        print "<p class=\"admonition-title\">" cap(lkind) "</p>"
-                        has_body = 0
-                        for (k = first_idx + 1; k < j; k++) {
-                            if (lines[k] != "") {
-                                print "<p>" lines[k] "</p>"
-                                has_body = 1
-                            }
-                        }
-                        if (!has_body) print "<p></p>"
-                        print "</div>"
-                        i = j + 1
-                        continue
-                    }
-                }
-            }
-        }
-        print lines[i]
-        i++
-    }
-}
-' "$temp_file" > "$temp_file.admon.$$" && mv "$temp_file.admon.$$" "$temp_file"
-
-# Setext-style headers
-sed_ere_inplace_n '
-# Setext-style headers need to be wrapped around newlines
-/^$/ b print
-
-# else, append to holding area
-H
-$ b print
-b
-
-:print
-x
-/=+$/{
-s/\n(.*)\n=+$/\n<h1>\1<\/h1>/
-p
-b
-}
-/\-+$/{
-s/\n(.*)\n\-+$/\n<h2>\1<\/h2>/
-p
-b
-}
-p
-' "$temp_file"
-
-sed_inplace '1 d' "$temp_file" # cleanup superfluous first line
-
-# atx-style headers and other block styles
-sed_ere_inplace '
-/^#+ /s/ #+$// # kill all ending header characters
-/^# /s/# ([A-Za-z0-9 ]*)(.*)/<h1 id="\1">\1\2<\/h1>/g # H1
-/^#{2} /s/#{2} ([A-Za-z0-9 ]*)(.*)/<h2 id="\1">\1\2<\/h2>/g # H2
-/^#{3} /s/#{3} ([A-Za-z0-9 ]*)(.*)/<h3 id="\1">\1\2<\/h3>/g # H3
-/^#{4} /s/#{4} ([A-Za-z0-9 ]*)(.*)/<h4 id="\1">\1\2<\/h4>/g # H4
-/^#{5} /s/#{5} ([A-Za-z0-9 ]*)(.*)/<h5 id="\1">\1\2<\/h5>/g # H5
-/^#{6} /s/#{6} ([A-Za-z0-9 ]*)(.*)/<h6 id="\1">\1\2<\/h6>/g # H6
-
-/^\*\*\*+$/s/\*\*\*+/<hr \/>/ # hr with *
-/^---+$/s/---+/<hr \/>/ # hr with -
-/^___+$/s/___+/<hr \/>/ # hr with _
-
-' "$temp_file"
-
-# unordered lists
-# use grep to find all the nested lists
-while grep '^[\*\+\-] ' "$temp_file" >/dev/null
-do
-sed_ere_inplace_n '
-# wrap the list
-/^$/b list
-
-# wrap the li tags then add to the hold buffer
-# use uli instead of li to avoid collisions when processing nested lists
-/^[\*\+\-] /s/[\*\+\-] (.*)/<\/uli>\n<uli>\n\1/
-
-H
-$ b list # if at end of file, check for the end of a list
-b # else, branch to the end of the script
-
-# this is where a list is checked for the pattern
-:list
-# exchange the hold space into the pattern space
-x
-# look for the list items, if there wrap the ul tags
-/<uli>/{
-s/(.*)/\n<ul>\1\n<\/uli>\n<\/ul>/ # close the ul tags
-s/\n<\/uli>// # kill the first superfluous closing tag
-p
-b
-}
-p
-' "$temp_file"
-
-sed_inplace '1 d' "$temp_file" # cleanup superfluous first line
-
-# convert to the proper li to avoid collisions with nested lists
-sed_inplace 's/uli>/li>/g' "$temp_file"
-
-# prepare any nested lists
-sed_ere_inplace '/^[\*\+\-] /s/(.*)/\n\1\n/' "$temp_file"
-done
-
-# ordered lists
-# use grep to find all the nested lists
-while grep -E '^[1-9]+\. ' "$temp_file" >/dev/null
-do
-sed_ere_inplace_n '
-# wrap the list
-/^$/b list
-
-# wrap the li tags then add to the hold buffer
-# use oli instead of li to avoid collisions when processing nested lists
-/^[1-9]+\. /s/[1-9]+\. (.*)/<\/oli>\n<oli>\n\1/
-
-H
-$ b list # if at end of file, check for the end of a list
-b # else, branch to the end of the script
-
-:list
-# exchange the hold space into the pattern space
-x
-# look for the list items, if there wrap the ol tags
-/<oli>/{
-s/(.*)/\n<ol>\1\n<\/oli>\n<\/ol>/ # close the ol tags
-s/\n<\/oli>// # kill the first superfluous closing tag
-p
-b
-}
-p
-' "$temp_file"
-
-sed_inplace '1 d' "$temp_file" # cleanup superfluous first line
-
-# convert list items into proper list items to avoid collisions with nested lists
-sed_inplace 's/oli>/li>/g' "$temp_file"
-
-# prepare any nested lists
-sed_ere_inplace '/^[1-9]+\. /s/(.*)/\n\1\n/' "$temp_file"
-done
-
-# make escaped periods literal
-sed_ere_inplace '/^[1-9]+\\. /s/([1-9]+)\\. /\1\. /' "$temp_file"
-
-# fenced code blocks (triple backticks)
-awk '
-BEGIN { in_fence = 0; first_line = 0 }
-{
-    if (!in_fence && $0 ~ /^```/) {
-        printf "<pre><code>"
-        in_fence = 1
-        first_line = 1
-        next
-    }
-    if (in_fence && $0 ~ /^```[[:space:]]*$/) {
-        print "</code></pre>"
-        in_fence = 0
-        next
-    }
-    if (in_fence) {
-        if (first_line) {
-            first_line = 0
-            if ($0 == "") next
-        }
-        print
-    } else {
-        print
-    }
-}
-END {
-    if (in_fence) print "</code></pre>"
-}
-' "$temp_file" > "$temp_file.fence.$$" && mv "$temp_file.fence.$$" "$temp_file"
-
-
-# code blocks
-sed_ere_inplace_n '
-# if at end of file, append the current line to the hold buffer and print it
-${
-H
-b code
-}
-
-# wrap the code block on any non code block lines
-/^\t| {4}/!b code
-
-# else, append to the holding buffer and do nothing
-H
-b # else, branch to the end of the script
-
-:code
-# exchange the hold space with the pattern space
-x
-# look for the code items, if there wrap the pre-code tags
-/\t| {4}/{
-s/(\t| {4})(.*)/<pre><code>\n\1\2\n<\/code><\/pre>/ # wrap the ending tags
-p
-b
-}
-p
-' "$temp_file"
-
-sed_inplace '1 d' "$temp_file" # cleanup superfluous first line
-
-# convert html characters inside pre-code tags into printable representations
-sed_ere_inplace '
-# get inside pre-code tags
-/^<pre><code>/{
-:inside
-n
-# if you found the end tags, branch out
-/^<\/code><\/pre>/!{
-s/&/\&amp;/g # ampersand
-s/</\&lt;/g # less than
-s/>/\&gt;/g # greater than
-b inside
-}
-}
-' "$temp_file"
-
-# remove the first tab (or 4 spaces) from the code lines
-sed_ere_inplace 's/^\t| {4}(.*)/\1/' "$temp_file"
-
-# markdown pipe tables
-awk '
-function trim(s) {
-    sub(/^[[:space:]]+/, "", s)
-    sub(/[[:space:]]+$/, "", s)
-    return s
-}
-
-function is_table_row(line, t) {
-    t = line
-    return (t ~ /^[[:space:]]*\|/ && t ~ /\|[[:space:]]*$/)
-}
-
-function is_table_sep(line, t) {
-    if (!is_table_row(line)) return 0
-    t = line
-    gsub(/[|:\-[:space:]]/, "", t)
-    return (t == "" && line ~ /-/)
-}
-
-function split_row(line, out, n, i, raw) {
-    raw = line
-    sub(/^[[:space:]]*\|/, "", raw)
-    sub(/\|[[:space:]]*$/, "", raw)
-    n = split(raw, out, /\|/)
-    for (i = 1; i <= n; i++) out[i] = trim(out[i])
-    return n
-}
-
-function align_for(sep, t) {
-    t = trim(sep)
-    if (t ~ /^:-+:$/) return "center"
-    if (t ~ /^:-+$/) return "left"
-    if (t ~ /^-+:$/) return "right"
-    return ""
-}
-
-function render_cell(cell, inner) {
-    inner = trim(cell)
-    if (inner ~ /^```.*```$/) {
-        sub(/^```[[:space:]]*/, "", inner)
-        sub(/[[:space:]]*```$/, "", inner)
-        return "<pre><code>" inner "</code></pre>"
-    }
-    return inner
-}
-
-BEGIN { count = 0 }
-{ lines[++count] = $0 }
-
-END {
-    in_pre = 0
-    i = 1
-    while (i <= count) {
-        if (lines[i] ~ /^<pre><code>/) {
-            in_pre = 1
-            print lines[i]
-            i++
-            continue
-        }
-        if (in_pre) {
-            print lines[i]
-            if (lines[i] ~ /^<\/code><\/pre>/) in_pre = 0
-            i++
-            continue
-        }
-
-        if (i < count && is_table_row(lines[i]) && is_table_sep(lines[i + 1])) {
-            n_header = split_row(lines[i], header)
-            n_sep = split_row(lines[i + 1], sep)
-            n_cols = (n_header > n_sep ? n_header : n_sep)
-
-            print "<table>"
-            print "<thead>"
-            print "<tr>"
-            for (c = 1; c <= n_cols; c++) {
-                cell = (c <= n_header ? render_cell(header[c]) : "")
-                a = (c <= n_sep ? align_for(sep[c]) : "")
-                if (a != "") print "<th style=\"text-align: " a ";\">" cell "</th>"
-                else print "<th>" cell "</th>"
-            }
-            print "</tr>"
-            print "</thead>"
-
-            j = i + 2
-            print "<tbody>"
-            while (j <= count && is_table_row(lines[j])) {
-                n_body = split_row(lines[j], body)
-                print "<tr>"
-                for (c = 1; c <= n_cols; c++) {
-                    cell = (c <= n_body ? render_cell(body[c]) : "")
-                    a = (c <= n_sep ? align_for(sep[c]) : "")
-                    if (a != "") print "<td style=\"text-align: " a ";\">" cell "</td>"
-                    else print "<td>" cell "</td>"
-                }
-                print "</tr>"
-                j++
-            }
-            print "</tbody>"
-            print "</table>"
-
-            i = j
-            continue
-        }
-
-        if (is_table_sep(lines[i]) && i < count && is_table_row(lines[i + 1])) {
-            n_sep = split_row(lines[i], sep)
-            n_cols = n_sep
-
-            print "<table>"
-            print "<thead>"
-            print "<tr>"
-            for (c = 1; c <= n_cols; c++) {
-                a = align_for(sep[c])
-                if (a != "") print "<th style=\"text-align: " a ";\"></th>"
-                else print "<th></th>"
-            }
-            print "</tr>"
-            print "</thead>"
-
-            j = i + 1
-            print "<tbody>"
-            while (j <= count && is_table_row(lines[j])) {
-                n_body = split_row(lines[j], body)
-                print "<tr>"
-                for (c = 1; c <= n_cols; c++) {
-                    cell = (c <= n_body ? render_cell(body[c]) : "")
-                    a = align_for(sep[c])
-                    if (a != "") print "<td style=\"text-align: " a ";\">" cell "</td>"
-                    else print "<td>" cell "</td>"
-                }
-                print "</tr>"
-                j++
-            }
-            print "</tbody>"
-            print "</table>"
-
-            i = j
-            continue
-        }
-
-        print lines[i]
-        i++
-    }
-}
-' "$temp_file" > "$temp_file.table.$$" && mv "$temp_file.table.$$" "$temp_file"
-
-# br tags
-sed_ere_inplace '
-# if an empty line, append it to the next line, then check on whether there is two in a row
-/^$/ {
-N
-N
-/^\n{2}/s/(.*)/\n<br \/>\1/
-}
-' "$temp_file"
-
-# emphasis and strong emphasis and strikethrough
-sed_ere_inplace_n '
-# batch up the entire stream of text until a line break in the action
-/^$/b emphasis
-
-H
-$ b emphasis
-b
-
-:emphasis
-x
-s/\*\*([^\n]+)\*\*/<strong>\1<\/strong>/g
-s/__([^_\n]+)__/<strong>\1<\/strong>/g
-s/\*([^\*\n]+)\*/<em>\1<\/em>/g
-s/([^\\])_([^_\n]+)_/\1<em>\2<\/em>/g
-s/\~\~([^\n]+)\~\~/<strike>\1<\/strike>/g
-p
-' "$temp_file"
-
-sed_inplace '1 d' "$temp_file" # cleanup superfluous first line
-
-# paragraphs
-sed_ere_inplace_n '
-# if an empty line, check the paragraph
-/^$/ b para
-# else append it to the hold buffer
-H
-# at end of file, check paragraph
-$ b para
-# now branch to end of script
-b
-# this is where a paragraph is checked for the pattern
-:para
-# return the entire paragraph into the pattern space
-x
-# look for non block-level elements, if there - print the p tags
-/\n<(div|table|pre|p|[ou]l|h[1-6]|[bh]r|blockquote|li)/!{
-s/(\n+)(.*)/\1<p>\n\2\n<\/p>/
-p
-b
-}
-p
-' "$temp_file"
-
-sed_inplace '1 d' "$temp_file" # cleanup superfluous first line
-
-# cleanup area where P tags have broken nesting
-sed_ere_inplace_n '
-# if the line looks like like an end tag
-/^<\/(div|table|pre|p|[ou]l|h[1-6]|[bh]r|blockquote)>/{
-h
-# if EOF, print the line
-$ {
-x
-b done
-}
-# fetch the next line and check on whether or not it is a P tag
-n
-/^<\/p>/{
-G
-b done
-}
-# else, append the line to the previous line and print them both
-H
-x
-}
-:done
-p
-' "$temp_file"
-
-# inline styles and special characters
-sed_ere_inplace '
-/^<pre><code>/,/^<\/code><\/pre>/b
-
-s/<(http[s]?:\/\/.*)>/<a href=\"\1\">\1<\/a>/g # automatic links
-s/<(.*@.*\..*)>/<a href=\"mailto:\1\">\1<\/a>/g # automatic email address links
-
-# force-inline image syntax (double bang)
-s/!!\[([^]]*)\]\(([^)]*) \"([^\"]*)\"\)/<img data-force-inline=\"1\" alt=\"\1\" src=\"\2\" title=\"\3\" \/>/g
-s/!!\[([^]]*)\]\(([^)]*)\)/<img data-force-inline=\"1\" alt=\"\1\" src=\"\2\" \/>/g
-
-s/(^|[^\\])!\[([^]]*)\]\(([^)]*) \"([^\"]*)\"\)/\1<img alt=\"\2\" src=\"\3\" title=\"\4\" \/>/g # inline image with title
-s/(^|[^\\])!\[([^]]*)\]\(([^)]*)\)/\1<img alt=\"\2\" src=\"\3\" \/>/g # inline image without title
-
-s/(^|[^\\!])\[([^]]*)\]\(([^)]*) \"([^\"]*)\"\)/\1<a href=\"\3\" title=\"\4\">\2<\/a>/g # inline link with title
-s/(^|[^\\!])\[([^]]*)\]\(([^)]*)\)/\1<a href=\"\3\">\2<\/a>/g # inline link
-
-# MFM font syntax
-s/\$\[font\.serif ([^]]+)\]/<span style=\"font-family: serif;\">\1<\/span>/g
-s/\$\[font\.monospace ([^]]+)\]/<span style=\"font-family: monospace;\">\1<\/span>/g
-s/\$\[font\.sans ([^]]+)\]/<span style=\"font-family: sans-serif;\">\1<\/span>/g
-
-# special characters
-/&.+;/!s/&/\&amp;/g # ampersand
-/<[\/a-zA-Z]/!s/</\&lt;/g# less than bracket
-' "$temp_file"
-
-# display and cleanup
+awk -f "$awk_dir/blockquote_to_admonition.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
+awk -f "$awk_dir/fenced_code.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
+awk -f "$awk_dir/indented_code.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
+awk -f "$awk_dir/pipe_tables.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
+awk -f "$awk_dir/headers.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
+awk -f "$awk_dir/lists.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
+
+sed_inplace "s/^\*\*\*+$/<hr \/>/g" "$temp_file"
+sed_inplace "s/^---+$/<hr \/>/g" "$temp_file"
+sed_inplace "s/^___+$/<hr \/>/g" "$temp_file"
+
+# Spacing
+awk -f "$awk_dir/breaks.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
+awk -f "$awk_dir/paragraphs.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
+
+# Inline styles
+awk -f "$awk_dir/markdown_inline.awk" "$temp_file" > "$temp_file.tmp" && mv "$temp_file.tmp" "$temp_file"
 awk -v input_file="$1" -v site_root="$MARKDOWN_SITE_ROOT" -v fallback_file="$MARKDOWN_FALLBACK_FILE" -f "$awk_dir/markdown_embed.awk" "$temp_file"
 rm "$temp_file"