summaryrefslogtreecommitdiff
path: root/purify_html
blob: 4cf582af50c8deb914824485a6e160e38eabed5d (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
#!/bin/sh

# Mangle the rendered files to cause fewer differences upon re-rendering.

# Written by Thomas Schwinge <tschwinge@gnu.org>.

# Un-mangle mailto links: convert HTML character entities to real characters.
find ./ -name \*.html -print0 \
  | xargs -0 \
    perl -p -i -l -e \
      'BEGIN { $replacing = 0; }
      # The replacing-toggling logic is a bit rough, but so is life.
      $replacing = 1 if /<a href="mailto:/;
      s%\&#(x?)([^;]*);%chr(length($1) ? hex($2) : $2)%eg if $replacing;
      $replacing = 0 if /<\/a>/;'