#! /bin/sh
#
# Clean up one HTML file in place with HTML Tidy.
#
# Usage: <this-script> FILE
#
# When FILE ends in ".html" it is run through tidy (XHTML output), its
# mailto: links are rewritten, a leading XML declaration is removed, and the
# result replaces FILE.  Any other argument is silently ignored.
#
# Exit status: 1 if tidy returned a non-zero status for FILE; in that case the
# filtered tidy report is printed on stdout and FILE's content is not replaced.

# Print the tidy report stored in file $1 without tidy's boilerplate lines and
# without the lines that begin with "<name>:", where <name> is $2.
# The name is matched as a literal prefix (not as a regular expression), so
# characters such as "." or "+" in a file name cannot distort the filter.
print_tidy_report() {
  # The report is fed on stdin so awk never interprets the path as an operand.
  TIDY_FILE_PREFIX="$2:" awk '
    index($0, ENVIRON["TIDY_FILE_PREFIX"]) == 1 { next }
    /^(HTML Tidy|To learn|Please send|HTML and CSS|Lobby your)/ { next }
    { print }
  ' <"$1"
}

# Tidy the HTML file $1 in place.
# Returns 1 if tidy exited non-zero, otherwise the status of the final rm.
# Uses "$1.fixed" and "$1.report" as scratch files next to the input.
fix_html() {
  html=$1
  fixed=$html.fixed
  report=$html.report

  tidy -latin1 -wrap 0 -q -asxhtml "$html" >"$fixed" 2>"$report"
  tidy_ret=$?

  # Strip leading whitespace, point the listed oetiker/ethz mailto: links at
  # the homepage URL, and insert "..delete..this.." into every other mailto:
  # address.
  perl -i -0777 -p -e 's/^\s*//;s{="mailto:(oetiker|tobi|tobias)@(oetiker.ch|ee.ethz.ch)"}{="http://tobi.oetiker.ch/"}g;s{="mailto:(\S*?)\@(\S*?)"}{="mailto:$1@..delete..this..$2"}g' "$fixed"

  # Yes, believe it or not, IE chokes on proper XHTML pages ... sigh.
  # So drop the leading <?xml ...?> declaration.
  perl -i -0777 -p -e 's/^\s*<\?xml.+?\?>\s*//;' "$fixed"

  if [ "$tidy_ret" -ne 0 ]; then
    printf 'Parsing: %s\n' "$html"
    print_tidy_report "$report" "$html"
    rm "$report"
    # NOTE(review): "$fixed" is left behind on this path, as before --
    # presumably for inspection; confirm.

    # Reduce e.g. "page.en.html" or "page.de.html" to "page".
    name=$(basename "$html" .html)
    name=$(basename "$name" .en)
    name=$(basename "$name" .de)

    # Backdate every "<name>.*.html" in the current directory (presumably so
    # a build tool sees them as out of date -- confirm).  Skip the pattern
    # itself when nothing matches, so no file literally named
    # "<name>.*.html" is created.
    for sibling in "$name".*.html; do
      if [ -e "$sibling" ]; then
        touch -m -t 198001010000 "$sibling"
      fi
    done
    return 1
  fi

  mv "$fixed" "$html"
  rm "$report"
}

case "$1" in
*.html)
  fix_html "$1" || exit 1
  ;;
esac