#!/bin/sh
# html2xhtml -- change old-style uppercase tags to lower case

# Synopsis written to standard error when the script is run without operands.
USAGE='html2xhtml file1 [file2] ...'

# At least one file operand is required; otherwise show the synopsis and fail.
[ "$#" -gt 0 ] || {
	printf '%s\n' "$USAGE" >&2
	exit 1
}

# html2xhtml_file FILE
#
# Rewrite one HTML file in place as XHTML-style markup.
#
# FILE is first renamed to FILE.old, which is kept as a backup of the
# untouched input; FILE is then regenerated by running FILE.old through
# the sed rules below.  The rules:
#   - replace the HTML DOCTYPE line with an XML declaration followed by
#     the XHTML 1.0 Strict DOCTYPE, and add the XHTML namespace to <HTML>;
#   - lower-case a fixed list of upper-case tag and attribute names;
#   - self-close <img>, <br> and <hr> tags.
#
# Arguments: $1 - path of the file to convert
# Returns:   the exit status of mv if the backup rename fails (FILE is
#            then left untouched), otherwise the exit status of sed.
#
# All expansions are quoted and "--" precedes the operands so that names
# containing blanks or glob characters, or starting with "-", are handled.
html2xhtml_file() {
    # Without a backup nothing is rewritten; mv has already reported why.
    mv -- "$1" "$1.old" || return

    # NOTE: the second line of the DOCTYPE replacement must start in
    # column 0, because everything on it (including leading blanks) is
    # literal replacement text.
    # The <IMG rule keeps the leading "<" so the self-closing rule that
    # follows can match the tag; that rule uses [^>]* rather than .* so
    # it stays inside the img tag instead of running on to the last
    # "> found on the line.
    sed -e '
    s#<!DOCTYPE HTML .*>#<?xml version="1.0" encoding="iso-8859-1"?>\
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">#
    s#<HTML>#<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">#
    s/<META/<meta/g
    s/SU[Pp]>/sup>/g
    s/<P/<p/g
    s/P>/p>/g
    s/ADDRESS>/address>/g
    s/<A/<a/g
    s/A>/a>/g
    s/B>/b>/g
    s/<CODE/<code/g
    s/CODE>/code>/g
    s/HREF=/href=/g
    s/NAME=/name=/g
    s/CLASS=/class=/g
    s/VALIGN=/valign=/g
    s/CITE>/cite>/g
    s/EM>/em>/g
    s/STRONG>/strong>/g
    s/CAPTION>/caption>/g
    s/<IMG/<img/g
    s/\(<img [^>]*\)">/\1" \/>/g
    s/H1>/h1>/g
    s/H2>/h2>/g
    s/H3>/h3>/g
    s/H4>/h4>/g
    s/H5>/h5>/g
    s/UL>/ul>/g
    s/OL>/ol>/g
    s/DL>/dl>/g
    s/LI>/li>/g
    s/Li>/li>/g
    s/<BR>/<br \/>/g
    s/<br>/<br \/>/g
    s/<TABLE WIDTH="100%"/<table width="80%"/g
    s/TABLE>/table>/g
    s/THEAD>/thead>/g
    s/TITLE>/title>/g
    s/TBODY>/tbody>/g
    s/HEAD>/head>/g
    s/BODY>/body>/g
    s/<TR/<tr/g
    s/TR>/tr>/g
    s/TH>/th>/g
    s/TD>/td>/g
    s/TD /td /g
    s/DT>/dt>/g
    s/DD>/dd>/g
    s/<KBD/<kbd/g
    s/KBD>/kbd>/g
    s/<HR SIZE=\([^ ]*\)>/<hr size="\1" \/>/g
    s/<HR>/<hr \/>/g
    ' -- "$1.old" > "$1"
}

# Convert every file named on the command line; a file that fails does
# not stop the remaining ones from being processed.
for f
do
    html2xhtml_file "$f"
done
