#!/bin/sh
#
# html2latex.sh - convert HTML to jLaTeX
#	$Id: html2latex.sh,v 1.5 1995/02/22 01:25:24 saka Exp $
# Copyright (C) 1994, by Tetsuo Sakaguchi,
#       University of Library and Information Science. (saka@ulis.ac.jp)
#
# Warning: this script is made for HTML produced with text2html.sh
#
# Encoding filter applied to the raw input before any text processing.
# Expanded unquoted on purpose so that options may be added to the value.
jisto='jconv'

# escape_tex_text - stage 1: protect TeX-special characters in running text.
#   stdin:  HTML text
#   stdout: same text with  { } $  prefixed by a backslash and every literal
#           backslash rewritten as $\backslash$
# Lines from <PRE> through </PRE> are left untouched.
#
# Backslashes are first parked as newline characters (which can never occur
# inside a line held by sed), so the backslashes that the second command adds
# in front of { } $ cannot be confused with backslashes from the input.
# This also handles runs of backslashes and a backslash at end of line.
escape_tex_text() {
    sed -e '
/<PRE>/,/<\/PRE>/ !{
    y/\\/\n/
    s/[{}$]/\\&/g
    s/\n/$\\backslash$/g
}
'
}

# html_tags_to_latex - stage 2: map HTML tag lines to LaTeX commands.
#   stdin:  output of escape_tex_text
#   stdout: LaTeX preamble followed by the translated body
# A line that contains a recognised tag is replaced as a whole by the
# corresponding LaTeX line(s); any other text on that line is dropped.
# Rules are tried top to bottom and the first match wins, so their order
# is significant.  Unrecognised lines are copied through unchanged.
html_tags_to_latex() {
    awk '
BEGIN {
    # Inside an awk string a backslash must be written twice.
    print "\\documentstyle[a4j]{jarticle}";
    print "\\setlength{\\parindent}{0cm}";
    print "\\setlength{\\parskip}{4pt plus 3pt minus 2pt}";
    print "\\setcounter{page}{1001}";
}

# Document skeleton: drop <HTML> and the whole <HEAD> section.
/<HTML>|<\/HTML>/    { next; }
/<HEAD>/,/<\/HEAD>/  { next; }

/<BODY>/ {
    print "\\begin{document}";
    next;
}
/<\/BODY>/ {
    print "\\end{document}";
    next;
}

# Title: centred, large bold.  The group opened here is closed by </H1>.
/<H1>/ {
    print "\\vspace{1cm}";
    print "\\begin{center} {\\Large\\bf";
    next;
}
/<\/H1>/ {
    print "} \\end{center}";
    next;
}

/<ADDRESS>/ {
    print "\\begin{center}";
    next;
}
/<\/ADDRESS>/ {
    print "\\end{center}";
    next;
}

# Forced line break.
/<BR>/ {
    print "\\\\";
    next;
}

/<H2>/ {
    print "\\subsection*{";
    next;
}
/<\/H2>/ {
    print "}";
    next;
}

# Horizontal rules have no counterpart in the output.
/<HR>/ { next; }

# A comment starting with "FF" becomes a page break.
/<!-- FF[^>]*>/ {
    print "\\newpage";
    next;
}

/<P>/ {
    print "\\par";
    next;
}

/<UL>/ {
    print "\\begin{itemize}";
    next;
}
/<\/UL>/ {
    print "\\end{itemize}";
    next;
}
/<LI>/ {
    print "\\item";
    next;
}

/<PRE>/ {
    print "\\begin{verbatim}";
    next;
}
/<\/PRE>/ {
    print "\\end{verbatim}";
    next;
}

# Everything else is ordinary text.
{ print; }
'
}

# finish_latex_text - stage 3: final clean-up of the generated LaTeX.
#   stdin:  output of html_tags_to_latex
#   stdout: finished LaTeX source
# Removes any remaining tags, decodes the entities &lt; &gt; &quot; &amp;
# (on every line, including verbatim blocks), then, outside verbatim
# environments only, escapes  & # %  and  _ ^ ~  and wraps  < >  in math mode.
finish_latex_text() {
    sed -e '
s/<[^>]*>//g
s/&lt;/</g
s/&gt;/>/g
s/&quot;/"/g
s/&amp;/\&/g
/\\begin{verbatim}/,/\\end{verbatim}/ !s/[&#%]/\\&/g
/\\begin{verbatim}/,/\\end{verbatim}/ !s/[_^~]/\\&{}/g
/\\begin{verbatim}/,/\\end{verbatim}/ !s/[<>]/$&$/g
'
}

# main - concatenate the named files (or stdin when none are given), run
# them through the encoding filter and the three conversion stages, and
# write the resulting LaTeX to stdout.
main() {
    cat "$@" \
    | ${jisto} \
    | escape_tex_text \
    | html_tags_to_latex \
    | finish_latex_text
}

main "$@"

