#!/bin/sh
#
# Render a Haskell Weekly News HTML page as plain text.
#
# Usage: SCRIPT FILE.html
#
# Output goes to FILE.txt (a trailing ".html" is replaced by ".txt"; any other
# name gets ".txt" appended).  The output consists of:
#   1. a banner with the HWN URL for today's date, the contents of the file
#      "issue" in the current directory, and today's date;
#   2. the `lynx -dump` rendering of the input at width 80, with the known
#      section headings moved to column 0 and adjacent duplicate lines
#      collapsed by uniq.
#
# Requires: lynx, sed, uniq, date, and a readable ./issue file
# (presumably holding the issue title/number -- confirm with the publisher).

set -eu

if [ "$#" -eq 0 ]; then
    printf 'usage: %s FILE.html\n' "${0##*/}" >&2
    exit 2
fi

# All arguments are joined into a single file name, so a name containing
# spaces works whether or not the caller quoted it.
in="$*"

# Derive the output name from the *suffix* only.  Never let $out equal $in:
# the redirect below truncates $out before lynx gets to read the input.
case $in in
    *.html) out=${in%.html}.txt ;;
    *)      out=$in.txt ;;
esac

{
    # Banner.  The heredoc body must stay at column 0 so it is emitted verbatim.
    cat <<EOF
---------------------------------------------------------------------------
Haskell Weekly News
http://sequence.complete.org/hwn/$(date +"%Y%m%d")
$(cat issue) - $(date +"%B %d, %Y")
---------------------------------------------------------------------------
EOF

    # lynx indents headings; strip the leading spaces from each known section
    # heading so it starts at column 0.  Patterns are prefixes ("Librar"
    # matches both "Library" and "Libraries", "Contrib" matches "Contributing").
    lynx -dump -force_html -width=80 "$in" |
        sed -e 's/^ *\(Announce\)/\1/'   \
            -e 's/^ *\(Community\)/\1/'  \
            -e 's/^ *\(Google\)/\1/'     \
            -e 's/^ *\(Discussion\)/\1/' \
            -e 's/^ *\(Conference\)/\1/' \
            -e 's/^ *\(Blog noise\)/\1/' \
            -e 's/^ *\(Quotes\)/\1/'     \
            -e 's/^ *\(Jobs\)/\1/'       \
            -e 's/^ *\(Code Watch\)/\1/' \
            -e 's/^ *\(About\)/\1/'      \
            -e 's/^ *\(Contrib\)/\1/'    \
            -e 's/^ *\(Librar\)/\1/'     \
            -e 's/^ *\(Hackage\)/\1/'    \
            -e "s/^ *\(Haskell'\)/\1/" |
        uniq
} > "$out"
