#! /local/bin/perl -s
#
# ll2html --- convert (standardized) language list to html
#
# Assumes that The Language List has first been converted by stdll.
#
# Oscar Nierstrasz 27/5/93
#
# Exactly one of the -s style switches -i, -b, -a or -idx selects which
# part of the list is converted; input is read from the files named on
# the command line (or STDIN) and the result is written to STDOUT.
#
# NOTE(review): this copy of the script looks as if it went through a
# step that stripped markup: many string literals and substitution
# replacements below consist only of newlines where tags would be
# expected.  They are reproduced exactly as found (as "\n" escapes);
# confirm the intended markup against a pristine copy.

$v = "ll2html v1.0";    # Re-written to perl 28/6/93

$u = 'Usage: ll2html [-(option)] -i introduction -b body (split by language name) -a appendix -idx index ';

# chomp rather than chop: only a trailing newline is ever removed.
chomp($date = `date +%d.%m.%y`);

$omn = "OMN\n\n";

# Trailer printed at the end of the introduction, appendix and index.
$sig = "This file was generated by $v on $date.\n$omn\n\n\n";

# Dispatch on the switch set by perl's -s option processing.
if ($i) {
    intro();
}
elsif ($b) {
    body();
}
elsif ($a) {
    app();
}
elsif ($idx) {
    idx();
}
else {
    die($u);
}

# Process the introduction.
# Try to guess which lines are supposed to be broken, and
# which can be justified.  Mode 0 means the previous line was blank.
# Mode 1 means we are inside a justified paragraph.  Mode 2 means we
# are inside a list.
# NOTE(review): the original comment went on to say "Use ... instead of
# ... to cut down on white space"; the two names are missing from this
# copy.
sub intro {
    print "Introduction to The Language List\n\n";
    $mode = 0;
    while (<>) {
        chomp;              # strip record separator (safe on a final
                            # line that lacks a newline)
        htmlescape();
        s/\s*$//;           # remove trailing white space
        s/\s+/ /;           # compress the first run of white space
                            # (no /g, so later runs are left alone)
        if (/^$/) {
            # terminate lists & paragraphs:
            if (($mode == 1) || ($mode == 2)) {
                print "\n\n\n";
            }
            $mode = 0;
        }
        # non-blank lines:
        elsif ($mode == 0) {
            if (/^The Language List/) {
                print "\n\n\n$_\n\n\n";
                $mode = 1;
            }
            # e.g., Version #:
            elsif (/^[A-Z].*: /) {
                print "\n\n\n$_\n";
                $mode = 2;
            }
            # section heading:
            elsif (/^[A-Z].*:$/) {
                print "\n\n\n$_\n\n\n\n";
                $mode = 0;
            }
            elsif (/^\S/) {
                print "\n\n\n$_\n\n\n\n";
                $mode = 0;
            }
            # indented list:
            elsif (/^\s/) {
                print "\n\n\n$_\n";
                $mode = 1;
            }
        }
        elsif ($mode == 1) {
            # an indented line inside a paragraph starts a new break
            if (/^ /) {
                print "\n\n";
            }
            print "$_\n";
        }
        else {
            print "\n\n$_\n";
        }
    }
    print "$sig";
}

# process the body (for use with parscan)
# Input is read a paragraph at a time; each record is expected to start
# with an "L " line and may contain "| ", "P ", "I " and "F " lines.
sub body {
    $/ = "";                # paragraph mode: records end at blank lines
    while (<>) {
        htmlescape();
        # Deliberately chop, not chomp: in paragraph mode chomp would
        # remove every trailing newline and change the output spacing.
        chop;
        s!^L (.*)!\n\n$1\n\n\n!;
        s!\n\| (.*)!\n$1!g;
        s!\nP (.*)!\n\n\n$1!g;
        s!\nI (.*)!\n\n\nInfo: $1!g;
        s!\nF (.*)!\n\n\nFtp:\n\n$1!g;
        # NOTE(review): the clean-ups below operate on HREF="..." and
        # file:// text, which none of the replacements above produce in
        # this copy -- presumably the link markup was lost; confirm.
        s!(HREF=".*)[,.;]"!$1"!g;       # remove garbage punctuation
        s!(HREF=".*)[^/]*\.Z"!$1"!g;    # delete trailing .Z and *
        s!(HREF=".*)[^/]*\*"!$1"!g;
        s!(file://[^:]*):!$1!g;         # remove colons in ftp addresses
        print "\n\n\n$_\n\n";
    }
}

# escape special characters
# Rewrites $_ in place so that it can be embedded in HTML text.  The
# ampersand is handled first so that the entities introduced for < and >
# are not escaped a second time.
sub htmlescape {
    s/&/&amp;/g;
    s/</&lt;/g;
    s/>/&gt;/g;
}

# Process the appendices.
# Again, try to guess where lines are supposed to be broken.
# Mode 0 means the previous line was blank (or a ==== rule), mode 1 is
# set by an ordinary line, mode 2 by a line starting with a 19xx year
# followed by two white-space characters.
# Mode 3 means we are building up the subtitle.
sub app {
    print "Appendices to The Language List\n\n";
    $mode = 0;
    while (<>) {
        chomp;              # strip record separator (safe on a final
                            # line that lacks a newline)
        htmlescape();
        if (/^$/) {
            # terminate lists & paragraphs; a blank line between
            # "APPENDIX" and its subtitle is skipped silently:
            if ($mode != 3) {
                if ($mode > 0) {
                    print "\n\n\n";
                }
                $mode = 0;
            }
        }
        elsif (/^APPENDIX/) {
            print "\n\n$_\n\n\n\n";
            $mode = 3;
        }
        # a rule made only of '=' characters is dropped
        elsif (/^=+$/) {
            $mode = 0;
            next;
        }
        # non-blank lines:
        elsif ($mode == 0) {
            if (/^19\d\d\s\s/) {
                print "\n\n$_\n";
                $mode = 2;
            }
            else {
                print "\n\n$_";
                $mode = 1;
            }
        }
        elsif ($mode == 1) {
            if (/^\s/) {
                print "\n\n$_\n";
            }
            else {
                # continuation line: emitted as-is, with no separator
                print;
            }
        }
        elsif ($mode == 2) {
            print "\n\n$_\n";
        }
        elsif ($mode == 3) {
            # the first non-blank line after APPENDIX is the subtitle
            print "\n\n$_\n\n\n\n";
            $mode = 0;
        }
    }
    # close whatever was still open at end of input
    if ($mode > 0) {
        print "\n\n\n";
    }
    print "\n\n\n$sig";
}

# Build the index: one entry per blank-line-terminated record, made of
# the language name from the record's "L " line and, when present, the
# number from its "N " line.
sub idx {
    print "Index to The Language List\n\n";
    print "\n\nIndex to The Language List\n\n\n\n";
    while (<>) {
        # chop;
        if (/^L (.*)/) {
            $lang = $1;
        }
        if (/^N (\d+)/) {
            $num = $1;
        }
        # First letter of the language name.
        # NOTE(review): $char is not used by any code visible in this
        # copy; presumably it fed markup that is missing from the print
        # below -- confirm before removing.
        if ($lang =~ /[^a-zA-Z]*([a-zA-Z])/) {
            $char = $1;
        }
        # A blank line ends the record ($ matches before the newline
        # that is still attached, since the line is not chopped).
        if (/^$/) {
            print "$lang";
            if ($num =~ /\d/) {
                print "[$num]";
                $num = "";  # do not carry the number into the next entry
            }
            print ";\n";
        }
    }
    print "\n\n\n$sig";
}