-# Maps HTML character entities to the corresponding Latin1 characters.
-#
-my %entity_table = (
- "quot" => '"', "amp" => '&', "lt" => '<',
- "gt" => '>', "nbsp" => " ", "iexcl" => "\xA1",
- "cent" => "\xA2", "pound" => "\xA3", "curren" => "\xA4",
- "yen" => "\xA5", "brvbar" => "\xA6", "sect" => "\xA7",
- "uml" => "\xA8", "copy" => "\xA9", "ordf" => "\xAA",
- "laquo" => "\xAB", "not" => "\xAC", "shy" => "\xAD",
- "reg" => "\xAE", "macr" => "\xAF", "deg" => "\xB0",
- "plusmn" => "\xB1", "sup2" => "\xB2", "sup3" => "\xB3",
- "acute" => "\xB4", "micro" => "\xB5", "para" => "\xB6",
- "middot" => "\xB7", "cedil" => "\xB8", "sup1" => "\xB9",
- "ordm" => "\xBA", "raquo" => "\xBB", "frac14" => "\xBC",
- "frac12" => "\xBD", "frac34" => "\xBE", "iquest" => "\xBF",
- "Agrave" => "\xC0", "Aacute" => "\xC1", "Acirc" => "\xC2",
- "Atilde" => "\xC3", "Auml" => "\xC4", "Aring" => "\xC5",
- "AElig" => "\xC6", "Ccedil" => "\xC7", "Egrave" => "\xC8",
- "Eacute" => "\xC9", "Ecirc" => "\xCA", "Euml" => "\xCB",
- "Igrave" => "\xCC", "Iacute" => "\xCD", "Icirc" => "\xCE",
- "Iuml" => "\xCF", "ETH" => "\xD0", "Ntilde" => "\xD1",
- "Ograve" => "\xD2", "Oacute" => "\xD3", "Ocirc" => "\xD4",
- "Otilde" => "\xD5", "Ouml" => "\xD6", "times" => "\xD7",
- "Oslash" => "\xD8", "Ugrave" => "\xD9", "Uacute" => "\xDA",
- "Ucirc" => "\xDB", "Uuml" => "\xDC", "Yacute" => "\xDD",
- "THORN" => "\xDE", "szlig" => "\xDF", "agrave" => "\xE0",
- "aacute" => "\xE1", "acirc" => "\xE2", "atilde" => "\xE3",
- "auml" => "\xE4", "aring" => "\xE5", "aelig" => "\xE6",
- "ccedil" => "\xE7", "egrave" => "\xE8", "eacute" => "\xE9",
- "ecirc" => "\xEA", "euml" => "\xEB", "igrave" => "\xEC",
- "iacute" => "\xED", "icirc" => "\xEE", "iuml" => "\xEF",
- "eth" => "\xF0", "ntilde" => "\xF1", "ograve" => "\xF2",
- "oacute" => "\xF3", "ocirc" => "\xF4", "otilde" => "\xF5",
- "ouml" => "\xF6", "divide" => "\xF7", "oslash" => "\xF8",
- "ugrave" => "\xF9", "uacute" => "\xFA", "ucirc" => "\xFB",
- "uuml" => "\xFC", "yacute" => "\xFD", "thorn" => "\xFE",
- "yuml" => "\xFF", "apos" => "\'",
-
- # HTML 4 entities that do not have 1:1 Latin1 mappings.
- "bull" => "*", "hellip"=> "...", "prime" => "'", "Prime" => "\"",
- "frasl" => "/", "trade" => "[tm]", "larr" => "<-", "rarr" => "->",
- "harr" => "<->", "lArr" => "<=", "rArr" => "=>", "hArr" => "<=>",
- "empty" => "\xD8", "minus" => "-", "lowast"=> "*", "sim" => "~",
- "cong" => "=~", "asymp" => "~", "ne" => "!=", "equiv" => "==",
- "le" => "<=", "ge" => ">=", "lang" => "<", "rang" => ">",
- "loz" => "<>", "OElig" => "OE", "oelig" => "oe", "Yuml" => "Y",
- "circ" => "^", "tilde" => "~", "ensp" => " ", "emsp" => " ",
- "thinsp"=> " ", "ndash" => "-", "mdash" => "-", "lsquo" => "`",
- "rsquo" => "'", "sbquo" => "'", "ldquo" => "\"", "rdquo" => "\"",
- "bdquo" => "\"", "lsaquo"=> "<", "rsaquo"=> ">",
-);
-
-# Maps certain UTF8 characters (2 or 3 bytes) to the corresponding
-# Latin1 characters.
-#
-my %unicode_latin1_table = (
- "\xC2\xA1" => "\xA1", "\xC2\xA2" => "\xA2", "\xC2\xA3" => "\xA3",
- "\xC2\xA4" => "\xA4", "\xC2\xA5" => "\xA5", "\xC2\xA6" => "\xA6",
- "\xC2\xA7" => "\xA7", "\xC2\xA8" => "\xA8", "\xC2\xA9" => "\xA9",
- "\xC2\xAA" => "\xAA", "\xC2\xAB" => "\xAB", "\xC2\xAC" => "\xAC",
- "\xC2\xAD" => "\xAD", "\xC2\xAE" => "\xAE", "\xC2\xAF" => "\xAF",
- "\xC2\xB0" => "\xB0", "\xC2\xB1" => "\xB1", "\xC2\xB2" => "\xB2",
- "\xC2\xB3" => "\xB3", "\xC2\xB4" => "\xB4", "\xC2\xB5" => "\xB5",
- "\xC2\xB6" => "\xB6", "\xC2\xB7" => "\xB7", "\xC2\xB8" => "\xB8",
- "\xC2\xB9" => "\xB9", "\xC2\xBA" => "\xBA", "\xC2\xBB" => "\xBB",
- "\xC2\xBC" => "\xBC", "\xC2\xBD" => "\xBD", "\xC2\xBE" => "\xBE",
- "\xC2\xBF" => "\xBF", "\xC3\x80" => "\xC0", "\xC3\x81" => "\xC1",
- "\xC3\x82" => "\xC2", "\xC3\x83" => "\xC3", "\xC3\x84" => "\xC4",
- "\xC3\x85" => "\xC5", "\xC3\x86" => "\xC6", "\xC3\x87" => "\xC7",
- "\xC3\x88" => "\xC8", "\xC3\x89" => "\xC9", "\xC3\x8A" => "\xCA",
- "\xC3\x8B" => "\xCB", "\xC3\x8C" => "\xCC", "\xC3\x8D" => "\xCD",
- "\xC3\x8E" => "\xCE", "\xC3\x8F" => "\xCF", "\xC3\x90" => "\xD0",
- "\xC3\x91" => "\xD1", "\xC3\x92" => "\xD2", "\xC3\x93" => "\xD3",
- "\xC3\x94" => "\xD4", "\xC3\x95" => "\xD5", "\xC3\x96" => "\xD6",
- "\xC3\x97" => "\xD7", "\xC3\x98" => "\xD8", "\xC3\x99" => "\xD9",
- "\xC3\x9A" => "\xDA", "\xC3\x9B" => "\xDB", "\xC3\x9C" => "\xDC",
- "\xC3\x9D" => "\xDD", "\xC3\x9E" => "\xDE", "\xC3\x9F" => "\xDF",
- "\xC3\xA0" => "\xE0", "\xC3\xA1" => "\xE1", "\xC3\xA2" => "\xE2",
- "\xC3\xA3" => "\xE3", "\xC3\xA4" => "\xE4", "\xC3\xA5" => "\xE5",
- "\xC3\xA6" => "\xE6", "\xC3\xA7" => "\xE7", "\xC3\xA8" => "\xE8",
- "\xC3\xA9" => "\xE9", "\xC3\xAA" => "\xEA", "\xC3\xAB" => "\xEB",
- "\xC3\xAC" => "\xEC", "\xC3\xAD" => "\xED", "\xC3\xAE" => "\xEE",
- "\xC3\xAF" => "\xEF", "\xC3\xB0" => "\xF0", "\xC3\xB1" => "\xF1",
- "\xC3\xB2" => "\xF2", "\xC3\xB3" => "\xF3", "\xC3\xB4" => "\xF4",
- "\xC3\xB5" => "\xF5", "\xC3\xB6" => "\xF6", "\xC3\xB7" => "\xF7",
- "\xC3\xB8" => "\xF8", "\xC3\xB9" => "\xF9", "\xC3\xBA" => "\xFA",
- "\xC3\xBB" => "\xFB", "\xC3\xBC" => "\xFC", "\xC3\xBD" => "\xFD",
- "\xC3\xBE" => "\xFE", "\xC3\xBF" => "\xFF",
-
- "\xE2\x80\x93" => '--', "\xE2\x80\x94" => '--',
- "\xE2\x80\x98" => '`', "\xE2\x80\x99" => '\'',
- "\xE2\x80\x9C" => "``", "\xE2\x80\x9D" => "''",
- "\xE2\x80\xB2" => "'", "\xE2\x80\xA6" => '...',
- "\xE2\x86\x90" => ' ← ', "\xE2\x84\xA2" => '™',
- "\xE2\x80\xA2" => '•', "\xC2\xA0" => ' ', #
- );
-