"Fossies" - the Fresh Open Source Software Archive

Member "latex2html-2002-2-1/versions/latin7.pl" (29 Nov 2002, 12877 Bytes) of archive /linux/www/latex2html-2002-2-1.tar.gz:


As a special service, "Fossies" has tried to format the requested source page as HTML (assuming markdown input). Alternatively, you can view or download the uninterpreted source code file here. A member file can also be downloaded by clicking the corresponding byte-size field in a package contents listing.

# File: latin7.pl
#
# Version 0.1, September 10, 1999
# Written by Ross Moore <ross@maths.mq.edu.au>
#
# ISO_8859-13 encoding information
#
# Copyright (C) 1999 by Ross Moore
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.

# Charset name and LaTeX input-encoding name announced by this module.
$CHARSET  = 'iso-8859-13';
$INPUTENC = 'latin7';

# Character ranges for lower --> upper-case conversion.
# The two strings are positionally parallel: the n-th lower-case code
# corresponds to the n-th upper-case code.  They must be double-quoted so
# that the octal escapes are interpreted.
$sclower = "\270\272\277\340-\366\370-\376";
$scupper = "\250\252\257\300-\326\330-\336";

# Extra pattern match preceding lower --> upper-case conversion:
# character \337 (decimal 223) has no single upper-case code, so it is
# spelled out as "ss".
$scextra = "s/\337/ss/g";

# Same special case, keyed by decimal character code.
%extra_small_caps = ( '223', 'ss' );

# Decimal code of each lower-case character => decimal code of its
# upper-case counterpart in ISO-8859-13.  For the main block the
# upper-case code is the lower-case code minus 32.
%low_entities = (
    '224', '192',
    '225', '193',
    '226', '194',
    '227', '195',
    '228', '196',
    '229', '197',
    '230', '198',
    '231', '199',
    '232', '200',
    '233', '201',
    '234', '202',
    '235', '203',
    '236', '204',
    '237', '205',
    '238', '206',
    '239', '207',
    '240', '208',
    '241', '209',
    '242', '210',
    '243', '211',
    '244', '212',
    '245', '213',
    '246', '214',
#   '247', '215',   # disabled: 247/215 are the divide/times signs, not a case pair
    '248', '216',
    '249', '217',
    '250', '218',
    '251', '219',
    '252', '220',
    '253', '221',
    '254', '222',
#   '255', '223',   # disabled: 255 is a quote mark and 223 is the sharp s
    # The three letters outside the main block sit 16 below their
    # lower-case codes, matching $sclower (\270\272\277) and
    # $scupper (\250\252\257): 184->168, 186->170, 191->175.
    '184', '168',
    '186', '170',
    '191', '175',
);

# Handlers for the \oe and \OE ligature commands.
# Each takes the text following the command in $_[0] and returns whatever
# &iso_map (defined elsewhere in LaTeX2HTML) yields for the named glyph,
# immediately followed by that unchanged text.
sub do_cmd_oe { return join('', &iso_map("oe", "lig"), $_[0]); }
sub do_cmd_OE { return join('', &iso_map("OE", "lig"), $_[0]); }

# Handlers for special letters: \l, \L, \ng, \ss and \i.
# Each takes the text following the command in $_[0] and returns whatever
# &iso_map (defined elsewhere in LaTeX2HTML) yields for the named glyph,
# immediately followed by that unchanged text.
sub do_cmd_l  { return join('', &iso_map("l", "stroke"), $_[0]); }
sub do_cmd_L  { return join('', &iso_map("L", "stroke"), $_[0]); }
sub do_cmd_ng { return join('', &iso_map("eng", ""), $_[0]); }
sub do_cmd_ss { return join('', &iso_map("sz", "lig"), $_[0]); }
sub do_cmd_i  { return join('', &iso_map("i", "nodot"), $_[0]); }

# Handlers for text-mode symbols (fractions, currency signs, quotation
# marks and similar).  Each takes the text following the command in $_[0]
# and returns whatever &iso_map (defined elsewhere in LaTeX2HTML) yields
# for the named glyph, immediately followed by that unchanged text.
sub do_cmd_textonequarter     { return join('', &iso_map("frac14", ""), $_[0]); }
sub do_cmd_textonehalf        { return join('', &iso_map("frac12", ""), $_[0]); }
sub do_cmd_textthreequarters  { return join('', &iso_map("frac34", ""), $_[0]); }
sub do_cmd_textcent           { return join('', &iso_map("cent", ""), $_[0]); }
sub do_cmd_textyen            { return join('', &iso_map("yen", ""), $_[0]); }
sub do_cmd_textcurrency       { return join('', &iso_map("curren", ""), $_[0]); }
sub do_cmd_textbrokenbar      { return join('', &iso_map("brvbar", ""), $_[0]); }
sub do_cmd_textregistered     { return join('', &iso_map("reg", ""), $_[0]); }
sub do_cmd_textperiodcentered { return join('', &iso_map("middot", ""), $_[0]); }
sub do_cmd_guillemotleft      { return join('', &iso_map("laquo", ""), $_[0]); }
sub do_cmd_guillemotright     { return join('', &iso_map("raquo", ""), $_[0]); }
sub do_cmd_quotedblbase       { return join('', &iso_map("dbquo", ""), $_[0]); }
sub do_cmd_quotesinglbase     { return join('', &iso_map("sbquo", ""), $_[0]); }

# Handlers for the \math... symbol commands (degree sign, superior digits,
# ordinal indicators).  Each takes the text following the command in $_[0]
# and returns whatever &iso_map (defined elsewhere in LaTeX2HTML) yields
# for the named glyph, immediately followed by that unchanged text.
sub do_cmd_mathdegree        { return join('', &iso_map("deg", ""), $_[0]); }
sub do_cmd_mathonesuperior   { return join('', &iso_map("sup1", ""), $_[0]); }
sub do_cmd_mathtwosuperior   { return join('', &iso_map("sup2", ""), $_[0]); }
sub do_cmd_maththreesuperior { return join('', &iso_map("sup3", ""), $_[0]); }
sub do_cmd_mathordmasculine  { return join('', &iso_map("ordm", ""), $_[0]); }
sub do_cmd_mathordfeminine   { return join('', &iso_map("ordf", ""), $_[0]); }

# Handlers for \P, \S and assorted operator/currency commands.
# Each takes the text following the command in $_[0] and returns whatever
# &iso_map (defined elsewhere in LaTeX2HTML) yields for the named glyph,
# immediately followed by that unchanged text.
sub do_cmd_P { return join('', &iso_map("para", ""), $_[0]); }
sub do_cmd_S { return join('', &iso_map("sect", ""), $_[0]); }

sub do_cmd_pm        { return join('', &iso_map("plusmn", ""), $_[0]); }
sub do_cmd_div       { return join('', &iso_map("divide", ""), $_[0]); }
sub do_cmd_times     { return join('', &iso_map("times", ""), $_[0]); }
# Note: \minus is looked up under the name "shy".
sub do_cmd_minus     { return join('', &iso_map("shy", ""), $_[0]); }
sub do_cmd_copyright { return join('', &iso_map("copy", ""), $_[0]); }
sub do_cmd_pounds    { return join('', &iso_map("pound", ""), $_[0]); }
sub do_cmd_cents     { return join('', &iso_map("cent", ""), $_[0]); }
sub do_cmd_lnot      { return join('', &iso_map("not", ""), $_[0]); }
sub do_cmd_cdot      { return join('', &iso_map("middot", ""), $_[0]); }
sub do_cmd_micron    { return join('', &iso_map("micro", ""), $_[0]); }

# Glyph name => HTML character reference for the ISO-8859-13 code page.
# The keys look like the concatenation of the two arguments the do_cmd_*
# handlers pass to &iso_map (e.g. "sz","lig" -> 'szlig'); &iso_map itself
# is defined elsewhere, so confirm the exact lookup there.
%iso_8859_13_character_map = (
    'AElig',  '&#175;',     # capital AE diphthong (ligature); 191 is the small ae
    'Amacr',  '&#194;',     # capital A, with macron
    'Aogon',  '&#192;',     # capital A, with ogonek
    'Aring',  '&#197;',     # capital A, with ring
    'Auml' ,  '&#196;',     # capital A, dieresis or umlaut mark
    'Cacute', '&#195;',     # capital C, acute accent
    'Ccaron', '&#200;',     # capital C, with caron
    'Eacute', '&#201;',     # capital E, acute accent
    'Edot' ,  '&#203;',     # capital E, with dot
    'Emacr',  '&#199;',     # capital E, with macron
    'Eogon',  '&#198;',     # capital E, with ogonek
    'Euml' ,  '&#203;',     # capital E, dieresis or umlaut mark (same code as Edot)
    'Gcedil', '&#204;',     # capital G, cedilla
    'Imacr',  '&#206;',     # capital I, with macron
    'Iogon',  '&#193;',     # capital I, with ogonek
    'Kcedil', '&#205;',     # capital K, cedilla
    'Lcedil', '&#207;',     # capital L, cedilla
    'Lstrok', '&#217;',     # capital L, with stroke
    'Nacute', '&#209;',     # capital N, acute accent
    'Ncedil', '&#210;',     # capital N, cedilla
    'Oacute', '&#211;',     # capital O, acute accent
    'Omacr',  '&#212;',     # capital O, with macron
    'Oslash', '&#168;',     # capital O, slash
    'Otilde', '&#213;',     # capital O, tilde
    'Ouml',   '&#214;',     # capital O, dieresis or umlaut mark
    'Rcedil', '&#170;',     # capital R, cedil accent
    'Sacute', '&#218;',     # capital S, acute accent
    'Scaron', '&#208;',     # capital S, caron accent
    'Umacr',  '&#219;',     # capital U, with macron
    'Uogon',  '&#216;',     # capital U, with ogonek
    'Uuml' ,  '&#220;',     # capital U, dieresis or umlaut mark
    'Zacute', '&#202;',     # capital Z, acute accent
    'Zcaron', '&#222;',     # capital Z, caron accent
    'Zdot' ,  '&#221;',     # capital Z, with dot
#
    'aelig',  '&#191;',     # small ae diphthong (ligature)
    'amacr',  '&#226;',     # small a, with macron
    'amp',    '&amp;',      # ampersand
    'aogon',  '&#224;',     # small a, with ogonek
    'aring',  '&#229;',     # small a, ring
    'auml' ,  '&#228;',     # small a, dieresis or umlaut mark
    'cacute', '&#227;',     # small c, acute accent
    'ccaron', '&#232;',     # small c, with caron (counterpart of 'Ccaron')
    'cmacr',  '&#232;',     # historical key for the same code; kept for compatibility
    'eacute', '&#233;',     # small e, acute accent
    'edot'  , '&#235;',     # small e, with dot
    'emacr',  '&#231;',     # small e, with macron
    'eogon',  '&#230;',     # small e, with ogonek
    'gcedil', '&#236;',     # small g, cedilla
    'gt',     '&gt;',       # greater than
    'imacr',  '&#238;',     # small i, with macron
    'iogon',  '&#225;',     # small i, with ogonek
    'lstrok', '&#249;',     # small l, with stroke; 241 is the small n acute
    'lt',     '&lt;',       # less than
    'nacute', '&#241;',     # small n, acute accent
    'ncedil', '&#242;',     # small n, cedilla
    'oacute', '&#243;',     # small o, acute accent
    'omacr',  '&#244;',     # small o, with macron
    'oslash', '&#184;',     # small o, slash
    'otilde', '&#245;',     # small o, tilde
    'ouml' ,  '&#246;',     # small o, dieresis or umlaut mark
    'rcedil', '&#186;',     # small r, cedil accent
    'sacute', '&#250;',     # small s, acute accent
    'scaron', '&#240;',     # small s, with caron
    'szlig',  '&#223;',     # small sharp s, German (sz ligature)
    'umacr',  '&#251;',     # small u, with macron
    'uogon',  '&#248;',     # small u, with ogonek
    'uuml' ,  '&#252;',     # small u, dieresis or umlaut mark
    'zdot'  , '&#253;',     # small z, with dot
    'zcaron', '&#254;',     # small z, with caron
    'quot',   '&quot;',     # double quote

# These have HTML mnemonic names for HTML 4.0 ...

    'nbsp', '&#160;',       # non-breaking space
    'rdquo', '&#161;',      # double quote, right
    'cent', '&#162;',       # cents sign
    'pound', '&#163;',      # pound sign
    'curren', '&#164;',     # currency sign
    'dbquo', '&#165;',
    'brvbar', '&#166;',
    'sect', '&#167;',       # section mark
    'copy', '&#169;',       # copyright mark
    'laquo', '&#171;',
    'raquo', '&#187;',
    'not', '&#172;',
    'shy', '&#173;',
    'reg', '&#174;',
    'plusmn', '&#177;',
    'sup1', '&#185;',
    'sup2', '&#178;',
    'sup3', '&#179;',
    'ldquo', '&#180;',
    'micro', '&#181;',
    'para', '&#182;',       # paragraph mark
    'middot', '&#183;',
    'frac14', '&#188;',
    'frac12', '&#189;',
    'frac34', '&#190;',
    'times', '&#215;',
    'divide', '&#247;',
    'rsquo', '&#255;',

# These are character types without arguments ...

    'grave', "`",
    'circ', '^',
    'tilde', '&#126;',
    'dot', '.'
);

# Inverse table: HTML character reference => LaTeX source that produces
# the character.  Where two LaTeX spellings exist, the alternative is kept
# as a commented-out line directly above the active entry, so that each
# key occurs only once.
# NOTE(review): the first key is written as '&#94;' to match its
# neighbours; it may have been a literal '^' -- confirm against upstream.
%iso_8859_13_character_map_inv = (
    '&#94;' , '\\^{}',
    '&gt;' , '\\ensuremath{>}',
    '&lt;' , '\\ensuremath{<}',
    '&amp;' , '\\&',
    '&#126;' , '\\~{}',
    '&#160;' , '\\nobreakspace{}',
    '&#161;' , "{''}",
    '&#162;' , '\\textcent{}',
    '&#163;' , '\\pounds{}',
    '&#164;' , '\\textcurrency{}',
    '&#165;' , '\\quotedblbase{}',
    '&#166;' , '\\textbrokenbar{}',
    '&#167;' , '\\S{}',
    '&#168;' , '\\O{}',
    '&#169;' , '\\copyright{}',
    '&#170;' , '\\c{R}',
    '&#171;' , '\\guillemotleft{}',
    '&#172;' , '\\lnot{}',
    '&#173;' , '\\-',
#   '&#174;' , '\\textregistered{}',
    '&#174;' , '\\ensuremath{\\circledR}',
    '&#175;' , '\\AE{}',
#   '&#176;' , '\\mathdegree{}',
    '&#176;' , '\\ensuremath{^{\\circ}}',
    '&#177;' , '\\ensuremath{\\pm}',
#   '&#178;' , '\\mathtwosuperior{}',
    '&#178;' , '\\ensuremath{^{2}}',
#   '&#179;' , '\\maththreesuperior{}',
    '&#179;' , '\\ensuremath{^{3}}',
    '&#180;' , '{``}',
    '&#181;' , '\\ensuremath{\\mu}',
    '&#182;' , '\\P{}',
#   '&#183;' , '\\textperiodcentered{}',
    '&#183;' , '\\ensuremath{\\cdot{}}',
    '&#184;' , '\\o{}',
#   '&#185;' , '\\mathonesuperior{}',
    '&#185;' , '\\ensuremath{^{1}}',
    '&#186;' , '\\c{r}',
    '&#187;' , '\\guillemotright{}',
#   '&#188;' , '\\textonequarter{}',
    '&#188;' , '\\ensuremath{\\frac{1}{4}}',
#   '&#189;' , '\\textonehalf{}',
    '&#189;' , '\\ensuremath{\\frac{1}{2}}',
#   '&#190;' , '\\textthreequarters{}',
    '&#190;' , '\\ensuremath{\\frac{3}{4}}',
    '&#191;' , '\\ae{}',
    '&#192;' , '\\k{A}',
    '&#193;' , '\\k{I}',
    '&#194;' , '\\={A}',
    '&#195;' , '\\\'{C}',
    '&#196;' , '\\"{A}',
    '&#197;' , '\\r{A}',
    '&#198;' , '\\k{E}',
    '&#199;' , '\\={E}',
    '&#200;' , '\\v{C}',
    '&#201;' , '\\\'{E}',
    '&#202;' , '\\\'{Z}',
    '&#203;' , '\\.{E}',
    '&#204;' , '\\c{G}',
    '&#205;' , '\\c{K}',
    '&#206;' , '\\={I}',
    '&#207;' , '\\c{L}',
    '&#208;' , '\\v{S}',
    '&#209;' , '\\\'{N}',
    '&#210;' , '\\c{N}',
    '&#211;' , '\\\'{O}',
    '&#212;' , '\\={O}',
    '&#213;' , '\\~{O}',
    '&#214;' , '\\"{O}',
    '&#215;' , '\\ensuremath{\\times}',
    '&#216;' , '\\k{U}',
    '&#217;' , '\\L{}',
    '&#218;' , '\\\'{S}',
    '&#219;' , '\\={U}',
    '&#220;' , '\\"{U}',
    '&#221;' , '\\.{Z}',
    '&#222;' , '\\v{Z}',
    '&#223;' , '\\ss{}',
    '&#224;' , '\\k{a}',
    '&#225;' , '\\k{\\i}',
    '&#226;' , '\\={a}',
    '&#227;' , '\\\'{c}',
    '&#228;' , '\\"{a}',
    '&#229;' , '\\r{a}',
    '&#230;' , '\\k{e}',
    '&#231;' , '\\={e}',
    '&#232;' , '\\v{c}',
    '&#233;' , '\\\'{e}',
    '&#234;' , '\\\'{z}',
    '&#235;' , '\\.{e}',
    '&#236;' , '\\c{g}',
    '&#237;' , '\\c{k}',
    '&#238;' , '\\={\\i}',
    '&#239;' , '\\c{l}',
    '&#240;' , '\\v{s}',
    '&#241;' , '\\\'{n}',
    '&#242;' , '\\c{n}',
    '&#243;' , '\\\'{o}',
    '&#244;' , '\\={o}',
    '&#245;' , '\\~{o}',
    '&#246;' , '\\"{o}',
    '&#247;' , '\\ensuremath{\\div}',
    '&#248;' , '\\k{u}',
    '&#249;' , '\\l{}',
    '&#250;' , '\\\'{s}',
    '&#251;' , '\\={u}',
    '&#252;' , '\\"{u}',
    '&#253;' , '\\.{z}',
    '&#254;' , '\\v{z}',
    '&#255;' , "{'}",
);

1;