From ae5d181b854d3ccb373b6bc01b4869e44ff4d87a Mon Sep 17 00:00:00 2001 From: Daniel Baumann Date: Sun, 7 Apr 2024 18:37:15 +0200 Subject: Adding upstream version 2.9.0dev.12. Signed-off-by: Daniel Baumann --- test/iso-8859-2.html | 174 +++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 174 insertions(+) create mode 100644 test/iso-8859-2.html (limited to 'test/iso-8859-2.html') diff --git a/test/iso-8859-2.html b/test/iso-8859-2.html new file mode 100644 index 0000000..39380e3 --- /dev/null +++ b/test/iso-8859-2.html @@ -0,0 +1,174 @@ + + + + +Martin Ramsch's character table modified and enhanced for iso8859-2 + + + + + + + + + +

iso8859-2 plus table

+ +
+Description                               Code            Entity name   
+===================================       ============    ==============
+quotation mark                            &#34;  --> "     &quot;   --> "
+ampersand                                 &#38;  --> &     &amp;    --> &
+less-than sign                            &#60;  --> <     &lt;     --> <
+greater-than sign                         &#62;  --> >     &gt;     --> >
+
+Description                          Char Code            Entity name   
+===================================  ==== ============    ==============
+non-breaking space                        &#160; -->      &nbsp;   -->  
+capital A, ogonek                    ¡    &#260; --> Ą    &Aogon;  --> Ą
+breve                               {¢}  {&#728;}-->{˘}  {&breve;} -->{˘}
+capital L, stroke                    £    &#321; --> Ł    &Lstrok; --> Ł
+general currency sign                ¤    &#164; --> ¤    &curren; --> ¤
+capital L, caron                     ¥    &#317; --> Ľ    &Lcaron; --> Ľ
+capital S, acute accent              ¦    &#346; --> Ś    &Sacute; --> Ś
+section sign                         §    &#167; --> §    &sect;   --> §
+umlaut (dieresis)                    ¨    &#168; --> ¨    &uml;    --> ¨
+                                                          &die;    --> ¨
+capital S, caron                     ©    &#352; --> Š    &Scaron; --> Š
+capital S, cedilla                   ª    &#350; --> Ş    &Scedil; --> Ş
+capital T, caron                     «    &#356; --> Ť    &Tcaron; --> Ť
+capital Z, acute accent              ¬    &#377; --> Ź    &Zacute; --> Ź
+soft hyphen                         [­]  [&#173;]-->[­]  [&shy;]   -->[­]
+capital Z, caron                     ®    &#381; --> Ž    &Zcaron; --> Ž
+capital Z, dot above                 ¯    &#379; --> Ż    &Zdot;   --> Ż
+degree sign                          °    &#176; --> °    &deg;    --> °
+small a, ogonek                      ±    &#261; --> ą    &aogon;  --> ą
+ogonek                              {²}  {&#731;}-->{˛}  {&ogon;}  -->{˛}
+small l, stroke                      ³    &#322; --> ł    &lstrok; --> ł
+acute accent                         ´    &#180; --> ´    &acute;  --> ´
+small l, caron                       µ    &#318; --> ľ    &lcaron; --> ľ
+small s, acute accent                ¶    &#347; --> ś    &sacute; --> ś
+caron                               {·}  {&#711;}-->{ˇ}  {&caron;} -->{ˇ}
+cedilla                              ¸    &#184; --> ¸    &cedil;  --> ¸
+small s, caron                       ¹    &#353; --> š    &scaron; --> š
+small s, cedilla                     º    &#351; --> ş    &scedil; --> ş
+small t, caron                       »    &#357; --> ť    &tcaron; --> ť
+small z, acute accent                ¼    &#378; --> ź    &zacute; --> ź
+double acute accent                 {½}  {&#733;}-->{˝}  {&dblac;} -->{˝}
+small z, caron                       ¾    &#382; --> ž    &zcaron; --> ž
+small z, dot above                   ¿    &#380; --> ż    &zdot;   --> ż  
+capital R, acute accent              À    &#340; --> Ŕ    &Racute; --> Ŕ
+capital A, acute accent              Á    &#193; --> Á    &Aacute; --> Á
+capital A, circumflex accent         Â    &#194; --> Â    &Acirc;  --> Â
+capital A, breve                     Ã    &#258; --> Ă    &Abreve; --> Ă
+capital A, dieresis or umlaut mark   Ä    &#196; --> Ä    &Auml;   --> Ä
+capital L, acute accent              Å    &#313; --> Ĺ    &Lacute; --> Ĺ
+capital C, acute accent              Æ    &#262; --> Ć    &Cacute; --> Ć
+capital C, cedilla                   Ç    &#199; --> Ç    &Ccedil; --> Ç
+capital C, caron                     È    &#268; --> Č    &Ccaron; --> Č
+capital E, acute accent              É    &#201; --> É    &Eacute; --> É
+capital E, ogonek                    Ê    &#280; --> Ę    &Eogon;  --> Ę
+capital E, dieresis or umlaut mark   Ë    &#203; --> Ë    &Euml;   --> Ë
+capital E, caron                     Ì    &#282; --> Ě    &Ecaron; --> Ě
+capital I, acute accent              Í    &#205; --> Í    &Iacute; --> Í
+capital I, circumflex accent         Î    &#206; --> Î    &Icirc;  --> Î
+capital D, caron                     Ï    &#270; --> Ď    &Dcaron; --> Ď
+capital D, stroke                    Ð    &#272; --> Đ    &Dstrok; --> Đ
+capital Eth, Icelandic               N/A  &#208; --> Ð    &ETH;    --> Ð
+capital N, acute accent              Ñ    &#323; --> Ń    &Nacute; --> Ń
+capital N, caron                     Ò    &#327; --> Ň    &Ncaron; --> Ň
+capital O, acute accent              Ó    &#211; --> Ó    &Oacute; --> Ó
+capital O, circumflex accent         Ô    &#212; --> Ô    &Ocirc;  --> Ô
+capital O, double acute accent       Õ    &#336; --> Ő    &Odblac; --> Ő
+capital O, dieresis or umlaut mark   Ö    &#214; --> Ö    &Ouml;   --> Ö
+multiply sign                        ×    &#215; --> ×    &times;  --> ×
+capital R, caron                     Ø    &#344; --> Ř    &Rcaron; --> Ř
+capital U, ring                      Ù    &#366; --> Ů    &Uring;  --> Ů
+capital U, acute accent              Ú    &#218; --> Ú    &Uacute; --> Ú
+capital U, double acute accent       Û    &#368; --> Ű    &Udblac; --> Ű
+capital U, dieresis or umlaut mark   Ü    &#220; --> Ü    &Uuml;   --> Ü
+capital Y, acute accent              Ý    &#221; --> Ý    &Yacute; --> Ý
+capital T, cedilla                   Þ    &#354; --> Ţ    &Tcedil; --> Ţ
+small sharp s, German (sz ligature)  ß    &#223; --> ß    &szlig;  --> ß
+small r, acute accent                à    &#341; --> ŕ    &racute; --> ŕ
+small a, acute accent                á    &#225; --> á    &aacute; --> á
+small a, circumflex accent           â    &#226; --> â    &acirc;  --> â
+small a, breve                       ã    &#259; --> ă    &abreve; --> ă
+small a, dieresis or umlaut mark     ä    &#228; --> ä    &auml;   --> ä
+small l, acute accent                å    &#314; --> ĺ    &lacute; --> ĺ
+small c, acute accent                æ    &#263; --> ć    &cacute; --> ć
+small c, cedilla                     ç    &#231; --> ç    &ccedil; --> ç
+small c, caron                       è    &#269; --> č    &ccaron; --> č
+small e, acute accent                é    &#233; --> é    &eacute; --> é
+small e, ogonek                      ê    &#281; --> ę    &eogon;  --> ę
+small e, dieresis or umlaut mark     ë    &#235; --> ë    &euml;   --> ë
+small e, caron                       ì    &#283; --> ě    &ecaron; --> ě
+small i, acute accent                í    &#237; --> í    &iacute; --> í
+small i, circumflex accent           î    &#238; --> î    &icirc;  --> î
+small d, caron                       ï    &#271; --> ď    &dcaron; --> ď
+small d, stroke                      ð    &#273; --> đ    &dstrok; --> đ
+small eth, Icelandic                 N/A  &#240; --> ð    &eth;    --> ð
+small n, acute accent                ñ    &#324; --> ń    &nacute; --> ń
+small n, caron                       ò    &#328; --> ň    &ncaron; --> ň
+small o, acute accent                ó    &#243; --> ó    &oacute; --> ó
+small o, circumflex accent           ô    &#244; --> ô    &ocirc;  --> ô
+small o, double acute accent         õ    &#337; --> ő    &odblac; --> ő
+small o, dieresis or umlaut mark     ö    &#246; --> ö    &ouml;   --> ö
+division sign                        ÷    &#247; --> ÷    &divide; --> ÷
+small r, caron                       ø    &#345; --> ř    &rcaron; --> ř
+small u, ring                        ù    &#367; --> ů    &uring;  --> ů
+small u, acute accent                ú    &#250; --> ú    &uacute; --> ú
+small u, double acute accent         û    &#369; --> ű    &udblac; --> ű
+small u, dieresis or umlaut mark     ü    &#252; --> ü    &uuml;   --> ü
+small y, acute accent                ý    &#253; --> ý    &yacute; --> ý
+small t, cedilla                     þ    &#355; --> ţ    &tcedil; --> ţ
+dot above                           {ÿ}  {&#729;}-->{˙}  {&dot;}   -->{˙}
+
+Some other characters of interest    Char Code            Entity name   
+===================================  ==== ============    ==============
+capital AE diphthong (ligature)      N/A  &#198; --> Æ    &AElig;  --> Æ
+small ae diphthong (ligature)        N/A  &#230; --> æ    &aelig;  --> æ
+capital OE ligature                  N/A {&#338;}-->{Œ}  {&OElig;} -->{Œ}
+small oe ligature                    N/A {&#339;}-->{œ}  {&oelig;} -->{œ}
+copyright                            N/A  &#169; --> ©    &copy;   --> ©
+registered trademark                 N/A  &#174; --> ®    &reg;    --> ®
+trademark sign                       N/A  &#8482;--> ™   &trade;  --> ™
+em space                             N/A [&#8195;]->[ ] [&emsp;]  -->[ ]
+en space                             N/A [&#8194;]->[ ] [&ensp;]  -->[ ]
+1/3-em space                         N/A [&#8196;]->[ ] [&emsp13;] -->[ ]
+1/4-em space                         N/A [&#8197;]->[ ] [&emsp14;] -->[ ]
+thin space                           N/A [&#8201;]->[ ] [&thinsp;]-->[ ]
+hair space                           N/A [&#8202;]->[ ] [&hairsp;]-->[ ]
+em dash                              N/A [&#8212;]->[—] [&mdash;] -->[—]
+en dash                              N/A [&#8211;]->[–] [&ndash;] -->[–]
+
+
+ +
+

+Characters not found in ISO-8859-2 have "N/A" in the Char column. +Some characters for which I could not find entity names in either +RFC 2070 +or the +ISOlat1, ISOlat2, ISOnum, ISOpub and ISOtech +sets (the ones included by Peter Flynn's +HTML Pro DTD) +are shown enclosed in {braces}. +

+

+There is also a variation of this table which tests +ISO-8859-2 characters and entities in ALT attributes. +

+

+See Martin Ramsch's original +ISO-8859-1 Table +for related info and links, and for some notes on entity names. +This file is mostly just an adaptation of his table +to the ISO-8859-2 character set. +

+
+ +
kweide@tezcat.com 1997-03-09
+ + + -- cgit v1.2.3