diff options
author | Thomas E. Dickey <dickey@invisible-island.net> | 1999-10-13 14:29:33 -0400 |
---|---|---|
committer | Thomas E. Dickey <dickey@invisible-island.net> | 1999-10-13 14:29:33 -0400 |
commit | 9a7862a61cbb047e3eadda7557bc634cc06f9e02 (patch) | |
tree | c0b317d8fd9f552eb848571702a2f26c897a427a /test | |
parent | 95586cc28c61df18b7a2cd2a9b3ee4c4c83aa583 (diff) | |
download | lynx-snapshots-9a7862a61cbb047e3eadda7557bc634cc06f9e02.tar.gz |
snapshot of project "lynx", label v2-8-3dev_11
Diffstat (limited to 'test')
-rw-r--r-- | test/c1.html | 144 |
1 files changed, 62 insertions, 82 deletions
diff --git a/test/c1.html b/test/c1.html index 0b43ab07..e74f6dba 100644 --- a/test/c1.html +++ b/test/c1.html @@ -1,82 +1,62 @@ -<HTML> -<HEAD> -<TITLE> Test of some symbols </TITLE> -</HEAD> -<BODY> -<PRE> -You may press '\' to view the source of this test - -NCRs for symbols which are the C1 control chars for iso-8859-1 and Unicode, -but assumed as <em>windows-1252</em> codepoints (common for windows-xxxx), -say mercy to MS FrontPage (WYSIWYG HTML editor). - -<em>Number NCR alt-NCR windows-1252</em> - -0x80 € <IMG SRC=X ALT="€"> € #EURO SIGN -0x81  <IMG SRC=X ALT=""> <!----> #NOT USED -0x82 ‚ <IMG SRC=X ALT="‚"> ‚ #SINGLE LOW-9 QUOTATION MARK -0x83 ƒ <IMG SRC=X ALT="ƒ"> ƒ #LATIN SMALL LETTER F WITH HOOK -0x84 „ <IMG SRC=X ALT="„"> „ #DOUBLE LOW-9 QUOTATION MARK -0x85 … <IMG SRC=X ALT="…"> … #HORIZONTAL ELLIPSIS -0x86 † <IMG SRC=X ALT="†"> † #DAGGER -0x87 ‡ <IMG SRC=X ALT="‡"> ‡ #DOUBLE DAGGER -0x88 ˆ <IMG SRC=X ALT="ˆ"> ˆ #MODIFIER LETTER CIRCUMFLEX ACCENT -0x89 ‰ <IMG SRC=X ALT="‰"> ‰ #PER MILLE SIGN -0x8a Š <IMG SRC=X ALT="Š"> Š #LATIN CAPITAL LETTER S WITH CARON -0x8b ‹ <IMG SRC=X ALT="‹"> ‹ #SINGLE LEFT-POINTING ANGLE QUOTATION MARK -0x8c Œ <IMG SRC=X ALT="Œ"> Œ #LATIN CAPITAL LIGATURE OE -0x8d  <IMG SRC=X ALT=""> <!----> #NOT USED -0x8e Ž <IMG SRC=X ALT="Ž"> <!--Ž--> #NOT USED -0x8f  <IMG SRC=X ALT=""> <!----> #NOT USED -0x90  <IMG SRC=X ALT=""> <!----> #NOT USED -0x91 ‘ <IMG SRC=X ALT="‘"> ‘ #LEFT SINGLE QUOTATION MARK -0x92 ’ <IMG SRC=X ALT="’"> ’ #RIGHT SINGLE QUOTATION MARK -0x93 “ <IMG SRC=X ALT="“"> “ #LEFT DOUBLE QUOTATION MARK -0x94 ” <IMG SRC=X ALT="”"> ” #RIGHT DOUBLE QUOTATION MARK -0x95 • <IMG SRC=X ALT="•"> • #BULLET -0x96 – <IMG SRC=X ALT="–"> – #EN DASH -0x97 — <IMG SRC=X ALT="—"> — #EM DASH -0x98 ˜ <IMG SRC=X ALT="˜"> ˜ #SMALL TILDE -0x99 ™ <IMG SRC=X ALT="™"> ™ #TRADE MARK SIGN -0x9a š <IMG SRC=X ALT="š"> š #LATIN SMALL LETTER S WITH CARON -0x9b › <IMG SRC=X ALT="›"> › #SINGLE RIGHT-POINTING ANGLE QUOTATION MARK -0x9c œ <IMG SRC=X ALT="œ"> œ #LATIN SMALL LIGATURE OE -0x9d  <IMG SRC=X ALT=""> <!----> #NOT USED -0x9e ž <IMG SRC=X ALT="ž"> <!--ž--> #NOT USED -0x9f Ÿ <IMG SRC=X ALT="Ÿ"> Ÿ #LATIN CAPITAL LETTER Y WITH DIAERESIS - - -</PRE> -</BODY> -</HTML> - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - +<HTML> +<HEAD> +<TITLE>Test of invalid NCRs 128-159</TITLE> +</HEAD> +<BODY><H2>Test of invalid NCRs 128-159</H2> +<P> +Authoring tools on MS Windows, in particular MS FrontPage ("WYSIWYG" HTML editor), +generate invalid <DFN>Numerical Character References</DFN> for characters +commonly found in positions 128...159 (0x80...0x9f) in Windows fonts. Although +these are valid codepoints for <em>windows-1252</em> (and other +windows-xxxx) charsets, valid NCRs always refer to the document character set +in the SGML sense, not to the character encoding scheme (or charset). For HTML, +the SGML document character set is fixed, it is always a subset of Unicode +(or ISO 10646). In Unicode and its iso-8859-1 subset, values 128...159 are +C1 control characters, they must not appear in HTML. Valid NCRs for the +intended characters use Unicode values greater than 256. +<p> +Lynx tries to interpret some of the invalid codes, by assuming that they are +windows-1252 codepoints. +<PRE> + +You may want to press '\' to view the source of this test. + +<em>Code invalid NCR <!-- --> <tab id=c>valid NCR, description</em> +<em> normal in ALT <a id=table></a> </em> + +0x80 € <IMG SRC=X ALT="€"> <tab to=c>€ #EURO SIGN +0x81  <IMG SRC=X ALT=""> <!----> #NOT USED +0x82 ‚ <IMG SRC=X ALT="‚"> <tab to=c>‚ #SINGLE LOW-9 QUOTATION MARK +0x83 ƒ <IMG SRC=X ALT="ƒ"> <tab to=c>ƒ #LATIN SMALL LETTER F WITH HOOK +0x84 „ <IMG SRC=X ALT="„"> <tab to=c>„ #DOUBLE LOW-9 QUOTATION MARK +0x85 … <IMG SRC=X ALT="…"> <tab to=c>… #HORIZONTAL ELLIPSIS +0x86 † <IMG SRC=X ALT="†"> <tab to=c>† #DAGGER +0x87 ‡ <IMG SRC=X ALT="‡"> <tab to=c>‡ #DOUBLE DAGGER +0x88 ˆ <IMG SRC=X ALT="ˆ"> <tab to=c>ˆ #MODIFIER LETTER CIRCUMFLEX ACCENT +0x89 ‰ <IMG SRC=X ALT="‰"> <tab to=c>‰ #PER MILLE SIGN +0x8a Š <IMG SRC=X ALT="Š"> <tab to=c>Š #LATIN CAPITAL LETTER S WITH CARON +0x8b ‹ <IMG SRC=X ALT="‹"> <tab to=c>‹ #SINGLE LEFT-POINTING ANGLE QUOTATION MARK +0x8c Œ <IMG SRC=X ALT="Œ"> <tab to=c>Œ #LATIN CAPITAL LIGATURE OE +0x8d  <IMG SRC=X ALT=""> <!----> #NOT USED +0x8e Ž <IMG SRC=X ALT="Ž"> <!--Ž--> #NOT USED +0x8f  <IMG SRC=X ALT=""> <!----> #NOT USED +0x90  <IMG SRC=X ALT=""> <!----> #NOT USED +0x91 ‘ <IMG SRC=X ALT="‘"> <tab to=c>‘ #LEFT SINGLE QUOTATION MARK +0x92 ’ <IMG SRC=X ALT="’"> <tab to=c>’ #RIGHT SINGLE QUOTATION MARK +0x93 “ <IMG SRC=X ALT="“"> <tab to=c>“ #LEFT DOUBLE QUOTATION MARK +0x94 ” <IMG SRC=X ALT="”"> <tab to=c>” #RIGHT DOUBLE QUOTATION MARK +0x95 • <IMG SRC=X ALT="•"> <tab to=c>• #BULLET +0x96 – <IMG SRC=X ALT="–"> <tab to=c>– #EN DASH +0x97 — <IMG SRC=X ALT="—"> <tab to=c>— #EM DASH +0x98 ˜ <IMG SRC=X ALT="˜"> <tab to=c>˜ #SMALL TILDE +0x99 ™ <IMG SRC=X ALT="™"> <tab to=c>™ #TRADE MARK SIGN +0x9a š <IMG SRC=X ALT="š"> <tab to=c>š #LATIN SMALL LETTER S WITH CARON +0x9b › <IMG SRC=X ALT="›"> <tab to=c>› #SINGLE RIGHT-POINTING ANGLE QUOTATION MARK +0x9c œ <IMG SRC=X ALT="œ"> <tab to=c>œ #LATIN SMALL LIGATURE OE +0x9d  <IMG SRC=X ALT=""> <!----> #NOT USED +0x9e ž <IMG SRC=X ALT="ž"> <!--ž--> #NOT USED +0x9f Ÿ <IMG SRC=X ALT="Ÿ"> <tab to=c>Ÿ #LATIN CAPITAL LETTER Y WITH DIAERESIS + +</PRE> +</BODY> +</HTML> |