mirror of
https://github.com/ezyang/htmlpurifier.git
synced 2024-11-14 01:08:41 +00:00
0ad09e5d94
git-svn-id: http://htmlpurifier.org/svnroot/html_purifier/trunk@61 48356398-32a2-884e-a903-53898d9a118a
77 lines
4.0 KiB
Plaintext
77 lines
4.0 KiB
Plaintext
<!-- Special characters for HTML -->
|
|
|
|
<!-- Character entity set. Typical invocation:
|
|
<!ENTITY % HTMLspecial PUBLIC
|
|
"-//W3C//ENTITIES Special//EN//HTML">
|
|
%HTMLspecial; -->
|
|
|
|
<!-- Portions © International Organization for Standardization 1986:
|
|
Permission to copy in any form is granted for use with
|
|
conforming SGML systems and applications as defined in
|
|
ISO 8879, provided this notice is included in all copies.
|
|
-->
|
|
|
|
<!-- Relevant ISO entity set is given unless names are newly introduced.
|
|
New names (i.e., not in ISO 8879 list) do not clash with any
|
|
existing ISO 8879 entity names. ISO 10646 character numbers
|
|
are given for each character, in hex. CDATA values are decimal
|
|
conversions of the ISO 10646 values and refer to the document
|
|
character set. Names are ISO 10646 names.
|
|
|
|
-->
|
|
|
|
<!-- C0 Controls and Basic Latin -->
|
|
<!ENTITY quot CDATA "&#34;" -- quotation mark = APL quote,
|
|
U+0022 ISOnum -->
|
|
<!ENTITY amp CDATA "&#38;" -- ampersand, U+0026 ISOnum -->
|
|
<!ENTITY lt CDATA "&#60;" -- less-than sign, U+003C ISOnum -->
|
|
<!ENTITY gt CDATA "&#62;" -- greater-than sign, U+003E ISOnum -->
|
|
|
|
<!-- Latin Extended-A -->
|
|
<!ENTITY OElig CDATA "&#338;" -- latin capital ligature OE,
|
|
U+0152 ISOlat2 -->
|
|
<!ENTITY oelig CDATA "&#339;" -- latin small ligature oe, U+0153 ISOlat2 -->
|
|
<!-- ligature is a misnomer, this is a separate character in some languages -->
|
|
<!ENTITY Scaron CDATA "&#352;" -- latin capital letter S with caron,
|
|
U+0160 ISOlat2 -->
|
|
<!ENTITY scaron CDATA "&#353;" -- latin small letter s with caron,
|
|
U+0161 ISOlat2 -->
|
|
<!ENTITY Yuml CDATA "&#376;" -- latin capital letter Y with diaeresis,
|
|
U+0178 ISOlat2 -->
|
|
|
|
<!-- Spacing Modifier Letters -->
|
|
<!ENTITY circ CDATA "&#710;" -- modifier letter circumflex accent,
|
|
U+02C6 ISOpub -->
|
|
<!ENTITY tilde CDATA "&#732;" -- small tilde, U+02DC ISOdia -->
|
|
|
|
<!-- General Punctuation -->
|
|
<!ENTITY ensp CDATA "&#8194;" -- en space, U+2002 ISOpub -->
|
|
<!ENTITY emsp CDATA "&#8195;" -- em space, U+2003 ISOpub -->
|
|
<!ENTITY thinsp CDATA "&#8201;" -- thin space, U+2009 ISOpub -->
|
|
<!ENTITY zwnj CDATA "&#8204;" -- zero width non-joiner,
|
|
U+200C NEW RFC 2070 -->
|
|
<!ENTITY zwj CDATA "&#8205;" -- zero width joiner, U+200D NEW RFC 2070 -->
|
|
<!ENTITY lrm CDATA "&#8206;" -- left-to-right mark, U+200E NEW RFC 2070 -->
|
|
<!ENTITY rlm CDATA "&#8207;" -- right-to-left mark, U+200F NEW RFC 2070 -->
|
|
<!ENTITY ndash CDATA "&#8211;" -- en dash, U+2013 ISOpub -->
|
|
<!ENTITY mdash CDATA "&#8212;" -- em dash, U+2014 ISOpub -->
|
|
<!ENTITY lsquo CDATA "&#8216;" -- left single quotation mark,
|
|
U+2018 ISOnum -->
|
|
<!ENTITY rsquo CDATA "&#8217;" -- right single quotation mark,
|
|
U+2019 ISOnum -->
|
|
<!ENTITY sbquo CDATA "&#8218;" -- single low-9 quotation mark, U+201A NEW -->
|
|
<!ENTITY ldquo CDATA "&#8220;" -- left double quotation mark,
|
|
U+201C ISOnum -->
|
|
<!ENTITY rdquo CDATA "&#8221;" -- right double quotation mark,
|
|
U+201D ISOnum -->
|
|
<!ENTITY bdquo CDATA "&#8222;" -- double low-9 quotation mark, U+201E NEW -->
|
|
<!ENTITY dagger CDATA "&#8224;" -- dagger, U+2020 ISOpub -->
|
|
<!ENTITY Dagger CDATA "&#8225;" -- double dagger, U+2021 ISOpub -->
|
|
<!ENTITY permil CDATA "&#8240;" -- per mille sign, U+2030 ISOtech -->
|
|
<!ENTITY lsaquo CDATA "&#8249;" -- single left-pointing angle quotation mark,
|
|
U+2039 ISO proposed -->
|
|
<!-- lsaquo is proposed but not yet ISO standardized -->
|
|
<!ENTITY rsaquo CDATA "&#8250;" -- single right-pointing angle quotation mark,
|
|
U+203A ISO proposed -->
|
|
<!-- rsaquo is proposed but not yet ISO standardized -->
|
|
<!ENTITY euro CDATA "&#8364;" -- euro sign, U+20AC NEW -->