text 查找HTML字符实体并将引用转换为XQuery中与XML兼容的字符
Posted
tags:
篇首语:本文由小常识网(cha138.com)小编为大家整理,主要介绍了text 查找HTML字符实体并将引用转换为XQuery中与XML兼容的字符相关的知识,希望对你有一定的参考价值。
xquery version "3.1";
let $json-string := ``[
[
[
"quot",
""",
"quotation mark (APL quote)"
],
[
"amp",
"&",
"ampersand"
],
[
"apos",
"'",
"apostrophe (apostrophe-quote)"
],
[
"lt",
"<",
"less-than sign"
],
[
"gt",
">",
"greater-than sign"
],
[
"nbsp",
" ",
"no-break space (non-breaking space)"
],
[
"iexcl",
"¡",
"inverted exclamation mark"
],
[
"cent",
"¢",
"cent sign"
],
[
"pound",
"£",
"pound sign"
],
[
"curren",
"¤",
"currency sign"
],
[
"yen",
"¥",
"yen sign (yuan sign)"
],
[
"brvbar",
"¦",
"broken bar (broken vertical bar)"
],
[
"sect",
"§",
"section sign"
],
[
"uml",
"¨",
"diaeresis (spacing diaeresis); see Germanic umlaut"
],
[
"copy",
"©",
"copyright symbol"
],
[
"ordf",
"ª",
"feminine ordinal indicator"
],
[
"laquo",
"«",
"left-pointing double angle quotation mark (left pointing guillemet)"
],
[
"not",
"¬",
"not sign"
],
[
"shy",
"­",
"soft hyphen (discretionary hyphen)"
],
[
"reg",
"®",
"registered sign (registered trademark symbol)"
],
[
"macr",
"¯",
"macron (spacing macron, overline, APL overbar)"
],
[
"deg",
"°",
"degree symbol"
],
[
"plusmn",
"±",
"plus-minus sign (plus-or-minus sign)"
],
[
"sup2",
"²",
"superscript two (superscript digit two, squared)"
],
[
"sup3",
"³",
"superscript three (superscript digit three, cubed)"
],
[
"acute",
"´",
"acute accent (spacing acute)"
],
[
"micro",
"µ",
"micro sign"
],
[
"para",
"¶",
"pilcrow sign (paragraph sign)"
],
[
"middot",
"·",
"middle dot (Georgian comma, Greek middle dot)"
],
[
"cedil",
"¸",
"cedilla (spacing cedilla)"
],
[
"sup1",
"¹",
"superscript one (superscript digit one)"
],
[
"ordm",
"º",
"masculine ordinal indicator"
],
[
"raquo",
"»",
"right-pointing double angle quotation mark (right pointing guillemet)"
],
[
"frac14",
"¼",
"vulgar fraction one quarter (fraction one quarter)"
],
[
"frac12",
"½",
"vulgar fraction one half (fraction one half)"
],
[
"frac34",
"¾",
"vulgar fraction three quarters (fraction three quarters)"
],
[
"iquest",
"¿",
"inverted question mark (turned question mark)"
],
[
"Agrave",
"À",
"Latin capital letter A with grave accent (Latin capital letter A grave)"
],
[
"Aacute",
"Á",
"Latin capital letter A with acute accent"
],
[
"Acirc",
"Â",
"Latin capital letter A with circumflex"
],
[
"Atilde",
"Ã",
"Latin capital letter A with tilde"
],
[
"Auml",
"Ä",
"Latin capital letter A with diaeresis"
],
[
"Aring",
"Å",
"Latin capital letter A with ring above (Latin capital letter A ring)"
],
[
"AElig",
"Æ",
"Latin capital letter AE (Latin capital ligature AE)"
],
[
"Ccedil",
"Ç",
"Latin capital letter C with cedilla"
],
[
"Egrave",
"È",
"Latin capital letter E with grave accent"
],
[
"Eacute",
"É",
"Latin capital letter E with acute accent"
],
[
"Ecirc",
"Ê",
"Latin capital letter E with circumflex"
],
[
"Euml",
"Ë",
"Latin capital letter E with diaeresis"
],
[
"Igrave",
"Ì",
"Latin capital letter I with grave accent"
],
[
"Iacute",
"Í",
"Latin capital letter I with acute accent"
],
[
"Icirc",
"Î",
"Latin capital letter I with circumflex"
],
[
"Iuml",
"Ï",
"Latin capital letter I with diaeresis"
],
[
"ETH",
"Ð",
"Latin capital letter Eth"
],
[
"Ntilde",
"Ñ",
"Latin capital letter N with tilde"
],
[
"Ograve",
"Ò",
"Latin capital letter O with grave accent"
],
[
"Oacute",
"Ó",
"Latin capital letter O with acute accent"
],
[
"Ocirc",
"Ô",
"Latin capital letter O with circumflex"
],
[
"Otilde",
"Õ",
"Latin capital letter O with tilde"
],
[
"Ouml",
"Ö",
"Latin capital letter O with diaeresis"
],
[
"times",
"×",
"multiplication sign"
],
[
"Oslash",
"Ø",
"Latin capital letter O with stroke (Latin capital letter O slash)"
],
[
"Ugrave",
"Ù",
"Latin capital letter U with grave accent"
],
[
"Uacute",
"Ú",
"Latin capital letter U with acute accent"
],
[
"Ucirc",
"Û",
"Latin capital letter U with circumflex"
],
[
"Uuml",
"Ü",
"Latin capital letter U with diaeresis"
],
[
"Yacute",
"Ý",
"Latin capital letter Y with acute accent"
],
[
"THORN",
"Þ",
"Latin capital letter THORN"
],
[
"szlig",
"ß",
"Latin small letter sharp s (ess-zed); see German Eszett"
],
[
"agrave",
"à",
"Latin small letter a with grave accent"
],
[
"aacute",
"á",
"Latin small letter a with acute accent"
],
[
"acirc",
"â",
"Latin small letter a with circumflex"
],
[
"atilde",
"ã",
"Latin small letter a with tilde"
],
[
"auml",
"ä",
"Latin small letter a with diaeresis"
],
[
"aring",
"å",
"Latin small letter a with ring above"
],
[
"aelig",
"æ",
"Latin small letter ae (Latin small ligature ae)"
],
[
"ccedil",
"ç",
"Latin small letter c with cedilla"
],
[
"egrave",
"è",
"Latin small letter e with grave accent"
],
[
"eacute",
"é",
"Latin small letter e with acute accent"
],
[
"ecirc",
"ê",
"Latin small letter e with circumflex"
],
[
"euml",
"ë",
"Latin small letter e with diaeresis"
],
[
"igrave",
"ì",
"Latin small letter i with grave accent"
],
[
"iacute",
"í",
"Latin small letter i with acute accent"
],
[
"icirc",
"î",
"Latin small letter i with circumflex"
],
[
"iuml",
"ï",
"Latin small letter i with diaeresis"
],
[
"eth",
"ð",
"Latin small letter eth"
],
[
"ntilde",
"ñ",
"Latin small letter n with tilde"
],
[
"ograve",
"ò",
"Latin small letter o with grave accent"
],
[
"oacute",
"ó",
"Latin small letter o with acute accent"
],
[
"ocirc",
"ô",
"Latin small letter o with circumflex"
],
[
"otilde",
"õ",
"Latin small letter o with tilde"
],
[
"ouml",
"ö",
"Latin small letter o with diaeresis"
],
[
"divide",
"÷",
"division sign (obelus)"
],
[
"oslash",
"ø",
"Latin small letter o with stroke (Latin small letter o slash)"
],
[
"ugrave",
"ù",
"Latin small letter u with grave accent"
],
[
"uacute",
"ú",
"Latin small letter u with acute accent"
],
[
"ucirc",
"û",
"Latin small letter u with circumflex"
],
[
"uuml",
"ü",
"Latin small letter u with diaeresis"
],
[
"yacute",
"ý",
"Latin small letter y with acute accent"
],
[
"thorn",
"þ",
"Latin small letter thorn"
],
[
"yuml",
"ÿ",
"Latin small letter y with diaeresis"
],
[
"OElig",
"Œ",
"Latin capital ligature oe"
],
[
"oelig",
"œ",
"Latin small ligature oe"
],
[
"Scaron",
"Š",
"Latin capital letter s with caron"
],
[
"scaron",
"š",
"Latin small letter s with caron"
],
[
"Yuml",
"Ÿ",
"Latin capital letter y with diaeresis"
],
[
"fnof",
"ƒ",
"Latin small letter f with hook (function, florin)"
],
[
"circ",
"ˆ",
"modifier letter circumflex accent"
],
[
"tilde",
"˜",
"small tilde"
],
[
"Alpha",
"Α",
"Greek capital letter Alpha"
],
[
"Beta",
"Β",
"Greek capital letter Beta"
],
[
"Gamma",
"Γ",
"Greek capital letter Gamma"
],
[
"Delta",
"Δ",
"Greek capital letter Delta"
],
[
"Epsilon",
"Ε",
"Greek capital letter Epsilon"
],
[
"Zeta",
"Ζ",
"Greek capital letter Zeta"
],
[
"Eta",
"Η",
"Greek capital letter Eta"
],
[
"Theta",
"Θ",
"Greek capital letter Theta"
],
[
"Iota",
"Ι",
"Greek capital letter Iota"
],
[
"Kappa",
"Κ",
"Greek capital letter Kappa"
],
[
"Lambda",
"Λ",
"Greek capital letter Lambda"
],
[
"Mu",
"Μ",
"Greek capital letter Mu"
],
[
"Nu",
"Ν",
"Greek capital letter Nu"
],
[
"Xi",
"Ξ",
"Greek capital letter Xi"
],
[
"Omicron",
"Ο",
"Greek capital letter Omicron"
],
[
"Pi",
"Π",
"Greek capital letter Pi"
],
[
"Rho",
"Ρ",
"Greek capital letter Rho"
],
[
"Sigma",
"Σ",
"Greek capital letter Sigma"
],
[
"Tau",
"Τ",
"Greek capital letter Tau"
],
[
"Upsilon",
"Υ",
"Greek capital letter Upsilon"
],
[
"Phi",
"Φ",
"Greek capital letter Phi"
],
[
"Chi",
"Χ",
"Greek capital letter Chi"
],
[
"Psi",
"Ψ",
"Greek capital letter Psi"
],
[
"Omega",
"Ω",
"Greek capital letter Omega"
],
[
"alpha",
"α",
"Greek small letter alpha"
],
[
"beta",
"β",
"Greek small letter beta"
],
[
"gamma",
"γ",
"Greek small letter gamma"
],
[
"delta",
"δ",
"Greek small letter delta"
],
[
"epsilon",
"ε",
"Greek small letter epsilon"
],
[
"zeta",
"ζ",
"Greek small letter zeta"
],
[
"eta",
"η",
"Greek small letter eta"
],
[
"theta",
"θ",
"Greek small letter theta"
],
[
"iota",
"ι",
"Greek small letter iota"
],
[
"kappa",
"κ",
"Greek small letter kappa"
],
[
"lambda",
"λ",
"Greek small letter lambda"
],
[
"mu",
"μ",
"Greek small letter mu"
],
[
"nu",
"ν",
"Greek small letter nu"
],
[
"xi",
"ξ",
"Greek small letter xi"
],
[
"omicron",
"ο",
"Greek small letter omicron"
],
[
"pi",
"π",
"Greek small letter pi"
],
[
"rho",
"ρ",
"Greek small letter rho"
],
[
"sigmaf",
"ς",
"Greek small letter final sigma"
],
[
"sigma",
"σ",
"Greek small letter sigma"
],
[
"tau",
"τ",
"Greek small letter tau"
],
[
"upsilon",
"υ",
"Greek small letter upsilon"
],
[
"phi",
"φ",
"Greek small letter phi"
],
[
"chi",
"χ",
"Greek small letter chi"
],
[
"psi",
"ψ",
"Greek small letter psi"
],
[
"omega",
"ω",
"Greek small letter omega"
],
[
"thetasym",
"ϑ",
"Greek theta symbol"
],
[
"upsih",
"ϒ",
"Greek Upsilon with hook symbol"
],
[
"piv",
"ϖ",
"Greek pi symbol"
],
[
"ensp",
" ",
"en space"
],
[
"emsp",
" ",
"em space"
],
[
"thinsp",
" ",
"thin space"
],
[
"zwnj",
"‌",
"zero-width non-joiner"
],
[
"zwj",
"‍",
"zero-width joiner"
],
[
"lrm",
"‎",
"left-to-right mark"
],
[
"rlm",
"‏",
"right-to-left mark"
],
[
"ndash",
"–",
"en dash"
],
[
"mdash",
"—",
"em dash"
],
[
"lsquo",
"‘",
"left single quotation mark"
],
[
"rsquo",
"’",
"right single quotation mark"
],
[
"sbquo",
"‚",
"single low-9 quotation mark"
],
[
"ldquo",
"“",
"left double quotation mark"
],
[
"rdquo",
"”",
"right double quotation mark"
],
[
"bdquo",
"„",
"double low-9 quotation mark"
],
[
"dagger",
"†",
"dagger, obelisk"
],
[
"Dagger",
"‡",
"double dagger, double obelisk"
],
[
"bull",
"•",
"bullet (black small circle)"
],
[
"hellip",
"…",
"horizontal ellipsis (three dot leader)"
],
[
"permil",
"‰",
"per mille sign"
],
[
"prime",
"′",
"prime (minutes, feet)"
],
[
"Prime",
"″",
"double prime (seconds, inches)"
],
[
"lsaquo",
"‹",
"single left-pointing angle quotation mark"
],
[
"rsaquo",
"›",
"single right-pointing angle quotation mark"
],
[
"oline",
"‾",
"overline (spacing overscore)"
],
[
"frasl",
"⁄",
"fraction slash (solidus)"
],
[
"euro",
"€",
"euro sign"
],
[
"image",
"ℑ",
"black-letter capital I (imaginary part)"
],
[
"weierp",
"℘",
"script capital P (power set, Weierstrass p)"
],
[
"real",
"ℜ",
"black-letter capital R (real part symbol)"
],
[
"trade",
"™",
"trademark symbol"
],
[
"alefsym",
"ℵ",
"alef symbol (first transfinite cardinal)"
],
[
"larr",
"←",
"leftwards arrow"
],
[
"uarr",
"↑",
"upwards arrow"
],
[
"rarr",
"→",
"rightwards arrow"
],
[
"darr",
"↓",
"downwards arrow"
],
[
"harr",
"↔",
"left right arrow"
],
[
"crarr",
"↵",
"downwards arrow with corner leftwards (carriage return)"
],
[
"lArr",
"⇐",
"leftwards double arrow"
],
[
"uArr",
"⇑",
"upwards double arrow"
],
[
"rArr",
"⇒",
"rightwards double arrow"
],
[
"dArr",
"⇓",
"downwards double arrow"
],
[
"hArr",
"⇔",
"left right double arrow"
],
[
"forall",
"∀",
"for all"
],
[
"part",
"∂",
"partial differential"
],
[
"exist",
"∃",
"there exists"
],
[
"empty",
"∅",
"empty set (null set); see also U+8960, ⌀"
],
[
"nabla",
"∇",
"del or nabla (vector differential operator)"
],
[
"isin",
"∈",
"element of"
],
[
"notin",
"∉",
"not an element of"
],
[
"ni",
"∋",
"contains as member"
],
[
"prod",
"∏",
"n-ary product (product sign)"
],
[
"sum",
"∑",
"n-ary summation"
],
[
"minus",
"−",
"minus sign"
],
[
"lowast",
"∗",
"asterisk operator"
],
[
"radic",
"√",
"square root (radical sign)"
],
[
"prop",
"∝",
"proportional to"
],
[
"infin",
"∞",
"infinity"
],
[
"ang",
"∠",
"angle"
],
[
"and",
"∧",
"logical and (wedge)"
],
[
"or",
"∨",
"logical or (vee)"
],
[
"cap",
"∩",
"intersection (cap)"
],
[
"cup",
"∪",
"union (cup)"
],
[
"int",
"∫",
"integral"
],
[
"there4",
"∴",
"therefore sign"
],
[
"sim",
"∼",
"tilde operator (varies with, similar to)"
],
[
"cong",
"≅",
"congruent to"
],
[
"asymp",
"≈",
"almost equal to (asymptotic to)"
],
[
"ne",
"≠",
"not equal to"
],
[
"equiv",
"≡",
"identical to; sometimes used for 'equivalent to'"
],
[
"le",
"≤",
"less-than or equal to"
],
[
"ge",
"≥",
"greater-than or equal to"
],
[
"sub",
"⊂",
"subset of"
],
[
"sup",
"⊃",
"superset of"
],
[
"nsub",
"⊄",
"not a subset of"
],
[
"sube",
"⊆",
"subset of or equal to"
],
[
"supe",
"⊇",
"superset of or equal to"
],
[
"oplus",
"⊕",
"circled plus (direct sum)"
],
[
"otimes",
"⊗",
"circled times (vector product)"
],
[
"perp",
"⊥",
"up tack (orthogonal to, perpendicular)"
],
[
"sdot",
"⋅",
"dot operator"
],
[
"lceil",
"⌈",
"left ceiling (APL upstile)"
],
[
"rceil",
"⌉",
"right ceiling"
],
[
"lfloor",
"⌊",
"left floor (APL downstile)"
],
[
"rfloor",
"⌋",
"right floor"
],
[
"lang",
"〈",
"left-pointing angle bracket (bra)"
],
[
"rang",
"〉",
"right-pointing angle bracket (ket)"
],
[
"loz",
"◊",
"lozenge"
],
[
"spades",
"♠",
"black spade suit"
],
[
"clubs",
"♣",
"black club suit (shamrock)"
],
[
"hearts",
"♥",
"black heart suit (valentine)"
],
[
"diams",
"♦",
"black diamond suit"
]
]
]``
let $json := parse-json($json-string)
let $entities :=
for $array in $json?*
return
map {
$array?1: map {
"character": parse-xml-fragment($array?2)/string(),
"name": $array?1,
"escape-sequence": $array?2,
"description": $array?3
}
}
return
$entities
xquery version "3.1";
(:~ A module containing a lookup table, in the form of a map, for HTML entities
: that aren't defined in XML, and a function for converting HTML entities in
: strings to the appropriate characters. Look up characters via map lookup:
:
: $entities:entities?ograve?character => ò
:
: @author Joe Wicentowski
: @see https://en.wikipedia.org/wiki/List_of_XML_and_HTML_character_entity_references#Character_entity_references_in_HTML
: @see https://gist.github.com/lcahlander/b040744256b81f881c583169e4f7b4d0
: :)
module namespace entities = "http://joewiz.org/ns/xquery/entities";
(:~ A map for looking up HTML entities that aren't defined in XML :)
declare variable $entities:entities as map(*)+ := (
map {
"quot": map {
"character": """",
"name": "quot",
"escape-sequence": """,
"description": "quotation mark (APL quote)"
}
},map {
"amp": map {
"character": "&",
"name": "amp",
"escape-sequence": "&",
"description": "ampersand"
}
},map {
"apos": map {
"character": "'",
"name": "apos",
"escape-sequence": "'",
"description": "apostrophe (apostrophe-quote)"
}
},map {
"lt": map {
"character": "<",
"name": "lt",
"escape-sequence": "<",
"description": "less-than sign"
}
},map {
"gt": map {
"character": ">",
"name": "gt",
"escape-sequence": ">",
"description": "greater-than sign"
}
},map {
"nbsp": map {
"character": " ",
"name": "nbsp",
"escape-sequence": " ",
"description": "no-break space (non-breaking space)"
}
},map {
"iexcl": map {
"character": "¡",
"name": "iexcl",
"escape-sequence": "¡",
"description": "inverted exclamation mark"
}
},map {
"cent": map {
"character": "¢",
"name": "cent",
"escape-sequence": "¢",
"description": "cent sign"
}
},map {
"pound": map {
"character": "£",
"name": "pound",
"escape-sequence": "£",
"description": "pound sign"
}
},map {
"curren": map {
"character": "¤",
"name": "curren",
"escape-sequence": "¤",
"description": "currency sign"
}
},map {
"yen": map {
"character": "¥",
"name": "yen",
"escape-sequence": "¥",
"description": "yen sign (yuan sign)"
}
},map {
"brvbar": map {
"character": "¦",
"name": "brvbar",
"escape-sequence": "¦",
"description": "broken bar (broken vertical bar)"
}
},map {
"sect": map {
"character": "§",
"name": "sect",
"escape-sequence": "§",
"description": "section sign"
}
},map {
"uml": map {
"character": "¨",
"name": "uml",
"escape-sequence": "¨",
"description": "diaeresis (spacing diaeresis); see Germanic umlaut"
}
},map {
"copy": map {
"character": "©",
"name": "copy",
"escape-sequence": "©",
"description": "copyright symbol"
}
},map {
"ordf": map {
"character": "ª",
"name": "ordf",
"escape-sequence": "ª",
"description": "feminine ordinal indicator"
}
},map {
"laquo": map {
"character": "«",
"name": "laquo",
"escape-sequence": "«",
"description": "left-pointing double angle quotation mark (left pointing guillemet)"
}
},map {
"not": map {
"character": "¬",
"name": "not",
"escape-sequence": "¬",
"description": "not sign"
}
},map {
"shy": map {
"character": "",
"name": "shy",
"escape-sequence": "­",
"description": "soft hyphen (discretionary hyphen)"
}
},map {
"reg": map {
"character": "®",
"name": "reg",
"escape-sequence": "®",
"description": "registered sign (registered trademark symbol)"
}
},map {
"macr": map {
"character": "¯",
"name": "macr",
"escape-sequence": "¯",
"description": "macron (spacing macron, overline, APL overbar)"
}
},map {
"deg": map {
"character": "°",
"name": "deg",
"escape-sequence": "°",
"description": "degree symbol"
}
},map {
"plusmn": map {
"character": "±",
"name": "plusmn",
"escape-sequence": "±",
"description": "plus-minus sign (plus-or-minus sign)"
}
},map {
"sup2": map {
"character": "²",
"name": "sup2",
"escape-sequence": "²",
"description": "superscript two (superscript digit two, squared)"
}
},map {
"sup3": map {
"character": "³",
"name": "sup3",
"escape-sequence": "³",
"description": "superscript three (superscript digit three, cubed)"
}
},map {
"acute": map {
"character": "´",
"name": "acute",
"escape-sequence": "´",
"description": "acute accent (spacing acute)"
}
},map {
"micro": map {
"character": "µ",
"name": "micro",
"escape-sequence": "µ",
"description": "micro sign"
}
},map {
"para": map {
"character": "¶",
"name": "para",
"escape-sequence": "¶",
"description": "pilcrow sign (paragraph sign)"
}
},map {
"middot": map {
"character": "·",
"name": "middot",
"escape-sequence": "·",
"description": "middle dot (Georgian comma, Greek middle dot)"
}
},map {
"cedil": map {
"character": "¸",
"name": "cedil",
"escape-sequence": "¸",
"description": "cedilla (spacing cedilla)"
}
},map {
"sup1": map {
"character": "¹",
"name": "sup1",
"escape-sequence": "¹",
"description": "superscript one (superscript digit one)"
}
},map {
"ordm": map {
"character": "º",
"name": "ordm",
"escape-sequence": "º",
"description": "masculine ordinal indicator"
}
},map {
"raquo": map {
"character": "»",
"name": "raquo",
"escape-sequence": "»",
"description": "right-pointing double angle quotation mark (right pointing guillemet)"
}
},map {
"frac14": map {
"character": "¼",
"name": "frac14",
"escape-sequence": "¼",
"description": "vulgar fraction one quarter (fraction one quarter)"
}
},map {
"frac12": map {
"character": "½",
"name": "frac12",
"escape-sequence": "½",
"description": "vulgar fraction one half (fraction one half)"
}
},map {
"frac34": map {
"character": "¾",
"name": "frac34",
"escape-sequence": "¾",
"description": "vulgar fraction three quarters (fraction three quarters)"
}
},map {
"iquest": map {
"character": "¿",
"name": "iquest",
"escape-sequence": "¿",
"description": "inverted question mark (turned question mark)"
}
},map {
"Agrave": map {
"character": "À",
"name": "Agrave",
"escape-sequence": "À",
"description": "Latin capital letter A with grave accent (Latin capital letter A grave)"
}
},map {
"Aacute": map {
"character": "Á",
"name": "Aacute",
"escape-sequence": "Á",
"description": "Latin capital letter A with acute accent"
}
},map {
"Acirc": map {
"character": "Â",
"name": "Acirc",
"escape-sequence": "Â",
"description": "Latin capital letter A with circumflex"
}
},map {
"Atilde": map {
"character": "Ã",
"name": "Atilde",
"escape-sequence": "Ã",
"description": "Latin capital letter A with tilde"
}
},map {
"Auml": map {
"character": "Ä",
"name": "Auml",
"escape-sequence": "Ä",
"description": "Latin capital letter A with diaeresis"
}
},map {
"Aring": map {
"character": "Å",
"name": "Aring",
"escape-sequence": "Å",
"description": "Latin capital letter A with ring above (Latin capital letter A ring)"
}
},map {
"AElig": map {
"character": "Æ",
"name": "AElig",
"escape-sequence": "Æ",
"description": "Latin capital letter AE (Latin capital ligature AE)"
}
},map {
"Ccedil": map {
"character": "Ç",
"name": "Ccedil",
"escape-sequence": "Ç",
"description": "Latin capital letter C with cedilla"
}
},map {
"Egrave": map {
"character": "È",
"name": "Egrave",
"escape-sequence": "È",
"description": "Latin capital letter E with grave accent"
}
},map {
"Eacute": map {
"character": "É",
"name": "Eacute",
"escape-sequence": "É",
"description": "Latin capital letter E with acute accent"
}
},map {
"Ecirc": map {
"character": "Ê",
"name": "Ecirc",
"escape-sequence": "Ê",
"description": "Latin capital letter E with circumflex"
}
},map {
"Euml": map {
"character": "Ë",
"name": "Euml",
"escape-sequence": "Ë",
"description": "Latin capital letter E with diaeresis"
}
},map {
"Igrave": map {
"character": "Ì",
"name": "Igrave",
"escape-sequence": "Ì",
"description": "Latin capital letter I with grave accent"
}
},map {
"Iacute": map {
"character": "Í",
"name": "Iacute",
"escape-sequence": "Í",
"description": "Latin capital letter I with acute accent"
}
},map {
"Icirc": map {
"character": "Î",
"name": "Icirc",
"escape-sequence": "Î",
"description": "Latin capital letter I with circumflex"
}
},map {
"Iuml": map {
"character": "Ï",
"name": "Iuml",
"escape-sequence": "Ï",
"description": "Latin capital letter I with diaeresis"
}
},map {
"ETH": map {
"character": "Ð",
"name": "ETH",
"escape-sequence": "Ð",
"description": "Latin capital letter Eth"
}
},map {
"Ntilde": map {
"character": "Ñ",
"name": "Ntilde",
"escape-sequence": "Ñ",
"description": "Latin capital letter N with tilde"
}
},map {
"Ograve": map {
"character": "Ò",
"name": "Ograve",
"escape-sequence": "Ò",
"description": "Latin capital letter O with grave accent"
}
},map {
"Oacute": map {
"character": "Ó",
"name": "Oacute",
"escape-sequence": "Ó",
"description": "Latin capital letter O with acute accent"
}
},map {
"Ocirc": map {
"character": "Ô",
"name": "Ocirc",
"escape-sequence": "Ô",
"description": "Latin capital letter O with circumflex"
}
},map {
"Otilde": map {
"character": "Õ",
"name": "Otilde",
"escape-sequence": "Õ",
"description": "Latin capital letter O with tilde"
}
},map {
"Ouml": map {
"character": "Ö",
"name": "Ouml",
"escape-sequence": "Ö",
"description": "Latin capital letter O with diaeresis"
}
},map {
"times": map {
"character": "×",
"name": "times",
"escape-sequence": "×",
"description": "multiplication sign"
}
},map {
"Oslash": map {
"character": "Ø",
"name": "Oslash",
"escape-sequence": "Ø",
"description": "Latin capital letter O with stroke (Latin capital letter O slash)"
}
},map {
"Ugrave": map {
"character": "Ù",
"name": "Ugrave",
"escape-sequence": "Ù",
"description": "Latin capital letter U with grave accent"
}
},map {
"Uacute": map {
"character": "Ú",
"name": "Uacute",
"escape-sequence": "Ú",
"description": "Latin capital letter U with acute accent"
}
},map {
"Ucirc": map {
"character": "Û",
"name": "Ucirc",
"escape-sequence": "Û",
"description": "Latin capital letter U with circumflex"
}
},map {
"Uuml": map {
"character": "Ü",
"name": "Uuml",
"escape-sequence": "Ü",
"description": "Latin capital letter U with diaeresis"
}
},map {
"Yacute": map {
"character": "Ý",
"name": "Yacute",
"escape-sequence": "Ý",
"description": "Latin capital letter Y with acute accent"
}
},map {
"THORN": map {
"character": "Þ",
"name": "THORN",
"escape-sequence": "Þ",
"description": "Latin capital letter THORN"
}
},map {
"szlig": map {
"character": "ß",
"name": "szlig",
"escape-sequence": "ß",
"description": "Latin small letter sharp s (ess-zed); see German Eszett"
}
},map {
"agrave": map {
"character": "à",
"name": "agrave",
"escape-sequence": "à",
"description": "Latin small letter a with grave accent"
}
},map {
"aacute": map {
"character": "á",
"name": "aacute",
"escape-sequence": "á",
"description": "Latin small letter a with acute accent"
}
},map {
"acirc": map {
"character": "â",
"name": "acirc",
"escape-sequence": "â",
"description": "Latin small letter a with circumflex"
}
},map {
"atilde": map {
"character": "ã",
"name": "atilde",
"escape-sequence": "ã",
"description": "Latin small letter a with tilde"
}
},map {
"auml": map {
"character": "ä",
"name": "auml",
"escape-sequence": "ä",
"description": "Latin small letter a with diaeresis"
}
},map {
"aring": map {
"character": "å",
"name": "aring",
"escape-sequence": "å",
"description": "Latin small letter a with ring above"
}
},map {
"aelig": map {
"character": "æ",
"name": "aelig",
"escape-sequence": "æ",
"description": "Latin small letter ae (Latin small ligature ae)"
}
},map {
"ccedil": map {
"character": "ç",
"name": "ccedil",
"escape-sequence": "ç",
"description": "Latin small letter c with cedilla"
}
},map {
"egrave": map {
"character": "è",
"name": "egrave",
"escape-sequence": "è",
"description": "Latin small letter e with grave accent"
}
},map {
"eacute": map {
"character": "é",
"name": "eacute",
"escape-sequence": "é",
"description": "Latin small letter e with acute accent"
}
},map {
"ecirc": map {
"character": "ê",
"name": "ecirc",
"escape-sequence": "ê",
"description": "Latin small letter e with circumflex"
}
},map {
"euml": map {
"character": "ë",
"name": "euml",
"escape-sequence": "ë",
"description": "Latin small letter e with diaeresis"
}
},map {
"igrave": map {
"character": "ì",
"name": "igrave",
"escape-sequence": "ì",
"description": "Latin small letter i with grave accent"
}
},map {
"iacute": map {
"character": "í",
"name": "iacute",
"escape-sequence": "í",
"description": "Latin small letter i with acute accent"
}
},map {
"icirc": map {
"character": "î",
"name": "icirc",
"escape-sequence": "î",
"description": "Latin small letter i with circumflex"
}
},map {
"iuml": map {
"character": "ï",
"name": "iuml",
"escape-sequence": "ï",
"description": "Latin small letter i with diaeresis"
}
},map {
"eth": map {
"character": "ð",
"name": "eth",
"escape-sequence": "ð",
"description": "Latin small letter eth"
}
},map {
"ntilde": map {
"character": "ñ",
"name": "ntilde",
"escape-sequence": "ñ",
"description": "Latin small letter n with tilde"
}
},map {
"ograve": map {
"character": "ò",
"name": "ograve",
"escape-sequence": "ò",
"description": "Latin small letter o with grave accent"
}
},map {
"oacute": map {
"character": "ó",
"name": "oacute",
"escape-sequence": "ó",
"description": "Latin small letter o with acute accent"
}
},map {
"ocirc": map {
"character": "ô",
"name": "ocirc",
"escape-sequence": "ô",
"description": "Latin small letter o with circumflex"
}
},map {
"otilde": map {
"character": "õ",
"name": "otilde",
"escape-sequence": "õ",
"description": "Latin small letter o with tilde"
}
},map {
"ouml": map {
"character": "ö",
"name": "ouml",
"escape-sequence": "ö",
"description": "Latin small letter o with diaeresis"
}
},map {
"divide": map {
"character": "÷",
"name": "divide",
"escape-sequence": "÷",
"description": "division sign (obelus)"
}
},map {
"oslash": map {
"character": "ø",
"name": "oslash",
"escape-sequence": "ø",
"description": "Latin small letter o with stroke (Latin small letter o slash)"
}
},map {
"ugrave": map {
"character": "ù",
"name": "ugrave",
"escape-sequence": "ù",
"description": "Latin small letter u with grave accent"
}
},map {
"uacute": map {
"character": "ú",
"name": "uacute",
"escape-sequence": "ú",
"description": "Latin small letter u with acute accent"
}
},map {
"ucirc": map {
"character": "û",
"name": "ucirc",
"escape-sequence": "û",
"description": "Latin small letter u with circumflex"
}
},map {
"uuml": map {
"character": "ü",
"name": "uuml",
"escape-sequence": "ü",
"description": "Latin small letter u with diaeresis"
}
},map {
"yacute": map {
"character": "ý",
"name": "yacute",
"escape-sequence": "ý",
"description": "Latin small letter y with acute accent"
}
},map {
"thorn": map {
"character": "þ",
"name": "thorn",
"escape-sequence": "þ",
"description": "Latin small letter thorn"
}
},map {
"yuml": map {
"character": "ÿ",
"name": "yuml",
"escape-sequence": "ÿ",
"description": "Latin small letter y with diaeresis"
}
},map {
"OElig": map {
"character": "Œ",
"name": "OElig",
"escape-sequence": "Œ",
"description": "Latin capital ligature oe"
}
},map {
"oelig": map {
"character": "œ",
"name": "oelig",
"escape-sequence": "œ",
"description": "Latin small ligature oe"
}
},map {
"Scaron": map {
"character": "Š",
"name": "Scaron",
"escape-sequence": "Š",
"description": "Latin capital letter s with caron"
}
},map {
"scaron": map {
"character": "š",
"name": "scaron",
"escape-sequence": "š",
"description": "Latin small letter s with caron"
}
},map {
"Yuml": map {
"character": "Ÿ",
"name": "Yuml",
"escape-sequence": "Ÿ",
"description": "Latin capital letter y with diaeresis"
}
},map {
"fnof": map {
"character": "ƒ",
"name": "fnof",
"escape-sequence": "ƒ",
"description": "Latin small letter f with hook (function, florin)"
}
},map {
"circ": map {
"character": "ˆ",
"name": "circ",
"escape-sequence": "ˆ",
"description": "modifier letter circumflex accent"
}
},map {
"tilde": map {
"character": "˜",
"name": "tilde",
"escape-sequence": "˜",
"description": "small tilde"
}
},map {
"Alpha": map {
"character": "Α",
"name": "Alpha",
"escape-sequence": "Α",
"description": "Greek capital letter Alpha"
}
},map {
"Beta": map {
"character": "Β",
"name": "Beta",
"escape-sequence": "Β",
"description": "Greek capital letter Beta"
}
},map {
"Gamma": map {
"character": "Γ",
"name": "Gamma",
"escape-sequence": "Γ",
"description": "Greek capital letter Gamma"
}
},map {
"Delta": map {
"character": "Δ",
"name": "Delta",
"escape-sequence": "Δ",
"description": "Greek capital letter Delta"
}
},map {
"Epsilon": map {
"character": "Ε",
"name": "Epsilon",
"escape-sequence": "Ε",
"description": "Greek capital letter Epsilon"
}
},map {
"Zeta": map {
"character": "Ζ",
"name": "Zeta",
"escape-sequence": "Ζ",
"description": "Greek capital letter Zeta"
}
},map {
"Eta": map {
"character": "Η",
"name": "Eta",
"escape-sequence": "Η",
"description": "Greek capital letter Eta"
}
},map {
"Theta": map {
"character": "Θ",
"name": "Theta",
"escape-sequence": "Θ",
"description": "Greek capital letter Theta"
}
},map {
"Iota": map {
"character": "Ι",
"name": "Iota",
"escape-sequence": "Ι",
"description": "Greek capital letter Iota"
}
},map {
"Kappa": map {
"character": "Κ",
"name": "Kappa",
"escape-sequence": "Κ",
"description": "Greek capital letter Kappa"
}
},map {
"Lambda": map {
"character": "Λ",
"name": "Lambda",
"escape-sequence": "Λ",
"description": "Greek capital letter Lambda"
}
},map {
"Mu": map {
"character": "Μ",
"name": "Mu",
"escape-sequence": "Μ",
"description": "Greek capital letter Mu"
}
},map {
"Nu": map {
"character": "Ν",
"name": "Nu",
"escape-sequence": "Ν",
"description": "Greek capital letter Nu"
}
},map {
"Xi": map {
"character": "Ξ",
"name": "Xi",
"escape-sequence": "Ξ",
"description": "Greek capital letter Xi"
}
},map {
"Omicron": map {
"character": "Ο",
"name": "Omicron",
"escape-sequence": "Ο",
"description": "Greek capital letter Omicron"
}
},map {
"Pi": map {
"character": "Π",
"name": "Pi",
"escape-sequence": "Π",
"description": "Greek capital letter Pi"
}
},map {
"Rho": map {
"character": "Ρ",
"name": "Rho",
"escape-sequence": "Ρ",
"description": "Greek capital letter Rho"
}
},map {
"Sigma": map {
"character": "Σ",
"name": "Sigma",
"escape-sequence": "Σ",
"description": "Greek capital letter Sigma"
}
},map {
"Tau": map {
"character": "Τ",
"name": "Tau",
"escape-sequence": "Τ",
"description": "Greek capital letter Tau"
}
},map {
"Upsilon": map {
"character": "Υ",
"name": "Upsilon",
"escape-sequence": "Υ",
"description": "Greek capital letter Upsilon"
}
},map {
"Phi": map {
"character": "Φ",
"name": "Phi",
"escape-sequence": "Φ",
"description": "Greek capital letter Phi"
}
},map {
"Chi": map {
"character": "Χ",
"name": "Chi",
"escape-sequence": "Χ",
"description": "Greek capital letter Chi"
}
},map {
"Psi": map {
"character": "Ψ",
"name": "Psi",
"escape-sequence": "Ψ",
"description": "Greek capital letter Psi"
}
},map {
"Omega": map {
"character": "Ω",
"name": "Omega",
"escape-sequence": "Ω",
"description": "Greek capital letter Omega"
}
},map {
"alpha": map {
"character": "α",
"name": "alpha",
"escape-sequence": "α",
"description": "Greek small letter alpha"
}
},map {
"beta": map {
"character": "β",
"name": "beta",
"escape-sequence": "β",
"description": "Greek small letter beta"
}
},map {
"gamma": map {
"character": "γ",
"name": "gamma",
"escape-sequence": "γ",
"description": "Greek small letter gamma"
}
},map {
"delta": map {
"character": "δ",
"name": "delta",
"escape-sequence": "δ",
"description": "Greek small letter delta"
}
},map {
"epsilon": map {
"character": "ε",
"name": "epsilon",
"escape-sequence": "ε",
"description": "Greek small letter epsilon"
}
},map {
"zeta": map {
"character": "ζ",
"name": "zeta",
"escape-sequence": "ζ",
"description": "Greek small letter zeta"
}
},map {
"eta": map {
"character": "η",
"name": "eta",
"escape-sequence": "η",
"description": "Greek small letter eta"
}
},map {
"theta": map {
"character": "θ",
"name": "theta",
"escape-sequence": "θ",
"description": "Greek small letter theta"
}
},map {
"iota": map {
"character": "ι",
"name": "iota",
"escape-sequence": "ι",
"description": "Greek small letter iota"
}
},map {
"kappa": map {
"character": "κ",
"name": "kappa",
"escape-sequence": "κ",
"description": "Greek small letter kappa"
}
},map {
"lambda": map {
"character": "λ",
"name": "lambda",
"escape-sequence": "λ",
"description": "Greek small letter lambda"
}
},map {
"mu": map {
"character": "μ",
"name": "mu",
"escape-sequence": "μ",
"description": "Greek small letter mu"
}
},map {
"nu": map {
"character": "ν",
"name": "nu",
"escape-sequence": "ν",
"description": "Greek small letter nu"
}
},map {
"xi": map {
"character": "ξ",
"name": "xi",
"escape-sequence": "ξ",
"description": "Greek small letter xi"
}
},map {
"omicron": map {
"character": "ο",
"name": "omicron",
"escape-sequence": "ο",
"description": "Greek small letter omicron"
}
},map {
"pi": map {
"character": "π",
"name": "pi",
"escape-sequence": "π",
"description": "Greek small letter pi"
}
},map {
"rho": map {
"character": "ρ",
"name": "rho",
"escape-sequence": "ρ",
"description": "Greek small letter rho"
}
},map {
"sigmaf": map {
"character": "ς",
"name": "sigmaf",
"escape-sequence": "ς",
"description": "Greek small letter final sigma"
}
},map {
"sigma": map {
"character": "σ",
"name": "sigma",
"escape-sequence": "σ",
"description": "Greek small letter sigma"
}
},map {
"tau": map {
"character": "τ",
"name": "tau",
"escape-sequence": "τ",
"description": "Greek small letter tau"
}
},map {
"upsilon": map {
"character": "υ",
"name": "upsilon",
"escape-sequence": "υ",
"description": "Greek small letter upsilon"
}
},map {
"phi": map {
"character": "φ",
"name": "phi",
"escape-sequence": "φ",
"description": "Greek small letter phi"
}
},map {
"chi": map {
"character": "χ",
"name": "chi",
"escape-sequence": "χ",
"description": "Greek small letter chi"
}
},map {
"psi": map {
"character": "ψ",
"name": "psi",
"escape-sequence": "ψ",
"description": "Greek small letter psi"
}
},map {
"omega": map {
"character": "ω",
"name": "omega",
"escape-sequence": "ω",
"description": "Greek small letter omega"
}
},map {
"thetasym": map {
"character": "ϑ",
"name": "thetasym",
"escape-sequence": "ϑ",
"description": "Greek theta symbol"
}
},map {
"upsih": map {
"character": "ϒ",
"name": "upsih",
"escape-sequence": "ϒ",
"description": "Greek Upsilon with hook symbol"
}
},map {
"piv": map {
"character": "ϖ",
"name": "piv",
"escape-sequence": "ϖ",
"description": "Greek pi symbol"
}
},map {
"ensp": map {
"character": " ",
"name": "ensp",
"escape-sequence": " ",
"description": "en space"
}
},map {
"emsp": map {
"character": " ",
"name": "emsp",
"escape-sequence": " ",
"description": "em space"
}
},map {
"thinsp": map {
"character": " ",
"name": "thinsp",
"escape-sequence": " ",
"description": "thin space"
}
},map {
"zwnj": map {
"character": "",
"name": "zwnj",
"escape-sequence": "‌",
"description": "zero-width non-joiner"
}
},map {
"zwj": map {
"character": "",
"name": "zwj",
"escape-sequence": "‍",
"description": "zero-width joiner"
}
},map {
"lrm": map {
"character": "",
"name": "lrm",
"escape-sequence": "‎",
"description": "left-to-right mark"
}
},map {
"rlm": map {
"character": "",
"name": "rlm",
"escape-sequence": "‏",
"description": "right-to-left mark"
}
},map {
"ndash": map {
"character": "–",
"name": "ndash",
"escape-sequence": "–",
"description": "en dash"
}
},map {
"mdash": map {
"character": "—",
"name": "mdash",
"escape-sequence": "—",
"description": "em dash"
}
},map {
"lsquo": map {
"character": "‘",
"name": "lsquo",
"escape-sequence": "‘",
"description": "left single quotation mark"
}
},map {
"rsquo": map {
"character": "’",
"name": "rsquo",
"escape-sequence": "’",
"description": "right single quotation mark"
}
},map {
"sbquo": map {
"character": "‚",
"name": "sbquo",
"escape-sequence": "‚",
"description": "single low-9 quotation mark"
}
},map {
"ldquo": map {
"character": "“",
"name": "ldquo",
"escape-sequence": "“",
"description": "left double quotation mark"
}
},map {
"rdquo": map {
"character": "”",
"name": "rdquo",
"escape-sequence": "”",
"description": "right double quotation mark"
}
},map {
"bdquo": map {
"character": "„",
"name": "bdquo",
"escape-sequence": "„",
"description": "double low-9 quotation mark"
}
},map {
"dagger": map {
"character": "†",
"name": "dagger",
"escape-sequence": "†",
"description": "dagger, obelisk"
}
},map {
"Dagger": map {
"character": "‡",
"name": "Dagger",
"escape-sequence": "‡",
"description": "double dagger, double obelisk"
}
},map {
"bull": map {
"character": "•",
"name": "bull",
"escape-sequence": "•",
"description": "bullet (black small circle)"
}
},map {
"hellip": map {
"character": "…",
"name": "hellip",
"escape-sequence": "…",
"description": "horizontal ellipsis (three dot leader)"
}
},map {
"permil": map {
"character": "‰",
"name": "permil",
"escape-sequence": "‰",
"description": "per mille sign"
}
},map {
"prime": map {
"character": "′",
"name": "prime",
"escape-sequence": "′",
"description": "prime (minutes, feet)"
}
},map {
"Prime": map {
"character": "″",
"name": "Prime",
"escape-sequence": "″",
"description": "double prime (seconds, inches)"
}
},map {
"lsaquo": map {
"character": "‹",
"name": "lsaquo",
"escape-sequence": "‹",
"description": "single left-pointing angle quotation mark"
}
},map {
"rsaquo": map {
"character": "›",
"name": "rsaquo",
"escape-sequence": "›",
"description": "single right-pointing angle quotation mark"
}
},map {
"oline": map {
"character": "‾",
"name": "oline",
"escape-sequence": "‾",
"description": "overline (spacing overscore)"
}
},map {
"frasl": map {
"character": "⁄",
"name": "frasl",
"escape-sequence": "⁄",
"description": "fraction slash (solidus)"
}
},map {
"euro": map {
"character": "€",
"name": "euro",
"escape-sequence": "€",
"description": "euro sign"
}
},map {
"image": map {
"character": "ℑ",
"name": "image",
"escape-sequence": "ℑ",
"description": "black-letter capital I (imaginary part)"
}
},map {
"weierp": map {
"character": "℘",
"name": "weierp",
"escape-sequence": "℘",
"description": "script capital P (power set, Weierstrass p)"
}
},map {
"real": map {
"character": "ℜ",
"name": "real",
"escape-sequence": "ℜ",
"description": "black-letter capital R (real part symbol)"
}
},map {
"trade": map {
"character": "™",
"name": "trade",
"escape-sequence": "™",
"description": "trademark symbol"
}
},map {
"alefsym": map {
"character": "ℵ",
"name": "alefsym",
"escape-sequence": "ℵ",
"description": "alef symbol (first transfinite cardinal)"
}
},map {
"larr": map {
"character": "←",
"name": "larr",
"escape-sequence": "←",
"description": "leftwards arrow"
}
},map {
"uarr": map {
"character": "↑",
"name": "uarr",
"escape-sequence": "↑",
"description": "upwards arrow"
}
},map {
"rarr": map {
"character": "→",
"name": "rarr",
"escape-sequence": "→",
"description": "rightwards arrow"
}
},map {
"darr": map {
"character": "↓",
"name": "darr",
"escape-sequence": "↓",
"description": "downwards arrow"
}
},map {
"harr": map {
"character": "↔",
"name": "harr",
"escape-sequence": "↔",
"description": "left right arrow"
}
},map {
"crarr": map {
"character": "↵",
"name": "crarr",
"escape-sequence": "↵",
"description": "downwards arrow with corner leftwards (carriage return)"
}
},map {
"lArr": map {
"character": "⇐",
"name": "lArr",
"escape-sequence": "⇐",
"description": "leftwards double arrow"
}
},map {
"uArr": map {
"character": "⇑",
"name": "uArr",
"escape-sequence": "⇑",
"description": "upwards double arrow"
}
},map {
"rArr": map {
"character": "⇒",
"name": "rArr",
"escape-sequence": "⇒",
"description": "rightwards double arrow"
}
},map {
"dArr": map {
"character": "⇓",
"name": "dArr",
"escape-sequence": "⇓",
"description": "downwards double arrow"
}
},map {
"hArr": map {
"character": "⇔",
"name": "hArr",
"escape-sequence": "⇔",
"description": "left right double arrow"
}
},map {
"forall": map {
"character": "∀",
"name": "forall",
"escape-sequence": "∀",
"description": "for all"
}
},map {
"part": map {
"character": "∂",
"name": "part",
"escape-sequence": "∂",
"description": "partial differential"
}
},map {
"exist": map {
"character": "∃",
"name": "exist",
"escape-sequence": "∃",
"description": "there exists"
}
},map {
"empty": map {
"character": "∅",
"name": "empty",
"escape-sequence": "∅",
"description": "empty set (null set); see also U+8960, ⌀"
}
},map {
"nabla": map {
"character": "∇",
"name": "nabla",
"escape-sequence": "∇",
"description": "del or nabla (vector differential operator)"
}
},map {
"isin": map {
"character": "∈",
"name": "isin",
"escape-sequence": "∈",
"description": "element of"
}
},map {
"notin": map {
"character": "∉",
"name": "notin",
"escape-sequence": "∉",
"description": "not an element of"
}
},map {
"ni": map {
"character": "∋",
"name": "ni",
"escape-sequence": "∋",
"description": "contains as member"
}
},map {
"prod": map {
"character": "∏",
"name": "prod",
"escape-sequence": "∏",
"description": "n-ary product (product sign)"
}
},map {
"sum": map {
"character": "∑",
"name": "sum",
"escape-sequence": "∑",
"description": "n-ary summation"
}
},map {
"minus": map {
"character": "−",
"name": "minus",
"escape-sequence": "−",
"description": "minus sign"
}
},map {
"lowast": map {
"character": "∗",
"name": "lowast",
"escape-sequence": "∗",
"description": "asterisk operator"
}
},map {
"radic": map {
"character": "√",
"name": "radic",
"escape-sequence": "√",
"description": "square root (radical sign)"
}
},map {
"prop": map {
"character": "∝",
"name": "prop",
"escape-sequence": "∝",
"description": "proportional to"
}
},map {
"infin": map {
"character": "∞",
"name": "infin",
"escape-sequence": "∞",
"description": "infinity"
}
},map {
"ang": map {
"character": "∠",
"name": "ang",
"escape-sequence": "∠",
"description": "angle"
}
},map {
"and": map {
"character": "∧",
"name": "and",
"escape-sequence": "∧",
"description": "logical and (wedge)"
}
},map {
"or": map {
"character": "∨",
"name": "or",
"escape-sequence": "∨",
"description": "logical or (vee)"
}
},map {
"cap": map {
"character": "∩",
"name": "cap",
"escape-sequence": "∩",
"description": "intersection (cap)"
}
},map {
"cup": map {
"character": "∪",
"name": "cup",
"escape-sequence": "∪",
"description": "union (cup)"
}
},map {
"int": map {
"character": "∫",
"name": "int",
"escape-sequence": "∫",
"description": "integral"
}
},map {
"there4": map {
"character": "∴",
"name": "there4",
"escape-sequence": "∴",
"description": "therefore sign"
}
},map {
"sim": map {
"character": "∼",
"name": "sim",
"escape-sequence": "∼",
"description": "tilde operator (varies with, similar to)"
}
},map {
"cong": map {
"character": "≅",
"name": "cong",
"escape-sequence": "≅",
"description": "congruent to"
}
},map {
"asymp": map {
"character": "≈",
"name": "asymp",
"escape-sequence": "≈",
"description": "almost equal to (asymptotic to)"
}
},map {
"ne": map {
"character": "≠",
"name": "ne",
"escape-sequence": "≠",
"description": "not equal to"
}
},map {
"equiv": map {
"character": "≡",
"name": "equiv",
"escape-sequence": "≡",
"description": "identical to; sometimes used for 'equivalent to'"
}
},map {
"le": map {
"character": "≤",
"name": "le",
"escape-sequence": "≤",
"description": "less-than or equal to"
}
},map {
"ge": map {
"character": "≥",
"name": "ge",
"escape-sequence": "≥",
"description": "greater-than or equal to"
}
},map {
"sub": map {
"character": "⊂",
"name": "sub",
"escape-sequence": "⊂",
"description": "subset of"
}
},map {
"sup": map {
"character": "⊃",
"name": "sup",
"escape-sequence": "⊃",
"description": "superset of"
}
},map {
"nsub": map {
"character": "⊄",
"name": "nsub",
"escape-sequence": "⊄",
"description": "not a subset of"
}
},map {
"sube": map {
"character": "⊆",
"name": "sube",
"escape-sequence": "⊆",
"description": "subset of or equal to"
}
},map {
"supe": map {
"character": "⊇",
"name": "supe",
"escape-sequence": "⊇",
"description": "superset of or equal to"
}
},map {
"oplus": map {
"character": "⊕",
"name": "oplus",
"escape-sequence": "⊕",
"description": "circled plus (direct sum)"
}
},map {
"otimes": map {
"character": "⊗",
"name": "otimes",
"escape-sequence": "⊗",
"description": "circled times (vector product)"
}
},map {
"perp": map {
"character": "⊥",
"name": "perp",
"escape-sequence": "⊥",
"description": "up tack (orthogonal to, perpendicular)"
}
},map {
"sdot": map {
"character": "⋅",
"name": "sdot",
"escape-sequence": "⋅",
"description": "dot operator"
}
},map {
"lceil": map {
"character": "⌈",
"name": "lceil",
"escape-sequence": "⌈",
"description": "left ceiling (APL upstile)"
}
},map {
"rceil": map {
"character": "⌉",
"name": "rceil",
"escape-sequence": "⌉",
"description": "right ceiling"
}
},map {
"lfloor": map {
"character": "⌊",
"name": "lfloor",
"escape-sequence": "⌊",
"description": "left floor (APL downstile)"
}
},map {
"rfloor": map {
"character": "⌋",
"name": "rfloor",
"escape-sequence": "⌋",
"description": "right floor"
}
},map {
"lang": map {
"character": "〈",
"name": "lang",
"escape-sequence": "〈",
"description": "left-pointing angle bracket (bra)"
}
},map {
"rang": map {
"character": "〉",
"name": "rang",
"escape-sequence": "〉",
"description": "right-pointing angle bracket (ket)"
}
},map {
"loz": map {
"character": "◊",
"name": "loz",
"escape-sequence": "◊",
"description": "lozenge"
}
},map {
"spades": map {
"character": "♠",
"name": "spades",
"escape-sequence": "♠",
"description": "black spade suit"
}
},map {
"clubs": map {
"character": "♣",
"name": "clubs",
"escape-sequence": "♣",
"description": "black club suit (shamrock)"
}
},map {
"hearts": map {
"character": "♥",
"name": "hearts",
"escape-sequence": "♥",
"description": "black heart suit (valentine)"
}
},map {
"diams": map {
"character": "♦",
"name": "diams",
"escape-sequence": "♦",
"description": "black diamond suit"
}
}
);
(:~
: Convert HTML entities in strings to XML-compatible characters. Unrecognized
: entities are returned unchanged.
:
: @param A string of characters that may contain HTML entities
: @return Modified string with XML-compatible characters
:)
declare function entities:name-to-character($string as xs:string) {
let $pattern := "&([a-z]+);"
let $analysis := analyze-string($string, $pattern)
return
string-join(
for $elem in $analysis/*
return
if ($elem instance of element(fn:non-match)) then
$elem/string()
else
let $name := $elem/fn:group
let $replacement := $entities:entities?($name)?character
return
if (exists($replacement)) then
$replacement
else
$elem/string()
)
};
以上是关于text 查找HTML字符实体并将引用转换为XQuery中与XML兼容的字符的主要内容,如果未能解决你的问题,请参考以下文章
javascript 怎么将html字符实体 转换成 正常显示的字符
在 PHP 字符串中查找 youtube 链接并将其转换为嵌入代码?