| 23 |
35 |
# |
\#
|
|
#
|
US-ASCII |
|
| 25 |
37 |
% |
\%
|
|
%
|
US-ASCII |
|
| 26 |
38 |
& |
\&
|
|
&
|
US-ASCII |
|
| 7E |
126 |
~ |
\~{}
|
|
~
|
US-ASCII |
|
| A1 |
161 |
¡ |
!`
|
|
¡
|
ISO-8859-1 |
|
| A7 |
167 |
§ |
\S{}
|
|
§
|
ISO-8859-1 |
|
| A8 |
168 |
¨ |
\"{}
|
|
¨
|
ISO-8859-1 |
|
| A9 |
169 |
© |
\copyright{}
|
|
©
|
ISO-8859-1 |
|
| AD |
173 |
|
\-
|
|
­
|
ISO-8859-1 |
|
| AF |
175 |
¯ |
\={}
|
|
¯
|
ISO-8859-1 |
|
| B0 |
176 |
° |
$^\circ$
|
$^{\circ}$
|
°
|
ISO-8859-1 |
|
| B1 |
177 |
± |
$\pm$
|
|
±
|
ISO-8859-1 |
|
| B2 |
178 |
² |
$^2$
|
$^{2}$
|
²
|
ISO-8859-1 |
|
| B3 |
179 |
³ |
$^3$
|
$^{3}$
|
³
|
ISO-8859-1 |
|
| B4 |
180 |
´ |
\'{}
|
|
´
|
ISO-8859-1 |
|
| B5 |
181 |
µ |
$\mu$
|
|
µ
|
ISO-8859-1 |
also mapped as U+03BC |
| B6 |
182 |
¶ |
\P{}
|
|
¶
|
ISO-8859-1 |
|
| B7 |
183 |
· |
$\cdot$
|
|
·
|
ISO-8859-1 |
also mapped as U+22C5 |
| B8 |
184 |
¸ |
\c{ }
|
|
¸
|
ISO-8859-1 |
|
| B9 |
185 |
¹ |
$^1$
|
$^{1}$
|
¹
|
ISO-8859-1 |
|
| BF |
191 |
¿ |
?`
|
|
¿
|
ISO-8859-1 |
|
| C0 |
192 |
À |
\`A
|
\`{A}
|
À
|
ISO-8859-1 |
|
| C1 |
193 |
Á |
\'A
|
\'{A}
|
Á
|
ISO-8859-1 |
|
| C2 |
194 |
 |
\^A
|
\^{A}
|
Â
|
ISO-8859-1 |
|
| C3 |
195 |
à |
\~A
|
\~{A}
|
Ã
|
ISO-8859-1 |
|
| C4 |
196 |
Ä |
\"A
|
\"{A}
|
Ä
|
ISO-8859-1 |
|
| C5 |
197 |
Å |
\r{A}
|
|
Å
|
ISO-8859-1 |
|
| C6 |
198 |
Æ |
{\AE}
|
\AE{}
|
Æ
|
ISO-8859-1 |
|
| C7 |
199 |
Ç |
\c{C}
|
|
Ç
|
ISO-8859-1 |
|
| C8 |
200 |
È |
\`E
|
\`{E}
|
È
|
ISO-8859-1 |
|
| C9 |
201 |
É |
\'E
|
\'{E}
|
É
|
ISO-8859-1 |
|
| CA |
202 |
Ê |
\^E
|
\^{E}
|
Ê
|
ISO-8859-1 |
|
| CB |
203 |
Ë |
\"E
|
\"{E}
|
Ë
|
ISO-8859-1 |
|
| CC |
204 |
Ì |
\`I
|
\`{I}
|
Ì
|
ISO-8859-1 |
|
| CD |
205 |
Í |
\'I
|
\'{I}
|
Í
|
ISO-8859-1 |
|
| CE |
206 |
Î |
\^I
|
\^{I}
|
Î
|
ISO-8859-1 |
|
| CF |
207 |
Ï |
\"I
|
\"{I}
|
Ï
|
ISO-8859-1 |
|
| D0 |
208 |
Ð |
{\DH}
|
\DH{}
|
Ð
|
ISO-8859-1 |
|
| D1 |
209 |
Ñ |
\~N
|
\~{N}
|
Ñ
|
ISO-8859-1 |
|
| D2 |
210 |
Ò |
\`O
|
\`{O}
|
Ò
|
ISO-8859-1 |
|
| D3 |
211 |
Ó |
\'O
|
\'{O}
|
Ó
|
ISO-8859-1 |
|
| D4 |
212 |
Ô |
\^O
|
\^{O}
|
Ô
|
ISO-8859-1 |
|
| D5 |
213 |
Õ |
\~O
|
\~{O}
|
Õ
|
ISO-8859-1 |
|
| D6 |
214 |
Ö |
\"O
|
\"{O}
|
Ö
|
ISO-8859-1 |
|
| D7 |
215 |
× |
$\times$
|
|
×
|
ISO-8859-1 |
|
| D8 |
216 |
Ø |
{\O}
|
\O{}
|
Ø
|
ISO-8859-1 |
|
| D9 |
217 |
Ù |
\`U
|
\`{U}
|
Ù
|
ISO-8859-1 |
|
| DA |
218 |
Ú |
\'U
|
\'{U}
|
Ú
|
ISO-8859-1 |
|
| DB |
219 |
Û |
\^U
|
\^{U}
|
Û
|
ISO-8859-1 |
|
| DC |
220 |
Ü |
\"U
|
\"{U}
|
Ü
|
ISO-8859-1 |
|
| DD |
221 |
Ý |
\'Y
|
\'{Y}
|
Ý
|
ISO-8859-1 |
|
| DE |
222 |
Þ |
{\TH}
|
\TH{}
|
Þ
|
ISO-8859-1 |
|
| DF |
223 |
ß |
{\ss}
|
\ss{}
|
ß
|
ISO-8859-1 |
|
| E0 |
224 |
à |
\`a
|
\`{a}
|
à
|
ISO-8859-1 |
|
| E1 |
225 |
á |
\'a
|
\'{a}
|
á
|
ISO-8859-1 |
|
| E2 |
226 |
â |
\^a
|
\^{a}
|
â
|
ISO-8859-1 |
|
| E3 |
227 |
ã |
\~a
|
\~{a}
|
ã
|
ISO-8859-1 |
|
| E4 |
228 |
ä |
\"a
|
\"{a}
|
ä
|
ISO-8859-1 |
|
| E5 |
229 |
å |
\r{a}
|
|
å
|
ISO-8859-1 |
|
| E6 |
230 |
æ |
{\ae}
|
\ae{}
|
æ
|
ISO-8859-1 |
|
| E7 |
231 |
ç |
\c{c}
|
|
ç
|
ISO-8859-1 |
|
| E8 |
232 |
è |
\`e
|
\`{e}
|
è
|
ISO-8859-1 |
|
| E9 |
233 |
é |
\'e
|
\'{e}
|
é
|
ISO-8859-1 |
|
| EA |
234 |
ê |
\^e
|
\^{e}
|
ê
|
ISO-8859-1 |
|
| EB |
235 |
ë |
\"e
|
\"{e}
|
ë
|
ISO-8859-1 |
|
| EC |
236 |
ì |
{\`\i}
|
\`{\i}
\`\i{}
|
ì
|
ISO-8859-1 |
|
| ED |
237 |
í |
{\'\i}
|
\'{\i}
\'\i{}
|
í
|
ISO-8859-1 |
|
| EE |
238 |
î |
{\^\i}
|
\^{\i}
\^\i{}
|
î
|
ISO-8859-1 |
|
| EF |
239 |
ï |
{\"\i}
|
\"{\i}
\"\i{}
|
ï
|
ISO-8859-1 |
|
| F0 |
240 |
ð |
{\dh}
|
\dh{}
|
ð
|
ISO-8859-1 |
|
| F1 |
241 |
ñ |
\~n
|
\~{n}
|
ñ
|
ISO-8859-1 |
|
| F2 |
242 |
ò |
\`o
|
\`{o}
|
ò
|
ISO-8859-1 |
|
| F3 |
243 |
ó |
\'o
|
\'{o}
|
ó
|
ISO-8859-1 |
|
| F4 |
244 |
ô |
\^o
|
\^{o}
|
ô
|
ISO-8859-1 |
|
| F5 |
245 |
õ |
\~o
|
\~{o}
|
õ
|
ISO-8859-1 |
|
| F6 |
246 |
ö |
\"o
|
\"{o}
|
ö
|
ISO-8859-1 |
|
| F7 |
247 |
÷ |
$\div$
|
|
÷
|
ISO-8859-1 |
|
| F8 |
248 |
ø |
{\o}
|
\o{}
|
ø
|
ISO-8859-1 |
|
| F9 |
249 |
ù |
\`u
|
\`{u}
|
ù
|
ISO-8859-1 |
|
| FA |
250 |
ú |
\'u
|
\'{u}
|
ú
|
ISO-8859-1 |
|
| FB |
251 |
û |
\^u
|
\^{u}
|
û
|
ISO-8859-1 |
|
| FC |
252 |
ü |
\"u
|
\"{u}
|
ü
|
ISO-8859-1 |
|
| FD |
253 |
ý |
\'y
|
\'{y}
|
ý
|
ISO-8859-1 |
|
| FE |
254 |
þ |
{\th}
|
\th{}
|
þ
|
ISO-8859-1 |
|
| FF |
255 |
ÿ |
\"y
|
\"{y}
|
ÿ
|
ISO-8859-1 |
|
| 100 |
256 |
Ā |
\=A
|
\={A}
|
Ā
|
|
|
| 101 |
257 |
ā |
\=a
|
\={a}
|
ā
|
|
|
| 102 |
258 |
Ă |
\u{A}
|
|
Ă
|
|
|
| 103 |
259 |
ă |
\u{a}
|
|
ă
|
|
|
| 106 |
262 |
Ć |
\'C
|
\'{C}
|
Ć
|
|
|
| 107 |
263 |
ć |
\'c
|
\'{c}
|
ć
|
|
|
| 108 |
264 |
Ĉ |
\^C
|
\^{C}
|
Ĉ
|
|
|
| 109 |
265 |
ĉ |
\^c
|
\^{c}
|
ĉ
|
|
|
| 10A |
266 |
Ċ |
\.C
|
\.{C}
|
Ċ
|
|
|
| 10B |
267 |
ċ |
\.c
|
\.{c}
|
ċ
|
|
|
| 10C |
268 |
Č |
\v{C}
|
|
Č
|
|
|
| 10D |
269 |
č |
\v{c}
|
|
č
|
|
|
| 10E |
270 |
Ď |
\v{D}
|
|
Ď
|
|
|
| 10F |
271 |
ď |
\v{d}
|
|
ď
|
|
|
| 110 |
272 |
Đ |
{\DJ}
|
\DJ{}
|
Đ
|
|
|
| 111 |
273 |
đ |
{\dj}
|
\dj{}
|
đ
|
|
|
| 112 |
274 |
Ē |
\=E
|
\={E}
|
Ē
|
|
|
| 113 |
275 |
ē |
\=e
|
\={e}
|
ē
|
|
|
| 114 |
276 |
Ĕ |
\u{E}
|
|
Ĕ
|
|
|
| 115 |
277 |
ĕ |
\u{e}
|
|
ĕ
|
|
|
| 116 |
278 |
Ė |
\.E
|
\.{E}
|
Ė
|
|
|
| 117 |
279 |
ė |
\.e
|
\.{e}
|
ė
|
|
|
| 11A |
282 |
Ě |
\v{E}
|
|
Ě
|
|
|
| 11B |
283 |
ě |
\v{e}
|
|
ě
|
|
|
| 11C |
284 |
Ĝ |
\^G
|
\^{G}
|
Ĝ
|
|
|
| 11D |
285 |
ĝ |
\^g
|
\^{g}
|
ĝ
|
|
|
| 11E |
286 |
Ğ |
\u{G}
|
|
Ğ
|
|
|
| 11F |
287 |
ğ |
\u{g}
|
|
ğ
|
|
|
| 120 |
288 |
Ġ |
\.G
|
\.{G}
|
Ġ
|
|
|
| 121 |
289 |
ġ |
\.g
|
\.{g}
|
ġ
|
|
|
| 122 |
290 |
Ģ |
\c{G}
|
|
Ģ
|
|
|
| 123 |
291 |
ģ |
\c{g}
|
|
ģ
|
|
|
| 124 |
292 |
Ĥ |
\^H
|
\^{H}
|
Ĥ
|
|
|
| 125 |
293 |
ĥ |
\^h
|
\^{h}
|
ĥ
|
|
|
| 131 |
305 |
ı |
{\i}
|
\i{}
|
ı
|
|
|
| 13D |
317 |
Ľ |
\v{L}
|
|
Ľ
|
|
|
| 13E |
318 |
ľ |
\v{l}
|
|
ľ
|
|
|
| 141 |
321 |
Ł |
{\L}
|
\L{}
|
Ł
|
|
|
| 142 |
322 |
ł |
{\l}
|
\l{}
|
ł
|
|
|
| 147 |
327 |
Ň |
\v{N}
|
|
Ň
|
|
|
| 148 |
328 |
ň |
\v{n}
|
|
ň
|
|
|
| 150 |
336 |
Ő |
\H{O}
|
|
Ő
|
|
|
| 151 |
337 |
ő |
\H{o}
|
|
ő
|
|
|
| 152 |
338 |
Œ |
{\OE}
|
\OE{}
|
Œ
|
|
|
| 153 |
339 |
œ |
{\oe}
|
\oe{}
|
œ
|
|
|
| 158 |
344 |
Ř |
\v{R}
|
|
Ř
|
|
|
| 159 |
345 |
ř |
\v{r}
|
|
ř
|
|
|
| 160 |
352 |
Š |
\v{S}
|
|
Š
|
|
|
| 161 |
353 |
š |
\v{s}
|
|
š
|
|
|
| 164 |
356 |
Ť |
\v{T}
|
|
Ť
|
|
|
| 165 |
357 |
ť |
\v{t}
|
|
ť
|
|
|
| 170 |
368 |
Ű |
\H{U}
|
|
Ű
|
|
|
| 171 |
369 |
ű |
\H{u}
|
|
ű
|
|
|
| 1C4 |
452 |
DŽ |
D\v{Z}
|
|
DŽ
|
|
|
| 1C5 |
453 |
Dž |
D\v{z}
|
|
Dž
|
|
|
| 1C6 |
454 |
dž |
d\v{z}
|
|
dž
|
|
|
| 17D |
381 |
Ž |
\v{Z}
|
|
Ž
|
|
must be substituted after DŽ, because only after substituting all "DŽ" occurrences does it make sense to substitute "Ž". |
| 17E |
382 |
ž |
\v{z}
|
|
ž
|
|
must be substituted after Dž and dž, because only after substituting all "Dž" and "dž" occurrences does it make sense
to substitute "ž".
|
| 1CD |
461 |
Ǎ |
\v{A}
|
|
Ǎ
|
|
|
| 1CE |
462 |
ǎ |
\v{a}
|
|
ǎ
|
|
|
| 1CF |
463 |
Ǐ |
\v{I}
|
|
Ǐ
|
|
|
| 1D0 |
464 |
ǐ |
{\v\i}
|
\v{\i}
\v\i{}
|
ǐ
|
|
|
| 1D1 |
465 |
Ǒ |
\v{O}
|
|
Ǒ
|
|
|
| 1D2 |
466 |
ǒ |
\v{o}
|
|
ǒ
|
|
|
| 1D3 |
467 |
Ǔ |
\v{U}
|
|
Ǔ
|
|
|
| 1D4 |
468 |
ǔ |
\v{u}
|
|
ǔ
|
|
|
| 1E6 |
486 |
Ǧ |
\v{G}
|
|
Ǧ
|
|
|
| 1E7 |
487 |
ǧ |
\v{g}
|
|
ǧ
|
|
|
| 1E8 |
488 |
Ǩ |
\v{K}
|
|
Ǩ
|
|
|
| 1E9 |
489 |
ǩ |
\v{k}
|
|
ǩ
|
|
|
| 21E |
542 |
Ȟ |
\v{H}
|
|
Ȟ
|
|
|
| 21F |
543 |
ȟ |
\v{h}
|
|
ȟ
|
|
|
| 393 |
915 |
Γ |
$\Gamma$
|
|
Γ
|
|
|
| 394 |
916 |
Δ |
$\Delta$
|
|
Δ
|
|
|
| 398 |
920 |
Θ |
$\Theta$
|
|
Θ
|
|
|
| 39B |
923 |
Λ |
$\Lambda$
|
|
Λ
|
|
|
| 39E |
926 |
Ξ |
$\Xi$
|
|
Ξ
|
|
|
| 3A0 |
928 |
Π |
$\Pi$
|
|
Π
|
|
|
| 3A3 |
931 |
Σ |
$\Sigma$
|
|
Σ
|
|
|
| 3A5 |
933 |
Υ |
$\Upsilon$
|
|
Υ
|
|
|
| 3A6 |
934 |
Φ |
$\Phi$
|
|
Φ
|
|
|
| 3A8 |
936 |
Ψ |
$\Psi$
|
|
Ψ
|
|
|
| 3A9 |
937 |
Ω |
$\Omega$
|
|
Ω
|
|
|
| 3B1 |
945 |
α |
$\alpha$
|
|
α
|
|
|
| 3B2 |
946 |
β |
$\beta$
|
|
β
|
|
|
| 3B3 |
947 |
γ |
$\gamma$
|
|
γ
|
|
|
| 3B4 |
948 |
δ |
$\delta$
|
|
δ
|
|
|
| 3F5 |
1013 |
ϵ |
$\epsilon$
|
|
ϵ
|
|
|
| 3B5 |
949 |
ε |
$\varepsilon$
|
|
ε
|
|
|
| 3B6 |
950 |
ζ |
$\zeta$
|
|
ζ
|
|
|
| 3B7 |
951 |
η |
$\eta$
|
|
η
|
|
|
| 3B8 |
952 |
θ |
$\theta$
|
|
θ
|
|
|
| 3D1 |
977 |
ϑ |
$\vartheta$
|
|
ϑ
|
|
|
| 3B9 |
953 |
ι |
$\iota$
|
|
ι
|
|
|
| 3BA |
954 |
κ |
$\kappa$
|
|
κ
|
|
|
| 3BB |
955 |
λ |
$\lambda$
|
|
λ
|
|
|
| 3BC |
956 |
μ |
$\mu$
|
|
μ
|
|
also mapped as U+00B5 |
| 3BD |
957 |
ν |
$\nu$
|
|
ν
|
|
|
| 3BE |
958 |
ξ |
$\xi$
|
|
ξ
|
|
|
| 3C0 |
960 |
π |
$\pi$
|
|
π
|
|
|
| 3D6 |
982 |
ϖ |
$\varpi$
|
|
ϖ
|
|
|
| 3C1 |
961 |
ρ |
$\rho$
|
|
ρ
|
|
|
| 3F1 |
1009 |
ϱ |
$\varrho$
|
|
ϱ
|
|
|
| 3C3 |
963 |
σ |
$\sigma$
|
|
σ
|
|
|
| 3C2 |
962 |
ς |
$\varsigma$
|
|
ς
|
|
|
| 3C4 |
964 |
τ |
$\tau$
|
|
τ
|
|
|
| 3C5 |
965 |
υ |
$\upsilon$
|
|
υ
|
|
|
| 3D5 |
981 |
ϕ |
$\phi$
|
|
ϕ
|
|
|
| 3C6 |
966 |
φ |
$\varphi$
|
|
φ
|
|
|
| 3C7 |
967 |
χ |
$\chi$
|
|
χ
|
|
|
| 3C8 |
968 |
ψ |
$\psi$
|
|
ψ
|
|
|
| 3C9 |
969 |
ω |
$\omega$
|
|
ω
|
|
|
| 2202 |
8706 |
∂ |
$\partial$
|
|
∂
|
|
|
| 2213 |
8723 |
∓ |
$\mp$
|
|
∓
|
|
|
| 2214 |
8724 |
∔ |
$\dotplus$
|
|
∔
|
|
|
| 2217 |
8727 |
∗ |
$\ast$
|
|
∗
|
|
|
| 2218 |
8728 |
∘ |
$\circ$
|
|
∘
|
|
|
| 2219 |
8729 |
∙ |
$\bullet$
|
|
∙
|
|
|
| 2227 |
8743 |
∧ |
$\wedge$
|
|
∧
|
|
|
| 2228 |
8744 |
∨ |
$\vee$
|
|
∨
|
|
|
| 2229 |
8745 |
∩ |
$\cap$
|
|
∩
|
|
|
| 222A |
8746 |
∪ |
$\cup$
|
|
∪
|
|
|
| 228E |
8846 |
⊎ |
$\uplus$
|
|
⊎
|
|
|
| 2293 |
8851 |
⊓ |
$\sqcap$
|
|
⊓
|
|
|
| 2294 |
8852 |
⊔ |
$\sqcup$
|
|
⊔
|
|
|
| 2295 |
8853 |
⊕ |
$\oplus$
|
|
⊕
|
|
|
| 2296 |
8854 |
⊖ |
$\ominus$
|
|
⊖
|
|
|
| 2297 |
8855 |
⊗ |
$\otimes$
|
|
⊗
|
|
|
| 2298 |
8856 |
⊘ |
$\oslash$
|
|
⊘
|
|
|
| 2299 |
8857 |
⊙ |
$\odot$
|
|
⊙
|
|
|
| 22C5 |
8901 |
⋅ |
$\cdot$
|
$\centerdot$
|
⋅
|
|
also mapped as U+00B7 |
| 22C6 |
8902 |
⋆ |
$\star$
|
|
⋆
|
|
|
| 2014 |
8212 |
— |
---
|
|
—
|
|
must be substituted before –, because – ('--') is a literal substring of '---'. |
| 2013 |
8211 |
– |
--
|
|
–
|
|
must be substituted after —, because only after substituting all '---' occurrences does it make sense to substitute
'--'.
|
| 201C |
8220 |
“ |
``
|
|
“
|
|
must be substituted before ‘, because ‘ ('`') is a literal substring of '``'. |
| 201D |
8221 |
” |
''
|
|
”
|
|
must be substituted before ’, because ’ ("'") is a literal substring of "''". |
| 2018 |
8216 |
‘ |
`
|
|
‘
|
|
must be substituted after “, because only after substituting all '``' occurrences does it make sense to substitute
'`'.
|
| 2019 |
8217 |
’ |
'
|
|
’
|
|
must be substituted after ”, because only after substituting all "''" occurrences does it make sense to substitute
"'".
|
| FEFF |
65279 |
|
|
|

|
|
if there is a BOM (byte order mark) in the Unicode input, discard it. |