aboutsummaryrefslogtreecommitdiff
path: root/src/libhtml
diff options
context:
space:
mode:
authorrsc <devnull@localhost>2005-09-19 16:46:08 +0000
committerrsc <devnull@localhost>2005-09-19 16:46:08 +0000
commit5b76ae26d81d215084f42aa0de20231decce273e (patch)
tree391c78957a87a04610f676172e8aaf3614daef67 /src/libhtml
parent3a6c348fba8ca00ff22315a0e270eca5bc55e84d (diff)
downloadplan9port-5b76ae26d81d215084f42aa0de20231decce273e.tar.gz
plan9port-5b76ae26d81d215084f42aa0de20231decce273e.tar.bz2
plan9port-5b76ae26d81d215084f42aa0de20231decce273e.zip
The people who use emdash and endash are probably the same ones who think data is plural.
Diffstat (limited to 'src/libhtml')
-rw-r--r--src/libhtml/lex.c10
1 files changed, 6 insertions, 4 deletions
diff --git a/src/libhtml/lex.c b/src/libhtml/lex.c
index 0755ac34..81391f96 100644
--- a/src/libhtml/lex.c
+++ b/src/libhtml/lex.c
@@ -253,7 +253,7 @@ char* _attrnames[] = {
// Character entity to unicode character number map.
// Keep sorted by name.
StringInt *chartab;
-AsciiInt _chartab[142] = {
+AsciiInt _chartab[] = {
{"AElig", 198},
{"Aacute", 193},
{"Acirc", 194},
@@ -310,9 +310,9 @@ AsciiInt _chartab[142] = {
{"eacute", 233},
{"ecirc", 234},
{"egrave", 232},
- {"emdash", 8212},
+ {"emdash", 8212}, /* non-standard but commonly used */
{"emsp", 8195},
- {"endash", 8211},
+ {"endash", 8211}, /* non-standard but commonly used */
{"ensp", 8194},
{"epsilon", 949},
{"eta", 951},
@@ -336,10 +336,12 @@ AsciiInt _chartab[142] = {
{"ldots", 8230},
{"lt", 60},
{"macr", 175},
+ {"mdash", 8212},
{"micro", 181},
{"middot", 183},
{"mu", 956},
{"nbsp", 160},
+ {"ndash", 8211},
{"not", 172},
{"ntilde", 241},
{"nu", 957},
@@ -397,7 +399,7 @@ AsciiInt _chartab[142] = {
{"yuml", 255},
{"zeta", 950}
};
-#define NCHARTAB (sizeof(chartab)/sizeof(chartab[0]))
+#define NCHARTAB (sizeof(_chartab)/sizeof(_chartab[0]))
// Characters Winstart..Winend are those that Windows
// uses interpolated into the Latin1 set.