forked from SWI-Prolog/packages-sgml
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcharmap.c
104 lines (85 loc) · 2.54 KB
/
charmap.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
/* $Id$
Part of SWI-Prolog
Author: Jan Wielemaker
E-mail: [email protected]
WWW: http://www.swi-prolog.org
Copyright (C): 1985-2002, University of Amsterdam
This library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
This library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with this library; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#include <stdio.h>
#include <stdlib.h>
#include "dtd.h"
static void
char_range(dtd_charclass *map, int from, int to, int msk)
{ unsigned char *ca;
int i;
for(i=from, ca=map->class+i; i++<=to; )
*ca++ |= msk;
}
dtd_charclass *
new_charclass()
{ dtd_charclass *map = sgml_calloc(1, sizeof(*map));
unsigned char *ca = map->class;
char_range(map, 'a', 'z', CH_LCLETTER);
char_range(map, 'A', 'Z', CH_LCLETTER);
char_range(map, '0', '9', CH_DIGIT);
ca['.'] |= CH_CNM;
ca['-'] |= CH_CNM;
ca[183] |= CH_CNM; /* XML */
ca[':'] |= CH_CNMSTRT; /* HTML and XML */
ca['_'] |= CH_CNMSTRT; /* HTML and XML */
char_range(map, 192, 214, CH_CNMSTRT); /* XML ISO-LATIN-1 accented chars */
char_range(map, 216, 246, CH_CNMSTRT);
char_range(map, 248, 255, CH_CNMSTRT);
ca['\t'] |= CH_WHITE;
ca[' '] |= CH_WHITE;
ca['\r'] |= CH_RE;
ca['\n'] |= CH_RS;
return map;
}
dtd_charfunc *
new_charfunc()
{ dtd_charfunc *f = sgml_calloc(1, sizeof(*f));
ichar *cf = f->func;
cf[CF_STAGO] = '<';
cf[CF_STAGC] = '>';
cf[CF_ETAGO1] = '<';
cf[CF_ETAGO2] = '/';
cf[CF_VI] = '=';
cf[CF_NS] = ':';
cf[CF_LIT] = '"';
cf[CF_LITA] = '\'';
cf[CF_PERO] = '%';
cf[CF_ERO] = '&';
cf[CF_ERC] = ';';
cf[CF_MDO1] = '<';
cf[CF_MDO2] = '!';
cf[CF_MDC] = '>';
cf[CF_PRO1] = '<';
cf[CF_PRO2] = '?';
cf[CF_PRC] = '>';
cf[CF_GRPO] = '(';
cf[CF_GRPC] = ')';
cf[CF_SEQ] = ',';
cf[CF_AND] = '&';
cf[CF_OR] = '|';
cf[CF_OPT] = '?';
cf[CF_PLUS] = '+';
cf[CF_DSO] = '[';
cf[CF_DSC] = ']';
cf[CF_REP] = '*';
cf[CF_RS] = '\n';
cf[CF_RE] = '\r';
cf[CF_CMT] = '-';
return f;
}