Annotation of libwww/Library/src/HTMLPDTD.c, revision 2.12.2.1
2.12 frystyk 1: /* HTMLPDTD.c
2: ** STATIC DTD FOR HTML
3: **
4: ** (c) COPYRIGHT CERN 1994.
5: ** Please first read the full copyright statement in the file COPYRIGH.
2.1 timbl 6: **
7: ** 6 Nov 93 MD Increased size of img_attr array to make space
8: ** for terminator.
9: */
10:
2.12.2.1! frystyk 11: /* Library include files */
! 12: #include "tcp.h"
! 13: #include "HTUtils.h"
2.1 timbl 14: #include "HTMLPDTD.h"
15:
16: /* Entity Names
17: ** ------------
18: **
19: ** This table must be matched exactly with ALL the translation tables
20: */
2.11 timbl 21:
2.10 timbl 22: static CONST char* entities[HTML_ENTITIES] = {
2.1 timbl 23: "AElig", /* capital AE diphthong (ligature) */
24: "Aacute", /* capital A, acute accent */
25: "Acirc", /* capital A, circumflex accent */
26: "Agrave", /* capital A, grave accent */
27: "Aring", /* capital A, ring */
28: "Atilde", /* capital A, tilde */
29: "Auml", /* capital A, dieresis or umlaut mark */
30: "Ccedil", /* capital C, cedilla */
31: "ETH", /* capital Eth, Icelandic */
32: "Eacute", /* capital E, acute accent */
33: "Ecirc", /* capital E, circumflex accent */
34: "Egrave", /* capital E, grave accent */
35: "Euml", /* capital E, dieresis or umlaut mark */
36: "Iacute", /* capital I, acute accent */
37: "Icirc", /* capital I, circumflex accent */
38: "Igrave", /* capital I, grave accent */
39: "Iuml", /* capital I, dieresis or umlaut mark */
40: "Ntilde", /* capital N, tilde */
41: "Oacute", /* capital O, acute accent */
42: "Ocirc", /* capital O, circumflex accent */
43: "Ograve", /* capital O, grave accent */
44: "Oslash", /* capital O, slash */
45: "Otilde", /* capital O, tilde */
46: "Ouml", /* capital O, dieresis or umlaut mark */
47: "THORN", /* capital THORN, Icelandic */
48: "Uacute", /* capital U, acute accent */
49: "Ucirc", /* capital U, circumflex accent */
50: "Ugrave", /* capital U, grave accent */
51: "Uuml", /* capital U, dieresis or umlaut mark */
52: "Yacute", /* capital Y, acute accent */
53: "aacute", /* small a, acute accent */
54: "acirc", /* small a, circumflex accent */
55: "aelig", /* small ae diphthong (ligature) */
56: "agrave", /* small a, grave accent */
57: "amp", /* ampersand */
58: "aring", /* small a, ring */
59: "atilde", /* small a, tilde */
60: "auml", /* small a, dieresis or umlaut mark */
61: "ccedil", /* small c, cedilla */
62: "eacute", /* small e, acute accent */
63: "ecirc", /* small e, circumflex accent */
64: "egrave", /* small e, grave accent */
65: "eth", /* small eth, Icelandic */
66: "euml", /* small e, dieresis or umlaut mark */
67: "gt", /* greater than */
68: "iacute", /* small i, acute accent */
69: "icirc", /* small i, circumflex accent */
70: "igrave", /* small i, grave accent */
71: "iuml", /* small i, dieresis or umlaut mark */
72: "lt", /* less than */
73: "ntilde", /* small n, tilde */
74: "oacute", /* small o, acute accent */
75: "ocirc", /* small o, circumflex accent */
76: "ograve", /* small o, grave accent */
77: "oslash", /* small o, slash */
78: "otilde", /* small o, tilde */
2.10 timbl 79: "ouml", /* small o, dieresis or umlaut mark */
80: "quot", /* double quote sign - June 1994 */
2.1 timbl 81: "szlig", /* small sharp s, German (sz ligature) */
82: "thorn", /* small thorn, Icelandic */
83: "uacute", /* small u, acute accent */
84: "ucirc", /* small u, circumflex accent */
85: "ugrave", /* small u, grave accent */
86: "uuml", /* small u, dieresis or umlaut mark */
87: "yacute", /* small y, acute accent */
88: "yuml", /* small y, dieresis or umlaut mark */
89: };
90:
91:
92:
93: /* Attribute Lists
94: ** ---------------
95: **
96: ** Lists must be in alphatbetical order by attribute name
97: ** The tag elements contain the number of attributes
98: */
99: static attr no_attr[1] =
100: {{ 0 }};
101:
102: static attr a_attr[HTML_A_ATTRIBUTES+1] = { /* Anchor attributes */
103: { "EFFECT" },
104: { "HREF"},
105: { "ID" },
106: { "METHODS" },
107: { "NAME" }, /* Should be ID */
108: { "PRINT" },
109: { "REL" }, /* Relationship */
110: { "REV" }, /* Reverse relationship */
111: { "SHAPE" },
112: { "TITLE" },
113: { 0 } /* Terminate list */
114: };
115:
116: static attr base_attr[] = { /* BASE attributes */
117: { "HREF"},
118: { 0 } /* Terminate list */
119: };
120:
121:
122: static attr changed_attr[] = {
123: { "ID" },
124: { "IDREF" },
125: { 0 } /* terminate list */
126: };
127:
128: static attr fig_attr[] = { /* Figures */
129: { "ALIGN" },
130: { "ID" },
131: { "INDEX" },
132: { "ISMAP" }, /* @@@ NO! */
133: { "LANG" },
134: { "SRC" },
135: { 0 } /* terminate list */
136: };
137:
138: static attr form_attr[] = { /* General, for many things */
139: { "ACTION" },
140: { "ID" },
141: { "INDEX" },
142: { "LANG" },
143: { "METHOD" },
144: { 0 } /* terminate list */
145: };
146:
147: static attr gen_attr[] = { /* General, for many things */
148: { "ID" },
149: { "INDEX" },
150: { "LANG" },
151: { 0 } /* terminate list */
152: };
153:
154: static attr htmlplus_attr[] = { /* wrapper HTMLPLUS */
155: { "FORMS" },
156: { "VERSION" },
157: { 0 } /* terminate list */
158: };
159:
160: static attr id_attr[2] = {
161: { "ID" },
162: { 0 } /* terminate list */
163: };
164:
165: static attr image_attr[HTML_IMAGE_ATTRIBUTES+1] = { /* Image attributes */
166: { "ALIGN" },
167: { "ISMAP"}, /* Use HTTP SpaceJump instead */
168: { "LANG" },
169: { "SEETHRU"},
170: { "SRC"},
171: { 0 } /* Terminate list */
172: };
173:
174: static attr img_attr[HTML_IMG_ATTRIBUTES+1] = { /* IMG attributes */
175: { "ALIGN" },
176: { "ALT" },
177: { "ISMAP"}, /* Use HTTP SpaceJump instead */
178: { "SEETHRU"},
179: { "SRC"},
180: { 0 } /* Terminate list */
181: };
182:
183: static attr input_attr[HTML_INPUT_ATTRIBUTES+1] = {
184: { "ALIGN" },
185: { "CHECKED" },
186: { "DISABLED" },
187: { "ERROR" },
188: { "MAX" },
189: { "MIN" },
190: { "NAME" },
191: { "SIZE" },
192: { "SRC" },
193: { "TYPE" },
194: { "VALUE" },
2.2 timbl 195: { "0" }
2.1 timbl 196: };
197:
198: static attr l_attr[] = {
199: { "ALIGN"},
200: { "ID" },
201: { "LANG" },
202: { "INDEX" },
203: { 0 } /* Terminate list */
204: };
205:
206: static attr li_attr[] = {
207: { "ID" },
208: { "LANG" },
209: { "INDEX" },
210: { "SRC"},
211: { 0 } /* Terminate list */
212: };
213:
214: static attr link_attr[HTML_LINK_ATTRIBUTES+1] = { /* link attributes */
215: { "HREF"},
216: { "IDREF" },
217: { "METHODS" },
218: { "REL" }, /* Relationship */
219: { "REV" }, /* Reverse relationship */
220: { 0 } /* Terminate list */
221: };
222:
223: static attr list_attr[] = {
224: { "COMPACT"},
225: { "ID" },
226: { "LANG" },
227: { "INDEX" },
228: { 0 } /* Terminate list */
229: };
230:
2.3 frystyk 231: static attr glossary_attr[HTML_DL_ATTRIBUTES+1] = {
232: { "ID" },
233: { "COMPACT " },
234: { "INDEX" },
2.1 timbl 235: { 0 } /* Terminate list */
236: };
237:
238: static attr nextid_attr[HTML_NEXTID_ATTRIBUTES+1] = {
239: { "N" },
240: { 0 } /* Terminate list */
241: };
242:
243: static attr note_attr[HTML_NOTE_ATTRIBUTES+1] = { /* Footnotes etc etc */
244: { "ID" },
245: { "INDEX" },
246: { "LANG" },
247: { "ROLE" },
248: { 0 } /* terminate list */
249: };
250:
251: static attr option_attr[HTML_OPTION_ATTRIBUTES+1] = {
252: { "DISABLED" },
253: { "LANG" },
254: { "SELECTED" },
255: { 0 }
256: };
257:
258: #ifdef OLD_CODE
259: static attr pre_attr[HTML_PRE_ATTRIBUTES+1] = {
260: { "WIDTH" },
261: { 0 } /* Terminate list */
262: };
263: #endif
264:
265: static attr render_attr[HTML_RENDER_ATTRIBUTES+1] = {
266: { "STYLE" },
267: { "TAG" },
268: { 0 } /* Terminate list */
269: };
270:
271: static attr select_attr[HTML_SELECT_ATTRIBUTES+1] = {
272: { "ERROR" },
273: { "LANG" },
274: { "NAME" },
275: { "SEVERAL" },
276: { 0 },
277: };
278:
279: static attr tab_attr[HTML_TAB_ATTRIBUTES+1] = {
280: { "ALIGN" },
281: { "AT" },
282: { 0 }
283: };
284:
285: static attr table_attr[HTML_TABLE_ATTRIBUTES+1] = {
286: { "BORDER" },
287: { "ID" },
288: { "INDEX" },
289: { "LANG" },
290: { 0 }
291: };
292:
293: static attr td_attr[HTML_TD_ATTRIBUTES+1] = {
294: { "ALIGN" },
295: { "COLSPAN" },
296: { "ROWSPAN" },
297: { "TAG" },
298: { 0 }
299: };
300:
301: static attr textarea_attr[HTML_TEXTAREA_ATTRIBUTES+1] = {
302: { "COLS" },
303: { "DISABLED" },
304: { "ERROR" },
305: { "LANG" },
306: { "NAME" },
307: { "ROWS" },
308: { 0 }
309: };
310:
311: static attr ul_attr[HTML_UL_ATTRIBUTES+1] = {
312: { "COMPACT" },
313: { "ID" },
314: { "INDEX" },
315: { "LANG" },
316: { "PLAIN" },
317: { "WRAP" },
318: { 0 }
319: };
320:
321:
322: /* Elements
323: ** --------
324: **
325: ** Must match definitions in HTMLPDTD.html!
326: ** Must be in alphabetical order.
327: **
328: ** HTML is included to allow HTML documents to be parsed as a subset.
2.4 frystyk 329: ** TITLE is changed to type SGML_MIXED so it get parsed as well
330: ** Henrik 08/03-94
2.1 timbl 331: **
332: ** Name, Attributes, content
333: */
334: static HTTag tags[HTMLP_ELEMENTS] = {
335: { "A" , a_attr, HTML_A_ATTRIBUTES, SGML_MIXED },
336: { "ABBREV" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
337: { "ABSTRACT" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
338: { "ACRONYM" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
339: { "ADDED" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
340: { "ADDRESS" , no_attr, 0, SGML_MIXED },
341: { "ARG" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
342: { "B" , no_attr, 0, SGML_MIXED },
343: { "BASE" , base_attr, HTML_BASE_ATTRIBUTES, SGML_MIXED },
344: { "BLOCKQUOTE", no_attr, 0, SGML_MIXED },
345: { "BODY" , no_attr, 0, SGML_MIXED },
346: { "BOX" , no_attr, 0, SGML_MIXED },
347: { "BR" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_EMPTY },
348: { "BYLINE" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
349: { "CAPTION" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
350: { "CHANGED" , changed_attr, HTML_CHANGED_ATTRIBUTES, SGML_MIXED },
351: { "CITE" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
352: { "CMD" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
353: { "CODE" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
354: { "COMMENT" , no_attr, 0, SGML_MIXED },
355: { "DD" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_EMPTY },
356: { "DFN" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
357: { "DIR" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
358: { "DL" , glossary_attr,HTML_DL_ATTRIBUTES, SGML_MIXED },
359: { "DT" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_EMPTY },
360: { "EM" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
361: { "FIG" , fig_attr, HTML_FIG_ATTRIBUTES, SGML_MIXED },
362: { "FOOTNOTE" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
363: { "FORM" , form_attr, HTML_FORM_ATTRIBUTES, SGML_MIXED },
364: { "H1" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
365: { "H2" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
366: { "H3" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
367: { "H4" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
368: { "H5" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
369: { "H6" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
370: { "H7" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
371: { "HEAD" , no_attr, 0, SGML_MIXED },
372: { "HR" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_EMPTY },
373: { "HTML" , no_attr, 0, SGML_MIXED }, /* */
2.2 timbl 374: { "HTMLPLUS", htmlplus_attr,HTML_HTMLPLUS_ATTRIBUTES, SGML_MIXED },
2.1 timbl 375: { "I" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
376: { "IMAGE" , image_attr, HTML_IMAGE_ATTRIBUTES, SGML_EMPTY },
2.7 frystyk 377: { "IMG" , img_attr, HTML_IMG_ATTRIBUTES, SGML_EMPTY },
2.1 timbl 378: { "INPUT" , input_attr, HTML_INPUT_ATTRIBUTES, SGML_EMPTY },
379: { "ISINDEX" , no_attr, 0, SGML_EMPTY },
380: { "KBD" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
381: { "L" , l_attr, HTML_L_ATTRIBUTES, SGML_MIXED },
382: { "LI" , li_attr, HTML_LI_ATTRIBUTES, SGML_EMPTY },
383: { "LINK" , link_attr, HTML_LINK_ATTRIBUTES, SGML_EMPTY },
384: { "LISTING" , no_attr, 0, SGML_LITERAL },
385: { "LIT" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
386: { "MARGIN" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
387: { "MATH" , id_attr, HTML_ID_ATTRIBUTE, SGML_MIXED },
388: { "MENU" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
389: { "NEXTID" , nextid_attr, 1, SGML_EMPTY },
390: { "NOTE" , note_attr, HTML_NOTE_ATTRIBUTES, SGML_EMPTY },
391: { "OL" , list_attr, HTML_LIST_ATTRIBUTES, SGML_MIXED },
2.8 timbl 392: { "OPTION" , option_attr, HTML_OPTION_ATTRIBUTES, SGML_EMPTY },/*Mixed?*/
2.1 timbl 393: { "OVER" , no_attr, 0, SGML_MIXED },
394: { "P" , l_attr, HTML_L_ATTRIBUTES, SGML_EMPTY },
395: { "PERSON" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
396: { "PLAINTEXT", no_attr, 0, SGML_LITERAL },
397: { "PRE" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
398: { "Q" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
399: { "QUOTE" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
400: { "RENDER" , render_attr, HTML_RENDER_ATTRIBUTES, SGML_MIXED },
401: { "REMOVED" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
402: { "S" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
403: { "SAMP" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
404: { "SELECT" , select_attr, HTML_SELECT_ATTRIBUTES, SGML_MIXED },
405: { "STRONG" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
406: { "SUB" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
407: { "SUP" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
408: { "TAB" , tab_attr, HTML_TAB_ATTRIBUTES, SGML_EMPTY },
409: { "TABLE" , table_attr, HTML_TABLE_ATTRIBUTES, SGML_MIXED },
410: { "TD" , td_attr, HTML_TABLE_ATTRIBUTES, SGML_MIXED },
411: { "TEXTAREA", textarea_attr,HTML_TEXTAREA_ATTRIBUTES,SGML_MIXED},
412: { "TH" , td_attr, HTML_TD_ATTRIBUTES, SGML_MIXED },
2.4 frystyk 413: { "TITLE" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
2.1 timbl 414: { "TR" , id_attr, HTML_ID_ATTRIBUTE, SGML_MIXED },
415: { "TT" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
416: { "U" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
417: { "UL" , ul_attr, HTML_UL_ATTRIBUTES, SGML_MIXED },
418: { "VAR" , gen_attr, HTML_GEN_ATTRIBUTES, SGML_MIXED },
419: { "XMP" , no_attr, 0, SGML_LITERAL }
420: };
421:
422:
423: #ifdef OLD_CODE
424: PUBLIC CONST SGML_dtd HTML_dtd = {
425: tags,
426: HTML_ELEMENTS,
427: entities,
428: sizeof(entities)/sizeof(char**)
429: };
430: #endif
431:
432: PUBLIC CONST SGML_dtd HTMLP_dtd = {
433: tags,
434: HTMLP_ELEMENTS,
435: entities,
436: sizeof(entities)/sizeof(char**)
437: };
438:
439: /* Utility Routine: useful for people building HTML objects */
440:
441: /* Start anchor element
442: ** --------------------
443: **
444: ** It is kinda convenient to have a particulr routine for
445: ** starting an anchor element, as everything else for HTML is
446: ** simple anyway.
447: */
448: struct _HTStructured {
449: HTStructuredClass * isa;
450: /* ... */
451: };
452:
453: PUBLIC void HTStartAnchor ARGS3(HTStructured *, obj,
454: CONST char *, name,
455: CONST char *, href)
456: {
457: BOOL present[HTML_A_ATTRIBUTES];
458: CONST char* value[HTML_A_ATTRIBUTES];
459:
460: {
461: int i;
462: for(i=0; i<HTML_A_ATTRIBUTES; i++)
463: present[i] = NO;
464: }
465: if (name) {
466: present[HTML_A_NAME] = YES;
467: value[HTML_A_NAME] = name;
468: }
469: if (href) {
470: present[HTML_A_HREF] = YES;
471: value[HTML_A_HREF] = href;
472: }
473:
474: (*obj->isa->start_element)(obj, HTML_A , present, value);
475:
476: }
477:
2.5 frystyk 478: /* Utility Routine: useful for people building HTML objects */
479:
480: /* Put image element
481: ** --------------------
482: **
483: ** Hopefully as usefull as HTStartAnchor. Henrik 23/03-94
484: */
485: PUBLIC void HTMLPutImg ARGS4(HTStructured *, obj,
486: CONST char *, src,
487: CONST char *, alt,
488: CONST char *, align)
489: {
490: BOOL present[HTML_IMG_ATTRIBUTES];
491: CONST char* value[HTML_IMG_ATTRIBUTES];
492:
493: {
494: int i;
495: for(i=0; i<HTML_IMG_ATTRIBUTES; i++)
496: present[i] = NO;
497: }
498: if (src) {
499: present[HTML_IMG_SRC] = YES;
500: value[HTML_IMG_SRC] = src;
501: }
502: if (alt) {
503: present[HTML_IMG_ALT] = YES;
504: value[HTML_IMG_ALT] = alt;
505: }
506: if (align) {
507: present[HTML_IMG_ALIGN] = YES;
508: value[HTML_IMG_ALIGN] = align;
509: }
510: (*obj->isa->start_element)(obj, HTML_IMG , present, value);
2.7 frystyk 511: /* (*obj->isa->end_element)(obj, HTML_IMG); */
2.5 frystyk 512: }
513:
514:
2.1 timbl 515: PUBLIC void HTNextID ARGS2(HTStructured *, obj,
2.9 timbl 516: CONST char *, next_one)
2.1 timbl 517: {
518: BOOL present[HTML_NEXTID_ATTRIBUTES];
519: CONST char* value[HTML_NEXTID_ATTRIBUTES];
520: {
521: int i;
522: for(i=0; i<HTML_NEXTID_ATTRIBUTES; i++)
523: present[i] = NO;
524: }
525: present[HTML_NEXTID_N] = YES;
2.9 timbl 526: value[HTML_NEXTID_N] = next_one;
2.1 timbl 527:
528: (*obj->isa->start_element)(obj, HTML_NEXTID , present, value);
529:
530: }
2.5 frystyk 531:
532:
2.1 timbl 533:
Webmaster