tidy-ext 0.1.7

Sign up to get free protection for your applications and to get access to all the features.
Files changed (65) hide show
  1. data/.gitignore +4 -0
  2. data/LICENSE +50 -0
  3. data/README +12 -0
  4. data/Rakefile +60 -0
  5. data/VERSION +1 -0
  6. data/ext/tidy/access.c +3310 -0
  7. data/ext/tidy/access.h +279 -0
  8. data/ext/tidy/alloc.c +107 -0
  9. data/ext/tidy/attrask.c +209 -0
  10. data/ext/tidy/attrdict.c +2398 -0
  11. data/ext/tidy/attrdict.h +122 -0
  12. data/ext/tidy/attrget.c +213 -0
  13. data/ext/tidy/attrs.c +1911 -0
  14. data/ext/tidy/attrs.h +374 -0
  15. data/ext/tidy/buffio.c +232 -0
  16. data/ext/tidy/buffio.h +118 -0
  17. data/ext/tidy/charsets.c +1032 -0
  18. data/ext/tidy/charsets.h +14 -0
  19. data/ext/tidy/clean.c +2674 -0
  20. data/ext/tidy/clean.h +87 -0
  21. data/ext/tidy/config.c +1746 -0
  22. data/ext/tidy/config.h +153 -0
  23. data/ext/tidy/entities.c +419 -0
  24. data/ext/tidy/entities.h +24 -0
  25. data/ext/tidy/extconf.rb +5 -0
  26. data/ext/tidy/fileio.c +106 -0
  27. data/ext/tidy/fileio.h +46 -0
  28. data/ext/tidy/forward.h +69 -0
  29. data/ext/tidy/iconvtc.c +105 -0
  30. data/ext/tidy/iconvtc.h +15 -0
  31. data/ext/tidy/istack.c +373 -0
  32. data/ext/tidy/lexer.c +3825 -0
  33. data/ext/tidy/lexer.h +617 -0
  34. data/ext/tidy/localize.c +1882 -0
  35. data/ext/tidy/mappedio.c +329 -0
  36. data/ext/tidy/mappedio.h +16 -0
  37. data/ext/tidy/message.h +207 -0
  38. data/ext/tidy/parser.c +4408 -0
  39. data/ext/tidy/parser.h +76 -0
  40. data/ext/tidy/platform.h +636 -0
  41. data/ext/tidy/pprint.c +2276 -0
  42. data/ext/tidy/pprint.h +93 -0
  43. data/ext/tidy/ruby-tidy.c +195 -0
  44. data/ext/tidy/streamio.c +1407 -0
  45. data/ext/tidy/streamio.h +222 -0
  46. data/ext/tidy/tagask.c +286 -0
  47. data/ext/tidy/tags.c +955 -0
  48. data/ext/tidy/tags.h +235 -0
  49. data/ext/tidy/tidy-int.h +129 -0
  50. data/ext/tidy/tidy.h +1097 -0
  51. data/ext/tidy/tidyenum.h +622 -0
  52. data/ext/tidy/tidylib.c +1751 -0
  53. data/ext/tidy/tmbstr.c +306 -0
  54. data/ext/tidy/tmbstr.h +92 -0
  55. data/ext/tidy/utf8.c +539 -0
  56. data/ext/tidy/utf8.h +52 -0
  57. data/ext/tidy/version.h +14 -0
  58. data/ext/tidy/win32tc.c +795 -0
  59. data/ext/tidy/win32tc.h +19 -0
  60. data/spec/spec_helper.rb +5 -0
  61. data/spec/tidy/compat_spec.rb +44 -0
  62. data/spec/tidy/remote_uri_spec.rb +14 -0
  63. data/spec/tidy/test1.html +5 -0
  64. data/spec/tidy/tidy_spec.rb +34 -0
  65. metadata +125 -0
@@ -0,0 +1,622 @@
1
+ #ifndef __TIDYENUM_H__
2
+ #define __TIDYENUM_H__
3
+
4
+ /* @file tidyenum.h -- Split public enums into separate header
5
+
6
+ Simplifies enum re-use in various wrappers. e.g. SWIG
7
+ generated wrappers and COM IDL files.
8
+
9
+ Copyright (c) 1998-2008 World Wide Web Consortium
10
+ (Massachusetts Institute of Technology, European Research
11
+ Consortium for Informatics and Mathematics, Keio University).
12
+ All Rights Reserved.
13
+
14
+ CVS Info :
15
+
16
+ $Author: arnaud02 $
17
+ $Date: 2008/06/18 20:18:54 $
18
+ $Revision: 1.18 $
19
+
20
+ Contributing Author(s):
21
+
22
+ Dave Raggett <dsr@w3.org>
23
+
24
+ The contributing author(s) would like to thank all those who
25
+ helped with testing, bug fixes and suggestions for improvements.
26
+ This wouldn't have been possible without your help.
27
+
28
+ COPYRIGHT NOTICE:
29
+
30
+ This software and documentation is provided "as is," and
31
+ the copyright holders and contributing author(s) make no
32
+ representations or warranties, express or implied, including
33
+ but not limited to, warranties of merchantability or fitness
34
+ for any particular purpose or that the use of the software or
35
+ documentation will not infringe any third party patents,
36
+ copyrights, trademarks or other rights.
37
+
38
+ The copyright holders and contributing author(s) will not be held
39
+ liable for any direct, indirect, special or consequential damages
40
+ arising out of any use of the software or documentation, even if
41
+ advised of the possibility of such damage.
42
+
43
+ Permission is hereby granted to use, copy, modify, and distribute
44
+ this source code, or portions hereof, documentation and executables,
45
+ for any purpose, without fee, subject to the following restrictions:
46
+
47
+ 1. The origin of this source code must not be misrepresented.
48
+ 2. Altered versions must be plainly marked as such and must
49
+ not be misrepresented as being the original source.
50
+ 3. This Copyright notice may not be removed or altered from any
51
+ source or altered source distribution.
52
+
53
+ The copyright holders and contributing author(s) specifically
54
+ permit, without fee, and encourage the use of this source code
55
+ as a component for supporting the Hypertext Markup Language in
56
+ commercial products. If you use this source code in a product,
57
+ acknowledgment is not required but would be appreciated.
58
+
59
+
60
+ Created 2001-05-20 by Charles Reitzel
61
+ Updated 2002-07-01 by Charles Reitzel - 1st Implementation
62
+
63
+ */
64
+
65
+ #ifdef __cplusplus
66
+ extern "C" {
67
+ #endif
68
+
69
+ /* Enumerate configuration options
70
+ */
71
+
72
+ /** Categories of Tidy configuration options.
73
+ ** No explicit values are assigned, so the enumerators number 0..4 in declaration order. */
74
+ typedef enum
75
+ {
76
+ TidyMarkup, /**< Markup options: (X)HTML version, etc. */
77
+ TidyDiagnostics, /**< Diagnostics options */
78
+ TidyPrettyPrint, /**< Output layout options */
79
+ TidyEncoding, /**< Character encoding options */
80
+ TidyMiscellaneous /**< File handling, message format, etc. */
81
+ } TidyConfigCategory;
82
+
83
+
84
+ /** Option IDs. Used to get/set option values.
85
+ ** Each #if/#else pair below contributes the same number of enumerators in both branches (the *NotUsed names are placeholders), so later IDs keep the same values whether or not SUPPORT_ASIAN_ENCODINGS and SUPPORT_UTF16_ENCODINGS are enabled. */
86
+ typedef enum
87
+ {
88
+ TidyUnknownOption, /**< Unknown option! */
89
+ TidyIndentSpaces, /**< Indentation n spaces */
90
+ TidyWrapLen, /**< Wrap margin */
91
+ TidyTabSize, /**< Expand tabs to n spaces */
92
+
93
+ TidyCharEncoding, /**< In/out character encoding */
94
+ TidyInCharEncoding, /**< Input character encoding (if different) */
95
+ TidyOutCharEncoding, /**< Output character encoding (if different) */
96
+ TidyNewline, /**< Output line ending (default to platform) */
97
+
98
+ TidyDoctypeMode, /**< See doctype property */
99
+ TidyDoctype, /**< User specified doctype */
100
+
101
+ TidyDuplicateAttrs, /**< Keep first or last duplicate attribute */
102
+ TidyAltText, /**< Default text for alt attribute */
103
+
104
+ /* obsolete */
105
+ TidySlideStyle, /**< Style sheet for slides: not used for anything yet */
106
+
107
+ TidyErrFile, /**< File name to write errors to */
108
+ TidyOutFile, /**< File name to write markup to */
109
+ TidyWriteBack, /**< If true then output tidied markup */
110
+ TidyShowMarkup, /**< If false, normal output is suppressed */
111
+ TidyShowWarnings, /**< However errors are always shown */
112
+ TidyQuiet, /**< No 'Parsing X', guessed DTD or summary */
113
+ TidyIndentContent, /**< Indent content of appropriate tags */
114
+ /**< "auto" does text/block level content indentation */
115
+ TidyHideEndTags, /**< Suppress optional end tags */
116
+ TidyXmlTags, /**< Treat input as XML */
117
+ TidyXmlOut, /**< Create output as XML */
118
+ TidyXhtmlOut, /**< Output extensible HTML */
119
+ TidyHtmlOut, /**< Output plain HTML, even for XHTML input.
120
+ Yes means set explicitly. */
121
+ TidyXmlDecl, /**< Add <?xml?> for XML docs */
122
+ TidyUpperCaseTags, /**< Output tags in upper not lower case */
123
+ TidyUpperCaseAttrs, /**< Output attributes in upper not lower case */
124
+ TidyMakeBare, /**< Make bare HTML: remove Microsoft cruft */
125
+ TidyMakeClean, /**< Replace presentational clutter by style rules */
126
+ TidyLogicalEmphasis, /**< Replace i by em and b by strong */
127
+ TidyDropPropAttrs, /**< Discard proprietary attributes */
128
+ TidyDropFontTags, /**< Discard presentation tags */
129
+ TidyDropEmptyParas, /**< Discard empty p elements */
130
+ TidyFixComments, /**< Fix comments with adjacent hyphens */
131
+ TidyBreakBeforeBR, /**< Output newline before <br> or not? */
132
+
133
+ /* obsolete */
134
+ TidyBurstSlides, /**< Create slides on each h2 element */
135
+
136
+ TidyNumEntities, /**< Use numeric entities */
137
+ TidyQuoteMarks, /**< Output " marks as &quot; */
138
+ TidyQuoteNbsp, /**< Output non-breaking space as entity */
139
+ TidyQuoteAmpersand, /**< Output naked ampersand as &amp; */
140
+ TidyWrapAttVals, /**< Wrap within attribute values */
141
+ TidyWrapScriptlets, /**< Wrap within JavaScript string literals */
142
+ TidyWrapSection, /**< Wrap within <![ ... ]> section tags */
143
+ TidyWrapAsp, /**< Wrap within ASP pseudo elements */
144
+ TidyWrapJste, /**< Wrap within JSTE pseudo elements */
145
+ TidyWrapPhp, /**< Wrap within PHP pseudo elements */
146
+ TidyFixBackslash, /**< Fix URLs by replacing \ with / */
147
+ TidyIndentAttributes,/**< Newline+indent before each attribute */
148
+ TidyXmlPIs, /**< If set to yes PIs must end with ?> */
149
+ TidyXmlSpace, /**< If set to yes adds xml:space attr as needed */
150
+ TidyEncloseBodyText, /**< If yes text at body is wrapped in P's */
151
+ TidyEncloseBlockText,/**< If yes text in blocks is wrapped in P's */
152
+ TidyKeepFileTimes, /**< If yes last modified time is preserved */
153
+ TidyWord2000, /**< Draconian cleaning for Word2000 */
154
+ TidyMark, /**< Add meta element indicating tidied doc */
155
+ TidyEmacs, /**< If true format error output for GNU Emacs */
156
+ TidyEmacsFile, /**< Name of current Emacs file */
157
+ TidyLiteralAttribs, /**< If true attributes may use newlines */
158
+ TidyBodyOnly, /**< Output BODY content only */
159
+ TidyFixUri, /**< Applies URI encoding if necessary */
160
+ TidyLowerLiterals, /**< Folds known attribute values to lower case */
161
+ TidyHideComments, /**< Hides all (real) comments in output */
162
+ TidyIndentCdata, /**< Indent <![CDATA[ ... ]]> section */
163
+ TidyForceOutput, /**< Output document even if errors were found */
164
+ TidyShowErrors, /**< Number of errors to put out */
165
+ TidyAsciiChars, /**< Convert quotes and dashes to nearest ASCII char */
166
+ TidyJoinClasses, /**< Join multiple class attributes */
167
+ TidyJoinStyles, /**< Join multiple style attributes */
168
+ TidyEscapeCdata, /**< Replace <![CDATA[]]> sections with escaped text */
169
+
170
+ #if SUPPORT_ASIAN_ENCODINGS
171
+ TidyLanguage, /**< Language property: not used for anything yet */
172
+ TidyNCR, /**< Allow numeric character references */
173
+ #else
174
+ TidyLanguageNotUsed, /**< Placeholder occupying the TidyLanguage slot */
175
+ TidyNCRNotUsed, /**< Placeholder occupying the TidyNCR slot */
176
+ #endif
177
+ #if SUPPORT_UTF16_ENCODINGS
178
+ TidyOutputBOM, /**< Output a Byte Order Mark (BOM) for UTF-16 encodings */
179
+ /**< auto: if input stream has BOM, we output a BOM */
180
+ #else
181
+ TidyOutputBOMNotUsed, /**< Placeholder occupying the TidyOutputBOM slot */
182
+ #endif
183
+
184
+ TidyReplaceColor, /**< Replace hex color attribute values with names */
185
+ TidyCSSPrefix, /**< CSS class naming for -clean option */
186
+
187
+ TidyInlineTags, /**< Declared inline tags */
188
+ TidyBlockTags, /**< Declared block tags */
189
+ TidyEmptyTags, /**< Declared empty tags */
190
+ TidyPreTags, /**< Declared pre tags */
191
+
192
+ TidyAccessibilityCheckLevel, /**< Accessibility check level
193
+ 0 (old style), or 1, 2, 3 */
194
+
195
+ TidyVertSpace, /**< degree to which markup is spread out vertically */
196
+ #if SUPPORT_ASIAN_ENCODINGS
197
+ TidyPunctWrap, /**< consider punctuation and breaking spaces for wrapping */
198
+ #else
199
+ TidyPunctWrapNotUsed, /**< Placeholder occupying the TidyPunctWrap slot */
200
+ #endif
201
+ TidyMergeDivs, /**< Merge multiple DIVs */
202
+ TidyDecorateInferredUL, /**< Mark inferred UL elements with no indent CSS */
203
+ TidyPreserveEntities, /**< Preserve entities */
204
+ TidySortAttributes, /**< Sort attributes */
205
+ TidyMergeSpans, /**< Merge multiple SPANs */
206
+ TidyAnchorAsName, /**< Define anchors as name attributes */
207
+ N_TIDY_OPTIONS /**< Must be last: its value equals the number of option IDs above */
208
+ } TidyOptionId;
209
+
210
+ /** Option data types.
211
+ ** Implicit values: TidyString = 0, TidyInteger = 1, TidyBoolean = 2. */
212
+ typedef enum
213
+ {
214
+ TidyString, /**< String */
215
+ TidyInteger, /**< Integer or enumeration */
216
+ TidyBoolean /**< Boolean flag */
217
+ } TidyOptionType;
218
+
219
+
220
+ /** AutoBool values used by ParseBool, ParseTriState, ParseIndent, ParseBOM
221
+ ** (those parsers are not declared in this header). No/yes take the implicit values 0/1. */
222
+ typedef enum
223
+ {
224
+ TidyNoState, /**< maps to 'no' (value 0) */
225
+ TidyYesState, /**< maps to 'yes' (value 1) */
226
+ TidyAutoState /**< Automatic (value 2) */
227
+ } TidyTriState;
228
+
229
+ /** TidyNewline option values to control output line endings.
230
+ ** Implicit values: TidyLF = 0, TidyCRLF = 1, TidyCR = 2. */
231
+ typedef enum
232
+ {
233
+ TidyLF, /**< Use Unix style: LF */
234
+ TidyCRLF, /**< Use DOS/Windows style: CR+LF */
235
+ TidyCR /**< Use Macintosh style: CR */
236
+ } TidyLineEnding;
237
+
238
+
239
+ /** Mode controlling treatment of doctype.
240
+ ** Implicit values run from 0 (TidyDoctypeOmit) to 4 (TidyDoctypeUser). */
241
+ typedef enum
242
+ {
243
+ TidyDoctypeOmit, /**< Omit DOCTYPE altogether */
244
+ TidyDoctypeAuto, /**< Keep DOCTYPE in input. Set version to content */
245
+ TidyDoctypeStrict, /**< Convert document to HTML 4 strict content model */
246
+ TidyDoctypeLoose, /**< Convert document to HTML 4 transitional
247
+ content model */
248
+ TidyDoctypeUser /**< Set DOCTYPE FPI explicitly */
249
+ } TidyDoctypeModes;
250
+
251
+ /** Mode controlling treatment of duplicate attributes
252
+ ** (which of the repeated attributes is kept). */
253
+ typedef enum
254
+ {
255
+ TidyKeepFirst, /**< Keep the first of the duplicate attributes (value 0) */
256
+ TidyKeepLast /**< Keep the last of the duplicate attributes (value 1) */
257
+ } TidyDupAttrModes;
258
+
259
+ /** Mode controlling how attributes are sorted.
260
+ ** NOTE(review): the per-value notes below are inferred from the names only; confirm against the implementation. */
261
+ typedef enum
262
+ {
263
+ TidySortAttrNone, /**< Presumably: no sorting (value 0) */
264
+ TidySortAttrAlpha /**< Presumably: alphabetical sorting (value 1) */
265
+ } TidyAttrSortStrategy;
266
+
267
+ /* I/O and Message handling interface
268
+ **
269
+ ** By default, Tidy will define, create and use
270
+ ** instances of input and output handlers for
271
+ ** standard C buffered I/O (i.e. FILE* stdin,
272
+ ** FILE* stdout and FILE* stderr for content
273
+ ** input, content output and diagnostic output,
274
+ ** respectively). A FILE* cfgFile input handler
275
+ ** will be used for config files. Command line
276
+ ** options will just be set directly.
277
+ */
278
+
279
+ /** Message severity level.
280
+ ** Implicit values run from 0 (TidyInfo) to 6 (TidyFatal) in declaration order. */
281
+ typedef enum
282
+ {
283
+ TidyInfo, /**< Information about markup usage */
284
+ TidyWarning, /**< Warning message */
285
+ TidyConfig, /**< Configuration error */
286
+ TidyAccess, /**< Accessibility message */
287
+ TidyError, /**< Error message - output suppressed */
288
+ TidyBadDocument, /**< I/O or file system error */
289
+ TidyFatal /**< Crash! */
290
+ } TidyReportLevel;
291
+
292
+
293
+ /* Document tree traversal functions
294
+ */
295
+
296
+ /** Node types.
297
+ ** Implicit values run from 0 (TidyNode_Root) to 13 (TidyNode_XmlDecl) in declaration order. */
298
+ typedef enum
299
+ {
300
+ TidyNode_Root, /**< Root */
301
+ TidyNode_DocType, /**< DOCTYPE */
302
+ TidyNode_Comment, /**< Comment */
303
+ TidyNode_ProcIns, /**< Processing Instruction */
304
+ TidyNode_Text, /**< Text */
305
+ TidyNode_Start, /**< Start Tag */
306
+ TidyNode_End, /**< End Tag */
307
+ TidyNode_StartEnd, /**< Start/End (empty) Tag */
308
+ TidyNode_CDATA, /**< Unparsed Text */
309
+ TidyNode_Section, /**< XML Section */
310
+ TidyNode_Asp, /**< ASP Source */
311
+ TidyNode_Jste, /**< JSTE Source */
312
+ TidyNode_Php, /**< PHP Source */
313
+ TidyNode_XmlDecl /**< XML Declaration */
314
+ } TidyNodeType;
315
+
316
+
317
+ /** Known HTML element types.
318
+ ** Values are implicit and sequential, starting at 0 with TidyTag_UNKNOWN. */
319
+ typedef enum
320
+ {
321
+ TidyTag_UNKNOWN, /**< Unknown tag! */
322
+ TidyTag_A, /**< A */
323
+ TidyTag_ABBR, /**< ABBR */
324
+ TidyTag_ACRONYM, /**< ACRONYM */
325
+ TidyTag_ADDRESS, /**< ADDRESS */
326
+ TidyTag_ALIGN, /**< ALIGN */
327
+ TidyTag_APPLET, /**< APPLET */
328
+ TidyTag_AREA, /**< AREA */
329
+ TidyTag_B, /**< B */
330
+ TidyTag_BASE, /**< BASE */
331
+ TidyTag_BASEFONT, /**< BASEFONT */
332
+ TidyTag_BDO, /**< BDO */
333
+ TidyTag_BGSOUND, /**< BGSOUND */
334
+ TidyTag_BIG, /**< BIG */
335
+ TidyTag_BLINK, /**< BLINK */
336
+ TidyTag_BLOCKQUOTE, /**< BLOCKQUOTE */
337
+ TidyTag_BODY, /**< BODY */
338
+ TidyTag_BR, /**< BR */
339
+ TidyTag_BUTTON, /**< BUTTON */
340
+ TidyTag_CAPTION, /**< CAPTION */
341
+ TidyTag_CENTER, /**< CENTER */
342
+ TidyTag_CITE, /**< CITE */
343
+ TidyTag_CODE, /**< CODE */
344
+ TidyTag_COL, /**< COL */
345
+ TidyTag_COLGROUP, /**< COLGROUP */
346
+ TidyTag_COMMENT, /**< COMMENT */
347
+ TidyTag_DD, /**< DD */
348
+ TidyTag_DEL, /**< DEL */
349
+ TidyTag_DFN, /**< DFN */
350
+ TidyTag_DIR, /**< DIR */
351
+ TidyTag_DIV, /**< DIV */
352
+ TidyTag_DL, /**< DL */
353
+ TidyTag_DT, /**< DT */
354
+ TidyTag_EM, /**< EM */
355
+ TidyTag_EMBED, /**< EMBED */
356
+ TidyTag_FIELDSET, /**< FIELDSET */
357
+ TidyTag_FONT, /**< FONT */
358
+ TidyTag_FORM, /**< FORM */
359
+ TidyTag_FRAME, /**< FRAME */
360
+ TidyTag_FRAMESET, /**< FRAMESET */
361
+ TidyTag_H1, /**< H1 */
362
+ TidyTag_H2, /**< H2 */
363
+ TidyTag_H3, /**< H3 */
364
+ TidyTag_H4, /**< H4 */
365
+ TidyTag_H5, /**< H5 */
366
+ TidyTag_H6, /**< H6 */
367
+ TidyTag_HEAD, /**< HEAD */
368
+ TidyTag_HR, /**< HR */
369
+ TidyTag_HTML, /**< HTML */
370
+ TidyTag_I, /**< I */
371
+ TidyTag_IFRAME, /**< IFRAME */
372
+ TidyTag_ILAYER, /**< ILAYER */
373
+ TidyTag_IMG, /**< IMG */
374
+ TidyTag_INPUT, /**< INPUT */
375
+ TidyTag_INS, /**< INS */
376
+ TidyTag_ISINDEX, /**< ISINDEX */
377
+ TidyTag_KBD, /**< KBD */
378
+ TidyTag_KEYGEN, /**< KEYGEN */
379
+ TidyTag_LABEL, /**< LABEL */
380
+ TidyTag_LAYER, /**< LAYER */
381
+ TidyTag_LEGEND, /**< LEGEND */
382
+ TidyTag_LI, /**< LI */
383
+ TidyTag_LINK, /**< LINK */
384
+ TidyTag_LISTING, /**< LISTING */
385
+ TidyTag_MAP, /**< MAP */
386
+ TidyTag_MARQUEE, /**< MARQUEE */
387
+ TidyTag_MENU, /**< MENU */
388
+ TidyTag_META, /**< META */
389
+ TidyTag_MULTICOL, /**< MULTICOL */
390
+ TidyTag_NOBR, /**< NOBR */
391
+ TidyTag_NOEMBED, /**< NOEMBED */
392
+ TidyTag_NOFRAMES, /**< NOFRAMES */
393
+ TidyTag_NOLAYER, /**< NOLAYER */
394
+ TidyTag_NOSAVE, /**< NOSAVE */
395
+ TidyTag_NOSCRIPT, /**< NOSCRIPT */
396
+ TidyTag_OBJECT, /**< OBJECT */
397
+ TidyTag_OL, /**< OL */
398
+ TidyTag_OPTGROUP, /**< OPTGROUP */
399
+ TidyTag_OPTION, /**< OPTION */
400
+ TidyTag_P, /**< P */
401
+ TidyTag_PARAM, /**< PARAM */
402
+ TidyTag_PLAINTEXT,/**< PLAINTEXT */
403
+ TidyTag_PRE, /**< PRE */
404
+ TidyTag_Q, /**< Q */
405
+ TidyTag_RB, /**< RB */
406
+ TidyTag_RBC, /**< RBC */
407
+ TidyTag_RP, /**< RP */
408
+ TidyTag_RT, /**< RT */
409
+ TidyTag_RTC, /**< RTC */
410
+ TidyTag_RUBY, /**< RUBY */
411
+ TidyTag_S, /**< S */
412
+ TidyTag_SAMP, /**< SAMP */
413
+ TidyTag_SCRIPT, /**< SCRIPT */
414
+ TidyTag_SELECT, /**< SELECT */
415
+ TidyTag_SERVER, /**< SERVER */
416
+ TidyTag_SERVLET, /**< SERVLET */
417
+ TidyTag_SMALL, /**< SMALL */
418
+ TidyTag_SPACER, /**< SPACER */
419
+ TidyTag_SPAN, /**< SPAN */
420
+ TidyTag_STRIKE, /**< STRIKE */
421
+ TidyTag_STRONG, /**< STRONG */
422
+ TidyTag_STYLE, /**< STYLE */
423
+ TidyTag_SUB, /**< SUB */
424
+ TidyTag_SUP, /**< SUP */
425
+ TidyTag_TABLE, /**< TABLE */
426
+ TidyTag_TBODY, /**< TBODY */
427
+ TidyTag_TD, /**< TD */
428
+ TidyTag_TEXTAREA, /**< TEXTAREA */
429
+ TidyTag_TFOOT, /**< TFOOT */
430
+ TidyTag_TH, /**< TH */
431
+ TidyTag_THEAD, /**< THEAD */
432
+ TidyTag_TITLE, /**< TITLE */
433
+ TidyTag_TR, /**< TR */
434
+ TidyTag_TT, /**< TT */
435
+ TidyTag_U, /**< U */
436
+ TidyTag_UL, /**< UL */
437
+ TidyTag_VAR, /**< VAR */
438
+ TidyTag_WBR, /**< WBR */
439
+ TidyTag_XMP, /**< XMP */
440
+ TidyTag_NEXTID, /**< NEXTID */
441
+
442
+ N_TIDY_TAGS /**< Must be last: its value equals the number of tag IDs above */
443
+ } TidyTagId;
444
+
445
+ /* Attribute interrogation
446
+ */
447
+
448
+ /** Known HTML attributes.
449
+ ** Values are implicit and sequential, starting at 0 with TidyAttr_UNKNOWN. */
450
+ typedef enum
451
+ {
452
+ TidyAttr_UNKNOWN, /**< UNKNOWN= */
453
+ TidyAttr_ABBR, /**< ABBR= */
454
+ TidyAttr_ACCEPT, /**< ACCEPT= */
455
+ TidyAttr_ACCEPT_CHARSET, /**< ACCEPT_CHARSET= */
456
+ TidyAttr_ACCESSKEY, /**< ACCESSKEY= */
457
+ TidyAttr_ACTION, /**< ACTION= */
458
+ TidyAttr_ADD_DATE, /**< ADD_DATE= */
459
+ TidyAttr_ALIGN, /**< ALIGN= */
460
+ TidyAttr_ALINK, /**< ALINK= */
461
+ TidyAttr_ALT, /**< ALT= */
462
+ TidyAttr_ARCHIVE, /**< ARCHIVE= */
463
+ TidyAttr_AXIS, /**< AXIS= */
464
+ TidyAttr_BACKGROUND, /**< BACKGROUND= */
465
+ TidyAttr_BGCOLOR, /**< BGCOLOR= */
466
+ TidyAttr_BGPROPERTIES, /**< BGPROPERTIES= */
467
+ TidyAttr_BORDER, /**< BORDER= */
468
+ TidyAttr_BORDERCOLOR, /**< BORDERCOLOR= */
469
+ TidyAttr_BOTTOMMARGIN, /**< BOTTOMMARGIN= */
470
+ TidyAttr_CELLPADDING, /**< CELLPADDING= */
471
+ TidyAttr_CELLSPACING, /**< CELLSPACING= */
472
+ TidyAttr_CHAR, /**< CHAR= */
473
+ TidyAttr_CHAROFF, /**< CHAROFF= */
474
+ TidyAttr_CHARSET, /**< CHARSET= */
475
+ TidyAttr_CHECKED, /**< CHECKED= */
476
+ TidyAttr_CITE, /**< CITE= */
477
+ TidyAttr_CLASS, /**< CLASS= */
478
+ TidyAttr_CLASSID, /**< CLASSID= */
479
+ TidyAttr_CLEAR, /**< CLEAR= */
480
+ TidyAttr_CODE, /**< CODE= */
481
+ TidyAttr_CODEBASE, /**< CODEBASE= */
482
+ TidyAttr_CODETYPE, /**< CODETYPE= */
483
+ TidyAttr_COLOR, /**< COLOR= */
484
+ TidyAttr_COLS, /**< COLS= */
485
+ TidyAttr_COLSPAN, /**< COLSPAN= */
486
+ TidyAttr_COMPACT, /**< COMPACT= */
487
+ TidyAttr_CONTENT, /**< CONTENT= */
488
+ TidyAttr_COORDS, /**< COORDS= */
489
+ TidyAttr_DATA, /**< DATA= */
490
+ TidyAttr_DATAFLD, /**< DATAFLD= */
491
+ TidyAttr_DATAFORMATAS, /**< DATAFORMATAS= */
492
+ TidyAttr_DATAPAGESIZE, /**< DATAPAGESIZE= */
493
+ TidyAttr_DATASRC, /**< DATASRC= */
494
+ TidyAttr_DATETIME, /**< DATETIME= */
495
+ TidyAttr_DECLARE, /**< DECLARE= */
496
+ TidyAttr_DEFER, /**< DEFER= */
497
+ TidyAttr_DIR, /**< DIR= */
498
+ TidyAttr_DISABLED, /**< DISABLED= */
499
+ TidyAttr_ENCODING, /**< ENCODING= */
500
+ TidyAttr_ENCTYPE, /**< ENCTYPE= */
501
+ TidyAttr_FACE, /**< FACE= */
502
+ TidyAttr_FOR, /**< FOR= */
503
+ TidyAttr_FRAME, /**< FRAME= */
504
+ TidyAttr_FRAMEBORDER, /**< FRAMEBORDER= */
505
+ TidyAttr_FRAMESPACING, /**< FRAMESPACING= */
506
+ TidyAttr_GRIDX, /**< GRIDX= */
507
+ TidyAttr_GRIDY, /**< GRIDY= */
508
+ TidyAttr_HEADERS, /**< HEADERS= */
509
+ TidyAttr_HEIGHT, /**< HEIGHT= */
510
+ TidyAttr_HREF, /**< HREF= */
511
+ TidyAttr_HREFLANG, /**< HREFLANG= */
512
+ TidyAttr_HSPACE, /**< HSPACE= */
513
+ TidyAttr_HTTP_EQUIV, /**< HTTP_EQUIV= */
514
+ TidyAttr_ID, /**< ID= */
515
+ TidyAttr_ISMAP, /**< ISMAP= */
516
+ TidyAttr_LABEL, /**< LABEL= */
517
+ TidyAttr_LANG, /**< LANG= */
518
+ TidyAttr_LANGUAGE, /**< LANGUAGE= */
519
+ TidyAttr_LAST_MODIFIED, /**< LAST_MODIFIED= */
520
+ TidyAttr_LAST_VISIT, /**< LAST_VISIT= */
521
+ TidyAttr_LEFTMARGIN, /**< LEFTMARGIN= */
522
+ TidyAttr_LINK, /**< LINK= */
523
+ TidyAttr_LONGDESC, /**< LONGDESC= */
524
+ TidyAttr_LOWSRC, /**< LOWSRC= */
525
+ TidyAttr_MARGINHEIGHT, /**< MARGINHEIGHT= */
526
+ TidyAttr_MARGINWIDTH, /**< MARGINWIDTH= */
527
+ TidyAttr_MAXLENGTH, /**< MAXLENGTH= */
528
+ TidyAttr_MEDIA, /**< MEDIA= */
529
+ TidyAttr_METHOD, /**< METHOD= */
530
+ TidyAttr_MULTIPLE, /**< MULTIPLE= */
531
+ TidyAttr_NAME, /**< NAME= */
532
+ TidyAttr_NOHREF, /**< NOHREF= */
533
+ TidyAttr_NORESIZE, /**< NORESIZE= */
534
+ TidyAttr_NOSHADE, /**< NOSHADE= */
535
+ TidyAttr_NOWRAP, /**< NOWRAP= */
536
+ TidyAttr_OBJECT, /**< OBJECT= */
537
+ TidyAttr_OnAFTERUPDATE, /**< OnAFTERUPDATE= */
538
+ TidyAttr_OnBEFOREUNLOAD, /**< OnBEFOREUNLOAD= */
539
+ TidyAttr_OnBEFOREUPDATE, /**< OnBEFOREUPDATE= */
540
+ TidyAttr_OnBLUR, /**< OnBLUR= */
541
+ TidyAttr_OnCHANGE, /**< OnCHANGE= */
542
+ TidyAttr_OnCLICK, /**< OnCLICK= */
543
+ TidyAttr_OnDATAAVAILABLE, /**< OnDATAAVAILABLE= */
544
+ TidyAttr_OnDATASETCHANGED, /**< OnDATASETCHANGED= */
545
+ TidyAttr_OnDATASETCOMPLETE, /**< OnDATASETCOMPLETE= */
546
+ TidyAttr_OnDBLCLICK, /**< OnDBLCLICK= */
547
+ TidyAttr_OnERRORUPDATE, /**< OnERRORUPDATE= */
548
+ TidyAttr_OnFOCUS, /**< OnFOCUS= */
549
+ TidyAttr_OnKEYDOWN, /**< OnKEYDOWN= */
550
+ TidyAttr_OnKEYPRESS, /**< OnKEYPRESS= */
551
+ TidyAttr_OnKEYUP, /**< OnKEYUP= */
552
+ TidyAttr_OnLOAD, /**< OnLOAD= */
553
+ TidyAttr_OnMOUSEDOWN, /**< OnMOUSEDOWN= */
554
+ TidyAttr_OnMOUSEMOVE, /**< OnMOUSEMOVE= */
555
+ TidyAttr_OnMOUSEOUT, /**< OnMOUSEOUT= */
556
+ TidyAttr_OnMOUSEOVER, /**< OnMOUSEOVER= */
557
+ TidyAttr_OnMOUSEUP, /**< OnMOUSEUP= */
558
+ TidyAttr_OnRESET, /**< OnRESET= */
559
+ TidyAttr_OnROWENTER, /**< OnROWENTER= */
560
+ TidyAttr_OnROWEXIT, /**< OnROWEXIT= */
561
+ TidyAttr_OnSELECT, /**< OnSELECT= */
562
+ TidyAttr_OnSUBMIT, /**< OnSUBMIT= */
563
+ TidyAttr_OnUNLOAD, /**< OnUNLOAD= */
564
+ TidyAttr_PROFILE, /**< PROFILE= */
565
+ TidyAttr_PROMPT, /**< PROMPT= */
566
+ TidyAttr_RBSPAN, /**< RBSPAN= */
567
+ TidyAttr_READONLY, /**< READONLY= */
568
+ TidyAttr_REL, /**< REL= */
569
+ TidyAttr_REV, /**< REV= */
570
+ TidyAttr_RIGHTMARGIN, /**< RIGHTMARGIN= */
571
+ TidyAttr_ROWS, /**< ROWS= */
572
+ TidyAttr_ROWSPAN, /**< ROWSPAN= */
573
+ TidyAttr_RULES, /**< RULES= */
574
+ TidyAttr_SCHEME, /**< SCHEME= */
575
+ TidyAttr_SCOPE, /**< SCOPE= */
576
+ TidyAttr_SCROLLING, /**< SCROLLING= */
577
+ TidyAttr_SELECTED, /**< SELECTED= */
578
+ TidyAttr_SHAPE, /**< SHAPE= */
579
+ TidyAttr_SHOWGRID, /**< SHOWGRID= */
580
+ TidyAttr_SHOWGRIDX, /**< SHOWGRIDX= */
581
+ TidyAttr_SHOWGRIDY, /**< SHOWGRIDY= */
582
+ TidyAttr_SIZE, /**< SIZE= */
583
+ TidyAttr_SPAN, /**< SPAN= */
584
+ TidyAttr_SRC, /**< SRC= */
585
+ TidyAttr_STANDBY, /**< STANDBY= */
586
+ TidyAttr_START, /**< START= */
587
+ TidyAttr_STYLE, /**< STYLE= */
588
+ TidyAttr_SUMMARY, /**< SUMMARY= */
589
+ TidyAttr_TABINDEX, /**< TABINDEX= */
590
+ TidyAttr_TARGET, /**< TARGET= */
591
+ TidyAttr_TEXT, /**< TEXT= */
592
+ TidyAttr_TITLE, /**< TITLE= */
593
+ TidyAttr_TOPMARGIN, /**< TOPMARGIN= */
594
+ TidyAttr_TYPE, /**< TYPE= */
595
+ TidyAttr_USEMAP, /**< USEMAP= */
596
+ TidyAttr_VALIGN, /**< VALIGN= */
597
+ TidyAttr_VALUE, /**< VALUE= */
598
+ TidyAttr_VALUETYPE, /**< VALUETYPE= */
599
+ TidyAttr_VERSION, /**< VERSION= */
600
+ TidyAttr_VLINK, /**< VLINK= */
601
+ TidyAttr_VSPACE, /**< VSPACE= */
602
+ TidyAttr_WIDTH, /**< WIDTH= */
603
+ TidyAttr_WRAP, /**< WRAP= */
604
+ TidyAttr_XML_LANG, /**< XML_LANG= */
605
+ TidyAttr_XML_SPACE, /**< XML_SPACE= */
606
+ TidyAttr_XMLNS, /**< XMLNS= */
607
+
608
+ TidyAttr_EVENT, /**< EVENT= */
609
+ TidyAttr_METHODS, /**< METHODS= */
610
+ TidyAttr_N, /**< N= */
611
+ TidyAttr_SDAFORM, /**< SDAFORM= */
612
+ TidyAttr_SDAPREF, /**< SDAPREF= */
613
+ TidyAttr_SDASUFF, /**< SDASUFF= */
614
+ TidyAttr_URN, /**< URN= */
615
+
616
+ N_TIDY_ATTRIBS /**< Must be last: its value equals the number of attribute IDs above */
617
+ } TidyAttrId;
618
+
619
+ #ifdef __cplusplus
620
+ } /* extern "C" */
621
+ #endif
622
+ #endif /* __TIDYENUM_H__ */