tidy-html5/src/clean.h

82 lines
2.9 KiB
C

#ifndef __CLEAN_H__
#define __CLEAN_H__
/* clean.h -- clean up misuse of presentation markup
(c) 1998-2006 (W3C) MIT, ERCIM, Keio University
See tidy.h for the copyright notice.
*/
TY_PRIVATE void TY_(FixNodeLinks)(Node *node);
TY_PRIVATE void TY_(FreeStyles)( TidyDocImpl* doc );
/* Add class="foo" to node
*/
TY_PRIVATE void TY_(AddStyleAsClass)( TidyDocImpl* doc, Node *node, ctmbstr stylevalue );
TY_PRIVATE void TY_(AddStyleProperty)(TidyDocImpl* doc, Node *node, ctmbstr property );
TY_PRIVATE void TY_(CleanDocument)( TidyDocImpl* doc );
/* simplifies <b><b> ... </b> ...</b> etc. */
TY_PRIVATE void TY_(NestedEmphasis)( TidyDocImpl* doc, Node* node );
/* replace i by em and b by strong */
TY_PRIVATE void TY_(EmFromI)( TidyDocImpl* doc, Node* node );
/*
Some people use dir or ul without an li
to indent the content. The pattern to
look for is a list with a single implicit
li. This is recursively replaced by an
implicit blockquote.
*/
TY_PRIVATE void TY_(List2BQ)( TidyDocImpl* doc, Node* node );
/*
Replace implicit blockquote by div with an indent
taking care to reduce nested blockquotes to a single
div with the indent set to match the nesting depth
*/
TY_PRIVATE void TY_(BQ2Div)( TidyDocImpl* doc, Node* node );
TY_PRIVATE void TY_(DropSections)( TidyDocImpl* doc, Node* node );
/*
This is a major clean up to strip out all the extra stuff you get
when you save as web page from Word 2000. It doesn't yet know what
to do with VML tags, but these will appear as errors unless you
declare them as new tags, such as o:p which needs to be declared
as inline.
*/
TY_PRIVATE void TY_(CleanWord2000)( TidyDocImpl* doc, Node *node);
TY_PRIVATE Bool TY_(IsWord2000)( TidyDocImpl* doc );
/* where appropriate move object elements from head to body */
TY_PRIVATE void TY_(BumpObject)( TidyDocImpl* doc, Node *html );
TY_PRIVATE Bool TY_(TidyMetaCharset)(TidyDocImpl* doc);
TY_PRIVATE void TY_(DropComments)(TidyDocImpl* doc, Node* node);
TY_PRIVATE void TY_(DropFontElements)(TidyDocImpl* doc, Node* node, Node **pnode);
TY_PRIVATE void TY_(WbrToSpace)(TidyDocImpl* doc, Node* node);
TY_PRIVATE void TY_(DowngradeTypography)(TidyDocImpl* doc, Node* node);
TY_PRIVATE void TY_(ReplacePreformattedSpaces)(TidyDocImpl* doc, Node* node);
TY_PRIVATE void TY_(NormalizeSpaces)(Lexer *lexer, Node *node);
TY_PRIVATE void TY_(ConvertCDATANodes)(TidyDocImpl* doc, Node* node);
TY_PRIVATE void TY_(FixAnchors)(TidyDocImpl* doc, Node *node, Bool wantName, Bool wantId);
TY_PRIVATE void TY_(FixXhtmlNamespace)(TidyDocImpl* doc, Bool wantXmlns);
TY_PRIVATE void TY_(FixLanguageInformation)(TidyDocImpl* doc, Node* node, Bool wantXmlLang, Bool wantLang);
/* Issue #567 - move style elements from body to head */
TY_PRIVATE void TY_(CleanStyle)(TidyDocImpl* doc, Node *html);
/* Issue #692 - discard multiple titles */
TY_PRIVATE void TY_(CleanHead)(TidyDocImpl* doc);
#endif /* __CLEAN_H__ */