| 
<?php
 include('mappings' . DIRECTORY_SEPARATOR . 'CLF2.php');
 include('basic' . DIRECTORY_SEPARATOR . 'typical-mod.php');
 include('basic' . DIRECTORY_SEPARATOR . 'typical-rxp-mod.php');
 include('basic' . DIRECTORY_SEPARATOR . 'wingding.php');
 include('basic' . DIRECTORY_SEPARATOR . 'language.php');
 
 // Configuration returned to whichever script includes this file.
 return array(

     // Execution macro: the ordered list of methods to call. Every entry
     // "cleans" something; an entry may be listed as many times as wanted and
     // the order may be changed as needed. Entries that are commented out are
     // disabled and are kept here together with the reason.
     'macro' => array(

         //'tidy_code', // disabled at this position; listed again further down, where it is active

         // Steps named after the 'basic*' replacement settings defined below.
         'basictypical',
         'basictypicalrxp',
         'basicwingding',

         // DOM steps, listed between dom_init and dom_save.
         'dom_init',
         'DOM_clean_redundant_tags',
         'DOM_delete_empty_attributes',
         'DOM_alt_text',
         'DOM_non_breaking',
         'DOM_false_footnotes',
         'DOM_finish_footnotes',
         'dom_save',

         //'undoublyencodeentities', // possibly unnecessary now (2012-01-16); kept for insurance, which is low risk
         //                          // since no processed document has ever been about HTML character entities
         'post_dom', //'post_dom_stripme',

         'delete_empty_tags',

         //'mark_TOC',   // needs to be rethought
         'combine_inline', // had been disabled: brute-forcing proper nesting could take an extremely long time to run
         //'unmark_TOC', // needs to be rethought

         //'extra_space', // currently (2009-07-10) too aggressive for vanilla sweeper
         // Open question from the original author: do clean inline instead of some of these?
         'footnotes',
         //'heading_anchors',
         //'fix_inline', // risky, although never seen to be destructive; its orange message could also scare somebody
         'non_breaking',
         'dekern',
         'citation',

         'tidy_code',

         'basiclanguage',
         'remove_default_attributes',

     ),

     'non_breaking_type' => 'nbsp', // one of: nbsp, noWrap

     // DTD settings.
     'use_local_DTD' => true,
     'local_DTD'     => 'DTD' . DIRECTORY_SEPARATOR . 'xhtml1-strict.dtd',

     // Replacement tables; the variables are presumably populated by the
     // files included at the top of this file -- TODO confirm which file
     // defines which variable.
     'basictypical'        => $basicTypicalArray,
     'basictypicalrxp'     => $basicTypicalArrayRxp,
     'basicwingding'       => $basicwingding,
     'basicEnglishArray'   => $basicEnglishArray,
     'basicFrenchArray'    => $basicFrenchArray,
     'basicFrenchRxpArray' => $basicFrenchRxpArray,

     'CLF2_replace' => $CLF2Array,
     'CLF2_regex'   => $CLF2RxpArray,

     // Footnote anchor texts (French and English) and anchor names.
     'french_footnote_reference_anchor_text'  => 'Lien à la note ',
     'french_footnote_anchor_text'            => 'Lien à la référence de la note ',
     'english_footnote_reference_anchor_text' => 'Link to note ',
     'english_footnote_anchor_text'           => 'Link to note reference ',
     'footnote_anchor_name'                   => 'note',
     'footnote_reference_anchor_name'         => 'noteref',

     // Endnote anchor texts (French and English) and anchor names.
     // NOTE(review): the French endnote strings say "note de bas" whereas the
     // English ones say "endnote" -- confirm that this wording is intended.
     'french_endnote_reference_anchor_text'  => 'Lien à la note de bas ',
     'french_endnote_anchor_text'            => 'Lien à la référence de la note de bas ',
     'english_endnote_reference_anchor_text' => 'Link to endnote ',
     'english_endnote_anchor_text'           => 'Link to endnote reference ',
     'endnote_anchor_name'                   => 'nnote',
     'endnote_reference_anchor_name'         => 'nnoteref',

     // 'named' might be preferable, but DOM, which is currently (2015-06-09)
     // being used, doesn't like named entities.
     'character_entity_encoding_type' => 'hexadecimal',
 );
 
 ?>
 
 |