<?php 
 
include('mappings' . DIRECTORY_SEPARATOR . 'CLF2.php'); 
include('basic' . DIRECTORY_SEPARATOR . 'typical-mod.php'); 
include('basic' . DIRECTORY_SEPARATOR . 'typical-rxp-mod.php'); 
include('basic' . DIRECTORY_SEPARATOR . 'wingding.php'); 
include('basic' . DIRECTORY_SEPARATOR . 'language.php'); 
 
return array(

    /*
     * Execution macro.
     *
     * Ordered list of the methods to call; each one "cleans" something.
     * A method may be listed as many times as wanted and the order may be
     * changed as needed. Entries that are commented out are disabled, and
     * the note beside each one records why.
     */
    'macro' => array(

        // 'tidy_code',

        'basictypical',
        'basictypicalrxp',
        'basicwingding',

        'dom_init',
        'DOM_clean_redundant_tags',
        'DOM_delete_empty_attributes',
        'DOM_alt_text',
        'DOM_non_breaking',
        'DOM_false_footnotes',
        'DOM_finish_footnotes',
        'dom_save',

        // 'undoublyencodeentities',
        //     Possibly unnecessary now (2012-01-16) but kept here for
        //     insurance; low risk since no document processed so far has
        //     been about HTML character entities.
        'post_dom',
        // 'post_dom_stripme',

        'delete_empty_tags',

        // 'mark_TOC',   // needs to be rethought
        'combine_inline',
        //     combine_inline was disabled in the past: it uses brute force
        //     to ensure proper nesting and could take an extremely long
        //     time to run.
        // 'unmark_TOC', // needs to be rethought

        // 'extra_space',
        //     Currently (2009-07-10) too aggressive for vanilla sweeper.
        // Open question: do clean inline instead of some of these?
        'footnotes',
        // 'heading_anchors',
        // 'fix_inline',
        //     Risky, although it has not been seen to be destructive; its
        //     orange message could also scare somebody.
        'non_breaking',
        'dekern',
        'citation',

        'tidy_code',

        'basiclanguage',
        'remove_default_attributes',

    ),

    // Accepted values: nbsp, noWrap.
    'non_breaking_type' => 'nbsp',

    // DTD settings: whether to use a local DTD, and its relative path.
    'use_local_DTD' => true,
    'local_DTD'     => 'DTD' . DIRECTORY_SEPARATOR . 'xhtml1-strict.dtd',

    // Replacement tables. The variables are not defined in this file;
    // presumably they come from the files included at the top (TODO confirm).
    'basictypical'        => $basicTypicalArray,
    'basictypicalrxp'     => $basicTypicalArrayRxp,
    'basicwingding'       => $basicwingding,
    'basicEnglishArray'   => $basicEnglishArray,
    'basicFrenchArray'    => $basicFrenchArray,
    'basicFrenchRxpArray' => $basicFrenchRxpArray,

    'CLF2_replace' => $CLF2Array,
    'CLF2_regex'   => $CLF2RxpArray,

    // Footnote anchor texts (French and English) and anchor names.
    'french_footnote_reference_anchor_text'  => 'Lien à la note ',
    'french_footnote_anchor_text'            => 'Lien à la référence de la note ',
    'english_footnote_reference_anchor_text' => 'Link to note ',
    'english_footnote_anchor_text'           => 'Link to note reference ',
    'footnote_anchor_name'                   => 'note',
    'footnote_reference_anchor_name'         => 'noteref',

    // Endnote anchor texts (French and English) and anchor names.
    'french_endnote_reference_anchor_text'  => 'Lien à la note de bas ',
    'french_endnote_anchor_text'            => 'Lien à la référence de la note de bas ',
    'english_endnote_reference_anchor_text' => 'Link to endnote ',
    'english_endnote_anchor_text'           => 'Link to endnote reference ',
    'endnote_anchor_name'                   => 'nnote',
    'endnote_reference_anchor_name'         => 'nnoteref',

    // 'named' might be preferable, but DOM, which is currently (2015-06-09)
    // being used, doesn't like named entities.
    'character_entity_encoding_type' => 'hexadecimal',
);
 
?> 
 
 |