A program to recognize and reward our most engaged community members
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner 5.0 process.
  Main flow, as wired by the connect elements below:
    Retrieve, Sample, Nominal to Binominal, Nominal to Numerical,
    Process Documents from Data, Store (3), Validation, apply on trainSet.
  Side branch: both preprocessing models are grouped and stored.
  Delivered results: result 1 = Validation performance, result 2 = data
  labelled by "apply on trainSet", result 3 = word list.
-->
<process version="5.0">
  <context>
    <input>
      <location/>
    </input>
    <output>
      <location/>
      <location/>
      <location/>
      <location/>
    </output>
    <macros/>
  </context>
  <operator activated="true" class="process" expanded="true" name="Process">
    <process expanded="true" height="586" width="683">

      <!-- Data loading and sampling. -->
      <operator activated="true" class="retrieve" expanded="true"
                height="60" name="Retrieve" width="90" x="45" y="30">
        <parameter key="repository_entry" value="D01 - ProcessedHotelCustomerSatisfaction_de"/>
      </operator>
      <operator activated="true" class="sample" expanded="true"
                height="76" name="Sample" width="90" x="179" y="30">
        <parameter key="sample_size" value="1000"/>
      </operator>

      <!-- Type conversion of the nominal attributes. -->
      <operator activated="true" class="nominal_to_binominal" expanded="true"
                height="94" name="Nominal to Binominal" width="90" x="313" y="30">
        <parameter key="attribute_filter_type" value="subset"/>
        <parameter key="attributes" value="customer_type|customer_group|customer_age"/>
      </operator>
      <!-- invert_selection is true: presumably every attribute EXCEPT the two
           listed text attributes is converted; confirm against operator docs. -->
      <operator activated="true" class="nominal_to_numerical" expanded="true"
                height="94" name="Nominal to Numerical" width="90" x="514" y="30">
        <parameter key="attribute_filter_type" value="subset"/>
        <parameter key="attributes" value="reasons_positive|reasons_negative"/>
        <parameter key="invert_selection" value="true"/>
      </operator>

      <!-- The two preprocessing models are grouped and stored in the repository. -->
      <operator activated="true" class="group_models" expanded="true"
                height="94" name="Group Models" width="90" x="514" y="165"/>
      <operator activated="true" class="store" expanded="true"
                height="60" name="Store" width="90" x="648" y="165">
        <parameter key="repository_entry" value="D02 - PreprocessingModels"/>
      </operator>

      <!-- Text processing of the reasons_negative / reasons_positive attributes.
           NOTE(review): the key "prunde_below_percent" is reproduced verbatim;
           presumably this is the extension's own spelling. Confirm before
           renaming it. -->
      <operator activated="true" class="text:process_document_from_data" expanded="true"
                height="76" name="Process Documents from Data" width="90" x="45" y="255">
        <parameter key="keep_text" value="true"/>
        <parameter key="prunde_below_percent" value="1.0"/>
        <parameter key="prune_above_percent" value="40.0"/>
        <parameter key="select_attributes_and_weights" value="true"/>
        <list key="specify_weights">
          <parameter key="reasons_negative" value="1.0"/>
          <parameter key="reasons_positive" value="1.0"/>
        </list>
        <!-- Per-document chain: Transform Cases, Tokenize, Stem (German). -->
        <process expanded="true" height="586" width="683">
          <operator activated="true" class="text:transform_cases" expanded="true"
                    height="60" name="Transform Cases" width="90" x="45" y="30"/>
          <operator activated="true" class="text:tokenize" expanded="true"
                    height="60" name="Tokenize" width="90" x="179" y="30"/>
          <operator activated="true" class="text:stem_german" expanded="true"
                    height="60" name="Stem (German)" width="90" x="313" y="30"/>
          <connect from_port="document" to_op="Transform Cases" to_port="document"/>
          <connect from_op="Transform Cases" from_port="document" to_op="Tokenize" to_port="document"/>
          <connect from_op="Tokenize" from_port="document" to_op="Stem (German)" to_port="document"/>
          <connect from_op="Stem (German)" from_port="document" to_port="document 1"/>
          <portSpacing port="source_document" spacing="0"/>
          <portSpacing port="sink_document 1" spacing="0"/>
          <portSpacing port="sink_document 2" spacing="0"/>
        </process>
      </operator>

      <!-- The resulting example set is stored, then passed through to Validation. -->
      <operator activated="true" class="store" expanded="true"
                height="60" name="Store (3)" width="90" x="45" y="390">
        <parameter key="repository_entry" value="D02 - WordVectorData"/>
      </operator>

      <!-- Cross-validation: the first subprocess trains an SVM, the second
           applies the model and measures regression performance. -->
      <operator activated="true" class="x_validation" expanded="true"
                height="112" name="Validation" width="90" x="313" y="300">
        <process expanded="true">
          <operator activated="true" class="support_vector_machine" expanded="true"
                    height="112" name="SVM" width="90" x="160" y="30">
            <parameter key="C" value="6.309573444801933E-4"/>
          </operator>
          <connect from_port="training" to_op="SVM" to_port="training set"/>
          <connect from_op="SVM" from_port="model" to_port="model"/>
          <portSpacing port="source_training" spacing="0"/>
          <portSpacing port="sink_model" spacing="0"/>
          <portSpacing port="sink_through 1" spacing="0"/>
        </process>
        <process expanded="true">
          <operator activated="true" class="apply_model" expanded="true"
                    height="76" name="Apply Model" width="90" x="45" y="30">
            <list key="application_parameters"/>
          </operator>
          <operator activated="true" class="performance_regression" expanded="true"
                    height="76" name="Performance" width="90" x="227" y="30">
            <parameter key="root_mean_squared_error" value="false"/>
            <parameter key="absolute_error" value="true"/>
            <parameter key="squared_error" value="true"/>
            <parameter key="correlation" value="true"/>
          </operator>
          <connect from_port="model" to_op="Apply Model" to_port="model"/>
          <connect from_port="test set" to_op="Apply Model" to_port="unlabelled data"/>
          <connect from_op="Apply Model" from_port="labelled data" to_op="Performance" to_port="labelled data"/>
          <connect from_op="Performance" from_port="performance" to_port="averagable 1"/>
          <portSpacing port="source_model" spacing="0"/>
          <portSpacing port="source_test set" spacing="0"/>
          <portSpacing port="source_through 1" spacing="0"/>
          <portSpacing port="sink_averagable 1" spacing="0"/>
          <portSpacing port="sink_averagable 2" spacing="0"/>
        </process>
      </operator>

      <!-- Applies Validation's model to the example set leaving Validation's
           "training" port. -->
      <operator activated="true" class="apply_model" expanded="true"
                height="76" name="apply on trainSet" width="90" x="514" y="300">
        <list key="application_parameters"/>
      </operator>

      <!-- Top-level wiring. -->
      <connect from_op="Retrieve" from_port="output" to_op="Sample" to_port="example set input"/>
      <connect from_op="Sample" from_port="example set output" to_op="Nominal to Binominal" to_port="example set input"/>
      <connect from_op="Nominal to Binominal" from_port="example set output" to_op="Nominal to Numerical" to_port="example set input"/>
      <connect from_op="Nominal to Binominal" from_port="preprocessing model" to_op="Group Models" to_port="models in 1"/>
      <connect from_op="Nominal to Numerical" from_port="example set output" to_op="Process Documents from Data" to_port="example set"/>
      <connect from_op="Nominal to Numerical" from_port="preprocessing model" to_op="Group Models" to_port="models in 2"/>
      <connect from_op="Group Models" from_port="model out" to_op="Store" to_port="input"/>
      <connect from_op="Process Documents from Data" from_port="example set" to_op="Store (3)" to_port="input"/>
      <connect from_op="Process Documents from Data" from_port="word list" to_port="result 3"/>
      <connect from_op="Store (3)" from_port="through" to_op="Validation" to_port="training"/>
      <connect from_op="Validation" from_port="model" to_op="apply on trainSet" to_port="model"/>
      <connect from_op="Validation" from_port="training" to_op="apply on trainSet" to_port="unlabelled data"/>
      <connect from_op="Validation" from_port="averagable 1" to_port="result 1"/>
      <connect from_op="apply on trainSet" from_port="labelled data" to_port="result 2"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
      <portSpacing port="sink_result 3" spacing="0"/>
      <portSpacing port="sink_result 4" spacing="0"/>
    </process>
  </operator>
</process>
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner 5.0 process.
  Flow: "Process Documents from Files" reads two labelled text directories
  ("atheism", "christian"), creates word vectors, and feeds the example set
  into "Validation", a cross-validation around a decision tree.

  Fix in this revision: the performance output of Validation ("averagable 1")
  is now connected to the process port "result 1". Before, no result port was
  connected, so the computed performance was never delivered.
-->
<process version="5.0">
  <context>
    <input>
      <location/>
    </input>
    <output>
      <location/>
      <!-- Entry for the spare result port that now exists because
           "result 1" is connected. -->
      <location/>
    </output>
    <macros/>
  </context>
  <operator activated="true" class="process" expanded="true" name="Process">
    <parameter key="logverbosity" value="3"/>
    <parameter key="random_seed" value="2001"/>
    <parameter key="send_mail" value="1"/>
    <parameter key="process_duration_for_mail" value="30"/>
    <parameter key="encoding" value="SYSTEM"/>
    <parameter key="parallelize_main_process" value="false"/>
    <process expanded="true" height="622" width="300">

      <!-- Document loading and word-vector creation.
           NOTE(review): the text_directories values are absolute paths on a
           Windows C: drive; they must exist on the executing machine.
           NOTE(review): the key "prunde_below_percent" is reproduced verbatim;
           presumably this is the extension's own spelling. Confirm before
           renaming it. -->
      <operator activated="true" class="text:process_document_from_file" expanded="true"
                height="76" name="Process Documents from Files" width="90" x="45" y="30">
        <list key="text_directories">
          <parameter key="atheism" value="C:\temp\temp\tests\wvtool-1.1\wvtool-1.1\examples\data\alt.atheism"/>
          <parameter key="christian" value="C:\temp\temp\tests\wvtool-1.1\wvtool-1.1\examples\data\soc.religion.christian"/>
        </list>
        <parameter key="file_pattern" value="*"/>
        <parameter key="extract_text_only" value="true"/>
        <parameter key="use_file_extension_as_type" value="true"/>
        <parameter key="content_type" value="0"/>
        <parameter key="encoding" value="SYSTEM"/>
        <parameter key="create_word_vector" value="true"/>
        <parameter key="vector_creation" value="0"/>
        <parameter key="add_meta_information" value="true"/>
        <parameter key="keep_text" value="false"/>
        <parameter key="prune_method" value="0"/>
        <parameter key="prunde_below_percent" value="3.0"/>
        <parameter key="prune_above_percent" value="30.0"/>
        <parameter key="prune_below_rank" value="5.0"/>
        <parameter key="prune_above_rank" value="5.0"/>
        <parameter key="datamanagement" value="7"/>
        <parameter key="parallelize_vector_creation" value="false"/>
        <!-- Per-document chain: Tokenize, Transform Cases,
             Filter Stopwords (English), Stem (Porter). -->
        <process expanded="true" height="622" width="570">
          <operator activated="true" class="text:tokenize" expanded="true"
                    height="60" name="Tokenize" width="90" x="45" y="30">
            <parameter key="mode" value="0"/>
            <parameter key="characters" value=".:"/>
          </operator>
          <operator activated="true" class="text:transform_cases" expanded="true"
                    height="60" name="Transform Cases" width="90" x="180" y="30">
            <parameter key="transform_to" value="0"/>
          </operator>
          <operator activated="true" class="text:filter_stopwords_english" expanded="true"
                    height="60" name="Filter Stopwords (English)" width="90" x="315" y="30"/>
          <operator activated="true" class="text:stem_porter" expanded="true"
                    height="60" name="Stem (Porter)" width="90" x="450" y="30"/>
          <connect from_port="document" to_op="Tokenize" to_port="document"/>
          <connect from_op="Tokenize" from_port="document" to_op="Transform Cases" to_port="document"/>
          <connect from_op="Transform Cases" from_port="document" to_op="Filter Stopwords (English)" to_port="document"/>
          <connect from_op="Filter Stopwords (English)" from_port="document" to_op="Stem (Porter)" to_port="document"/>
          <connect from_op="Stem (Porter)" from_port="document" to_port="document 1"/>
          <portSpacing port="source_document" spacing="36"/>
          <portSpacing port="sink_document 1" spacing="0"/>
          <portSpacing port="sink_document 2" spacing="0"/>
        </process>
      </operator>

      <!-- Cross-validation with number_of_validations = 10. The first
           subprocess trains the decision tree, the second applies the model
           and measures performance. -->
      <operator activated="true" class="x_validation" expanded="true"
                height="112" name="Validation" width="90" x="180" y="30">
        <description>A cross-validation evaluating a decision tree model.</description>
        <parameter key="create_complete_model" value="false"/>
        <parameter key="average_performances_only" value="true"/>
        <parameter key="leave_one_out" value="false"/>
        <parameter key="number_of_validations" value="10"/>
        <parameter key="sampling_type" value="2"/>
        <parameter key="use_local_random_seed" value="false"/>
        <parameter key="local_random_seed" value="1992"/>
        <parameter key="parallelize_training" value="false"/>
        <parameter key="parallelize_testing" value="false"/>
        <process expanded="true" height="654" width="466">
          <operator activated="true" class="decision_tree" expanded="true"
                    height="76" name="Decision Tree" width="90" x="45" y="30">
            <parameter key="criterion" value="gain_ratio"/>
            <parameter key="minimal_size_for_split" value="4"/>
            <parameter key="minimal_leaf_size" value="2"/>
            <parameter key="minimal_gain" value="0.1"/>
            <parameter key="maximal_depth" value="20"/>
            <parameter key="confidence" value="0.25"/>
            <parameter key="number_of_prepruning_alternatives" value="3"/>
            <parameter key="no_pre_pruning" value="false"/>
            <parameter key="no_pruning" value="false"/>
          </operator>
          <connect from_port="training" to_op="Decision Tree" to_port="training set"/>
          <connect from_op="Decision Tree" from_port="model" to_port="model"/>
          <portSpacing port="source_training" spacing="0"/>
          <portSpacing port="sink_model" spacing="0"/>
          <portSpacing port="sink_through 1" spacing="0"/>
        </process>
        <process expanded="true" height="654" width="466">
          <operator activated="true" class="apply_model" expanded="true"
                    height="76" name="Apply Model" width="90" x="45" y="30">
            <list key="application_parameters"/>
            <parameter key="create_view" value="false"/>
          </operator>
          <operator activated="true" class="performance" expanded="true"
                    height="76" name="Performance" width="90" x="179" y="30">
            <parameter key="use_example_weights" value="true"/>
          </operator>
          <connect from_port="model" to_op="Apply Model" to_port="model"/>
          <connect from_port="test set" to_op="Apply Model" to_port="unlabelled data"/>
          <connect from_op="Apply Model" from_port="labelled data" to_op="Performance" to_port="labelled data"/>
          <connect from_op="Performance" from_port="performance" to_port="averagable 1"/>
          <portSpacing port="source_model" spacing="0"/>
          <portSpacing port="source_test set" spacing="0"/>
          <portSpacing port="source_through 1" spacing="0"/>
          <portSpacing port="sink_averagable 1" spacing="0"/>
          <portSpacing port="sink_averagable 2" spacing="0"/>
        </process>
      </operator>

      <!-- Top-level wiring. -->
      <connect from_op="Process Documents from Files" from_port="example set" to_op="Validation" to_port="training"/>
      <!-- Deliver the cross-validation performance as the process result. -->
      <connect from_op="Validation" from_port="averagable 1" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>