Hello,
I attached a simple model for better understanding (please see below):
In the model I create a simple sine curve with some noise as input for 2 sub-models: one reduces the example set using a sample bootstrap + remove duplicates operator, the other using a sample operator (ratio set to 0.6). Each sub-model then forwards its subset as input to a WEKA Multilayer Perceptron. As far as I understand the function of these operators, the results should be nearly the same. However, comparing both result sets in the plot view window (x-axis = att1, y-axis = prediction(label)), I notice a difference between the output of the sample-model and that of the bootstrap-model: while I can distinguish several separate sine curves in the bootstrap-model, I do not see the same (or anything similar) in the sample-model. It's less dense. I was expecting the same behaviour ...
Would you please be so kind as to give me a hint about what's wrong (either the model or my thinking)?
Thanks and best Regards
VD
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<process version="5.0">
<!-- Process context: the input, output and macros sections are all empty in this process. -->
<context>
<input/>
<output/>
<macros/>
</context>
<operator activated="true" class="process" expanded="true" name="Process">
<process expanded="true" height="386" width="685">
<!-- Generate Data: produces the synthetic example set used by the whole process.
     Target function is "simple sinus" with a single attribute whose bounds are -3.0 and 3.0.
     No other parameter is set here, so everything else is presumably left at the operator's
     defaults (confirm in RapidMiner). -->
<operator activated="true" class="generate_data" expanded="true" height="60" name="Generate Data" width="90" x="45" y="30">
<parameter key="target_function" value="simple sinus"/>
<parameter key="number_of_attributes" value="1"/>
<parameter key="attributes_lower_bound" value="-3.0"/>
<parameter key="attributes_upper_bound" value="3.0"/>
</operator>
<!-- Add Noise: receives the output of Generate Data (see the connect elements near the end
     of the process). The "noise" list is empty and no other parameter is set, so the actual
     noise settings are not visible in this file (presumably operator defaults; confirm). -->
<operator activated="true" class="add_noise" expanded="true" height="94" name="Add Noise" width="90" x="45" y="255">
<list key="noise"/>
</operator>
<!-- Multiply: fans the noisy example set out on two ports; "output 1" is wired to Loop and
     "output 2" to Loop (2), so both loops are fed from the same upstream example set. -->
<operator activated="true" class="multiply" expanded="true" height="94" name="Multiply" width="90" x="179" y="165"/>
<!-- Loop (bootstrap variant): runs the inner process 5 times.
     Each iteration chains Sample (2) (bootstrapping, use_weights=false), Remove Duplicates,
     W-MultilayerPerceptron and Apply Model; the labelled data from Apply Model leaves the
     inner process through "output 1". -->
<operator activated="true" class="loop" expanded="true" height="76" name="Loop" width="90" x="313" y="75">
<parameter key="iterations" value="5"/>
<process expanded="true" height="575" width="709">
<operator activated="true" class="sample_bootstrapping" expanded="true" height="76" name="Sample (2)" width="90" x="45" y="30">
<parameter key="use_weights" value="false"/>
</operator>
<operator activated="true" class="remove_duplicates" expanded="true" height="76" name="Remove Duplicates" width="90" x="179" y="30"/>
<operator activated="true" class="weka:W-MultilayerPerceptron" expanded="true" height="76" name="W-MultilayerPerceptron" width="90" x="313" y="30">
<!-- N and H are handed to the Weka learner; presumably they map to Weka's training-epochs
     and hidden-layer options. TODO confirm against the Weka MultilayerPerceptron docs. -->
<parameter key="N" value="5000.0"/>
<parameter key="H" value="5"/>
</operator>
<operator activated="true" class="apply_model" expanded="true" height="76" name="Apply Model" width="90" x="469" y="30">
<list key="application_parameters"/>
</operator>
<connect from_port="input 1" to_op="Sample (2)" to_port="example set input"/>
<connect from_op="Sample (2)" from_port="example set output" to_op="Remove Duplicates" to_port="example set input"/>
<connect from_op="Remove Duplicates" from_port="example set output" to_op="W-MultilayerPerceptron" to_port="training set"/>
<connect from_op="W-MultilayerPerceptron" from_port="model" to_op="Apply Model" to_port="model"/>
<!-- The model is applied to the learner's own "exampleSet" port rather than to a separate
     data source. NOTE(review): this looks like the de-duplicated bootstrap sample that was
     used for training, not the full input set; confirm this is intended. -->
<connect from_op="W-MultilayerPerceptron" from_port="exampleSet" to_op="Apply Model" to_port="unlabelled data"/>
<connect from_op="Apply Model" from_port="labelled data" to_port="output 1"/>
<portSpacing port="source_input 1" spacing="0"/>
<portSpacing port="source_input 2" spacing="0"/>
<portSpacing port="sink_output 1" spacing="0"/>
<portSpacing port="sink_output 2" spacing="0"/>
</process>
</operator>
<!-- Append: takes what Loop delivers on "output 1" at its "example set 1" port; its
     "merged set" port is wired to the process result "result 1". -->
<operator activated="true" class="append" expanded="true" height="76" name="Append" width="90" x="447" y="75"/>
<!-- Loop (2) (plain sampling variant): runs the inner process 5 times.
     Each iteration chains Sample (relative sampling, sample_ratio=0.6),
     W-MultilayerPerceptron (2) and Apply Model (2); the labelled data from Apply Model (2)
     leaves the inner process through "output 1". Unlike the other loop there is no
     Remove Duplicates step here. -->
<operator activated="true" class="loop" expanded="true" height="76" name="Loop (2)" width="90" x="313" y="255">
<parameter key="iterations" value="5"/>
<process expanded="true" height="575" width="709">
<operator activated="true" class="sample" expanded="true" height="76" name="Sample" width="90" x="112" y="30">
<parameter key="sample" value="relative"/>
<parameter key="sample_ratio" value="0.6"/>
</operator>
<operator activated="true" class="weka:W-MultilayerPerceptron" expanded="true" height="76" name="W-MultilayerPerceptron (2)" width="90" x="315" y="30">
<!-- Same N and H values as the learner in the bootstrap loop; presumably Weka's
     training-epochs and hidden-layer options. TODO confirm against the Weka docs. -->
<parameter key="N" value="5000.0"/>
<parameter key="H" value="5"/>
</operator>
<operator activated="true" class="apply_model" expanded="true" height="76" name="Apply Model (2)" width="90" x="512" y="30">
<list key="application_parameters"/>
</operator>
<connect from_port="input 1" to_op="Sample" to_port="example set input"/>
<connect from_op="Sample" from_port="example set output" to_op="W-MultilayerPerceptron (2)" to_port="training set"/>
<connect from_op="W-MultilayerPerceptron (2)" from_port="model" to_op="Apply Model (2)" to_port="model"/>
<!-- The model is applied to the learner's own "exampleSet" port rather than to a separate
     data source. NOTE(review): this looks like the 60% sample that was used for training,
     not the full input set; confirm this is intended. -->
<connect from_op="W-MultilayerPerceptron (2)" from_port="exampleSet" to_op="Apply Model (2)" to_port="unlabelled data"/>
<connect from_op="Apply Model (2)" from_port="labelled data" to_port="output 1"/>
<portSpacing port="source_input 1" spacing="0"/>
<portSpacing port="source_input 2" spacing="0"/>
<portSpacing port="sink_output 1" spacing="0"/>
<portSpacing port="sink_output 2" spacing="0"/>
</process>
</operator>
<!-- Append (2): takes what Loop (2) delivers on "output 1" at its "example set 1" port; its
     "merged set" port is wired to the process result "result 2". -->
<operator activated="true" class="append" expanded="true" height="76" name="Append (2)" width="90" x="447" y="255"/>
<!-- Top-level wiring of the process:
     Generate Data feeds Add Noise, which feeds Multiply.
     Multiply "output 1" goes to Loop, then Append, then "result 1" (bootstrap variant).
     Multiply "output 2" goes to Loop (2), then Append (2), then "result 2" (sampling variant).
     The portSpacing entries all carry spacing 0 (presumably GUI layout data only; confirm). -->
<connect from_op="Generate Data" from_port="output" to_op="Add Noise" to_port="example set input"/>
<connect from_op="Add Noise" from_port="example set output" to_op="Multiply" to_port="input"/>
<connect from_op="Multiply" from_port="output 1" to_op="Loop" to_port="input 1"/>
<connect from_op="Multiply" from_port="output 2" to_op="Loop (2)" to_port="input 1"/>
<connect from_op="Loop" from_port="output 1" to_op="Append" to_port="example set 1"/>
<connect from_op="Append" from_port="merged set" to_port="result 1"/>
<connect from_op="Loop (2)" from_port="output 1" to_op="Append (2)" to_port="example set 1"/>
<connect from_op="Append (2)" from_port="merged set" to_port="result 2"/>
<portSpacing port="source_input 1" spacing="0"/>
<portSpacing port="sink_result 1" spacing="0"/>
<portSpacing port="sink_result 2" spacing="0"/>
<portSpacing port="sink_result 3" spacing="0"/>
</process>
</operator>
</process>