A program to recognize and reward our most engaged community members
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process: product similarity via Cross Distances.
  Steps, in execution order:
    1. Retrieve the repository entry t123_product.
    2. Split Data with a single partition ratio of 0.05; only "partition 1" is used.
    3. Keep the attributes langtext, artid and bezeichnung_3.
    4. Give artid the id role.
    5. Cross Distances with nominal measures, similarities instead of distances,
       top-k results only. The request set is the Set Role output; the reference
       set is taken from the "original" port of Set Role.
-->
<process version="7.0.001">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="7.0.001" expanded="true" name="Process">
    <process expanded="true">
      <operator activated="true" class="retrieve" compatibility="7.0.001" expanded="true"
                height="68" name="Retrieve t123_product" width="90" x="45" y="85">
        <parameter key="repository_entry" value="//Local Repository/data/t123_product"/>
      </operator>
      <operator activated="true" class="split_data" compatibility="7.0.001" expanded="true"
                height="82" name="Split Data" width="90" x="112" y="187">
        <enumeration key="partitions">
          <parameter key="ratio" value="0.05"/>
        </enumeration>
      </operator>
      <operator activated="true" class="select_attributes" compatibility="7.0.001" expanded="true"
                height="82" name="Select Attributes" width="90" x="313" y="85">
        <parameter key="attribute_filter_type" value="subset"/>
        <parameter key="attributes" value="langtext|artid|bezeichnung_3"/>
      </operator>
      <operator activated="true" class="set_role" compatibility="7.0.001" expanded="true"
                height="82" name="Set Role" width="90" x="514" y="85">
        <parameter key="attribute_name" value="artid"/>
        <parameter key="target_role" value="id"/>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="cross_distances" compatibility="7.0.001" expanded="true"
                height="103" name="Cross Distances" width="90" x="715" y="85">
        <parameter key="measure_types" value="NominalMeasures"/>
        <parameter key="only_top_k" value="true"/>
        <parameter key="compute_similarities" value="true"/>
      </operator>
      <connect from_op="Retrieve t123_product" from_port="output"
               to_op="Split Data" to_port="example set"/>
      <connect from_op="Split Data" from_port="partition 1"
               to_op="Select Attributes" to_port="example set input"/>
      <connect from_op="Select Attributes" from_port="example set output"
               to_op="Set Role" to_port="example set input"/>
      <connect from_op="Set Role" from_port="example set output"
               to_op="Cross Distances" to_port="request set"/>
      <connect from_op="Set Role" from_port="original"
               to_op="Cross Distances" to_port="reference set"/>
      <connect from_op="Cross Distances" from_port="result set" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process: pairwise similarity matrix for products.
  Steps, in execution order:
    1. Retrieve the repository entry t123_product.
    2. Split Data with a single partition ratio of 0.05; only "partition 1" is used.
    3. Keep the attributes langtext, artid and bezeichnung_3.
    4. Give artid the id role.
    5. Data to Similarity with nominal measures.
    6. Similarity to Data with table_type "matrix"; its example set is result 1.

  Fix: the from_op value "Select Attributes" on the connection into Set Role
  was broken across a line wrap. A line break inside an attribute value is
  turned into an extra space by the parser, so the value no longer equalled
  the operator name. It is written on one line again.
-->
<process version="7.0.001">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="7.0.001" expanded="true" name="Process">
    <process expanded="true">
      <operator activated="true" class="retrieve" compatibility="7.0.001" expanded="true"
                height="68" name="Retrieve t123_product" width="90" x="45" y="85">
        <parameter key="repository_entry" value="//Local Repository/data/t123_product"/>
      </operator>
      <operator activated="true" class="split_data" compatibility="7.0.001" expanded="true"
                height="82" name="Split Data" width="90" x="112" y="187">
        <enumeration key="partitions">
          <parameter key="ratio" value="0.05"/>
        </enumeration>
      </operator>
      <operator activated="true" class="select_attributes" compatibility="7.0.001" expanded="true"
                height="82" name="Select Attributes" width="90" x="313" y="85">
        <parameter key="attribute_filter_type" value="subset"/>
        <parameter key="attributes" value="langtext|artid|bezeichnung_3"/>
      </operator>
      <operator activated="true" class="set_role" compatibility="7.0.001" expanded="true"
                height="82" name="Set Role" width="90" x="514" y="85">
        <parameter key="attribute_name" value="artid"/>
        <parameter key="target_role" value="id"/>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="data_to_similarity" compatibility="7.0.001" expanded="true"
                height="82" name="Data to Similarity" width="90" x="648" y="85">
        <parameter key="measure_types" value="NominalMeasures"/>
      </operator>
      <operator activated="true" class="similarity_to_data" compatibility="7.0.001" expanded="true"
                height="82" name="Similarity to Data" width="90" x="782" y="85">
        <parameter key="table_type" value="matrix"/>
      </operator>
      <connect from_op="Retrieve t123_product" from_port="output"
               to_op="Split Data" to_port="example set"/>
      <connect from_op="Split Data" from_port="partition 1"
               to_op="Select Attributes" to_port="example set input"/>
      <connect from_op="Select Attributes" from_port="example set output"
               to_op="Set Role" to_port="example set input"/>
      <connect from_op="Set Role" from_port="example set output"
               to_op="Data to Similarity" to_port="example set"/>
      <connect from_op="Data to Similarity" from_port="similarity"
               to_op="Similarity to Data" to_port="similarity"/>
      <connect from_op="Data to Similarity" from_port="example set"
               to_op="Similarity to Data" to_port="exampleSet"/>
      <connect from_op="Similarity to Data" from_port="exampleSet" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>
You should be able to do it on your computer, but I think there is a major mistake in your process: you apply a distance measure to "langtext", which is nominal, so RM uses a nominal distance. A nominal distance only checks whether two nominal values are identical, so you can think of it as comparing two strings for equality. In other words, to get distance = 0 you would need two identical text descriptions. What you should do instead is use the Text Mining extension to convert the text descriptions into numerical values; then you can run the Cross Distances operator with an appropriate numerical distance measure. You can also set top k to 3 to get the 3 most similar products.
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process: Cross Distances on numerically encoded attributes.
  Steps, in wiring order:
    1. Retrieve the repository entry t123_product.
    2. Split Data with a single partition ratio of 0.05; only "partition 1" is used.
    3. Nominal to Numerical on the subset bezeichnung_3 and langtext.
    4. Select Attributes with no parameters set in this export.
    5. Give artid the id role.
    6. Cross Distances with numerical measures, top-k only, k = 5. The request
       set is the Set Role output; the reference set is taken from the
       "original" port of Set Role.
-->
<process version="7.0.001">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="7.0.001" expanded="true" name="Process">
    <process expanded="true">
      <operator activated="true" class="retrieve" compatibility="7.0.001" expanded="true"
                height="68" name="Retrieve t123_product" width="90" x="45" y="85">
        <parameter key="repository_entry" value="//Local Repository/data/t123_product"/>
      </operator>
      <operator activated="true" class="split_data" compatibility="7.0.001" expanded="true"
                height="82" name="Split Data" width="90" x="112" y="289">
        <enumeration key="partitions">
          <parameter key="ratio" value="0.05"/>
        </enumeration>
      </operator>
      <operator activated="true" class="nominal_to_numerical" compatibility="7.0.001" expanded="true"
                height="103" name="Nominal to Numerical" width="90" x="380" y="187">
        <parameter key="attribute_filter_type" value="subset"/>
        <parameter key="attributes" value="bezeichnung_3|langtext"/>
        <list key="comparison_groups"/>
      </operator>
      <operator activated="true" class="select_attributes" compatibility="7.0.001" expanded="true"
                height="82" name="Select Attributes" width="90" x="313" y="34"/>
      <operator activated="true" class="set_role" compatibility="7.0.001" expanded="true"
                height="82" name="Set Role" width="90" x="514" y="34">
        <parameter key="attribute_name" value="artid"/>
        <parameter key="target_role" value="id"/>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="cross_distances" compatibility="7.0.001" expanded="true"
                height="103" name="Cross Distances" width="90" x="715" y="85">
        <parameter key="measure_types" value="NumericalMeasures"/>
        <parameter key="only_top_k" value="true"/>
        <parameter key="k" value="5"/>
      </operator>
      <connect from_op="Retrieve t123_product" from_port="output"
               to_op="Split Data" to_port="example set"/>
      <connect from_op="Split Data" from_port="partition 1"
               to_op="Nominal to Numerical" to_port="example set input"/>
      <connect from_op="Nominal to Numerical" from_port="example set output"
               to_op="Select Attributes" to_port="example set input"/>
      <connect from_op="Select Attributes" from_port="example set output"
               to_op="Set Role" to_port="example set input"/>
      <connect from_op="Set Role" from_port="example set output"
               to_op="Cross Distances" to_port="request set"/>
      <connect from_op="Set Role" from_port="original"
               to_op="Cross Distances" to_port="reference set"/>
      <connect from_op="Cross Distances" from_port="result set" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process: top-5 most similar product descriptions by cosine
  similarity on word vectors.
  Steps, in wiring order:
    1. Retrieve t123_product_import_23032016 and keep sku and description.
    2. Split Data with ratios 0.01 / 0.99; only "partition 1" is used.
    3. Nominal to Text, then Process Documents from Data
       (Tokenize, Transform Cases, Filter Stopwords (German)).
    4. Multiply duplicates the vectorized example set.
    5. Cross Distances (numerical measures, CosineSimilarity, top-k only, k = 5)
       receives one copy as request set and the other as reference set.

  Fix: the reference set used to come from the "original" port of
  Nominal to Text, i.e. the raw sku/description data without word-vector
  attributes, while the request set was the vectorized output. The two sets
  therefore did not share the numerical attributes the cosine measure works
  on. Both ports are now fed from the same vectorized set via Multiply.
  Cross Distances moved right (x = 648) to make room for Multiply.
-->
<process version="7.0.001">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="7.0.001" expanded="true" name="Process">
    <process expanded="true">
      <operator activated="true" class="retrieve" compatibility="7.0.001" expanded="true"
                height="68" name="Retrieve t123_product_import_23032016" width="90" x="45" y="34">
        <parameter key="repository_entry" value="//tech123_win/t123_product_import_23032016"/>
      </operator>
      <operator activated="true" class="select_attributes" compatibility="7.0.001" expanded="true"
                height="82" name="Select Attributes" width="90" x="179" y="34">
        <parameter key="attribute_filter_type" value="subset"/>
        <parameter key="attribute" value="description"/>
        <parameter key="attributes" value="sku|description"/>
      </operator>
      <operator activated="true" class="split_data" compatibility="7.0.001" expanded="true"
                height="82" name="Split Data" width="90" x="313" y="34">
        <enumeration key="partitions">
          <parameter key="ratio" value="0.01"/>
          <parameter key="ratio" value="0.99"/>
        </enumeration>
      </operator>
      <operator activated="true" class="nominal_to_text" compatibility="7.0.001" expanded="true"
                height="82" name="Nominal to Text" width="90" x="313" y="136"/>
      <operator activated="true" class="text:process_document_from_data" compatibility="7.0.000" expanded="true"
                height="82" name="Process Documents from Data" width="90" x="246" y="289">
        <parameter key="add_meta_information" value="false"/>
        <parameter key="keep_text" value="true"/>
        <parameter key="prune_below_absolute" value="2"/>
        <parameter key="prune_above_absolute" value="9999"/>
        <list key="specify_weights"/>
        <process expanded="true">
          <operator activated="true" class="text:tokenize" compatibility="7.0.000" expanded="true"
                    height="68" name="Tokenize" width="90" x="112" y="85"/>
          <operator activated="true" class="text:transform_cases" compatibility="7.0.000" expanded="true"
                    height="68" name="Transform Cases" width="90" x="246" y="85"/>
          <operator activated="true" class="text:filter_stopwords_german" compatibility="7.0.000" expanded="true"
                    height="68" name="Filter Stopwords (German)" width="90" x="380" y="85"/>
          <connect from_port="document" to_op="Tokenize" to_port="document"/>
          <connect from_op="Tokenize" from_port="document"
                   to_op="Transform Cases" to_port="document"/>
          <connect from_op="Transform Cases" from_port="document"
                   to_op="Filter Stopwords (German)" to_port="document"/>
          <connect from_op="Filter Stopwords (German)" from_port="document" to_port="document 1"/>
          <portSpacing port="source_document" spacing="0"/>
          <portSpacing port="sink_document 1" spacing="0"/>
          <portSpacing port="sink_document 2" spacing="0"/>
        </process>
      </operator>
      <operator activated="true" class="multiply" compatibility="7.0.001" expanded="true"
                height="103" name="Multiply" width="90" x="447" y="289"/>
      <operator activated="true" class="cross_distances" compatibility="7.0.001" expanded="true"
                height="103" name="Cross Distances" width="90" x="648" y="289">
        <parameter key="measure_types" value="NumericalMeasures"/>
        <parameter key="numerical_measure" value="CosineSimilarity"/>
        <parameter key="only_top_k" value="true"/>
        <parameter key="k" value="5"/>
      </operator>
      <connect from_op="Retrieve t123_product_import_23032016" from_port="output"
               to_op="Select Attributes" to_port="example set input"/>
      <connect from_op="Select Attributes" from_port="example set output"
               to_op="Split Data" to_port="example set"/>
      <connect from_op="Split Data" from_port="partition 1"
               to_op="Nominal to Text" to_port="example set input"/>
      <connect from_op="Nominal to Text" from_port="example set output"
               to_op="Process Documents from Data" to_port="example set"/>
      <connect from_op="Process Documents from Data" from_port="example set"
               to_op="Multiply" to_port="input"/>
      <connect from_op="Multiply" from_port="output 1"
               to_op="Cross Distances" to_port="request set"/>
      <connect from_op="Multiply" from_port="output 2"
               to_op="Cross Distances" to_port="reference set"/>
      <connect from_op="Cross Distances" from_port="result set" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process: cosine similarity between product descriptions.
  Steps, in wiring order:
    1. Retrieve t123_product_import_23032016 and keep sku and description.
    2. Split Data with ratios 0.001 / 0.999; only "partition 1" is used.
    3. Nominal to Text, then Process Documents from Data
       (Tokenize, Transform Cases, Filter Stopwords (German)).
    4. Data to Similarity with numerical measures and CosineSimilarity.
  Outputs: the similarity object is result 1, the example set is result 2.
-->
<process version="7.0.001">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="7.0.001" expanded="true" name="Process">
    <process expanded="true">
      <operator activated="true" class="retrieve" compatibility="7.0.001" expanded="true"
                height="68" name="Retrieve t123_product_import_23032016" width="90" x="45" y="34">
        <parameter key="repository_entry" value="//tech123_win/t123_product_import_23032016"/>
      </operator>
      <operator activated="true" class="select_attributes" compatibility="7.0.001" expanded="true"
                height="82" name="Select Attributes" width="90" x="179" y="34">
        <parameter key="attribute_filter_type" value="subset"/>
        <parameter key="attribute" value="description"/>
        <parameter key="attributes" value="sku|description"/>
      </operator>
      <operator activated="true" class="split_data" compatibility="7.0.001" expanded="true"
                height="82" name="Split Data" width="90" x="313" y="34">
        <enumeration key="partitions">
          <parameter key="ratio" value="0.001"/>
          <parameter key="ratio" value="0.999"/>
        </enumeration>
      </operator>
      <operator activated="true" class="nominal_to_text" compatibility="7.0.001" expanded="true"
                height="82" name="Nominal to Text" width="90" x="313" y="136"/>
      <operator activated="true" class="text:process_document_from_data" compatibility="7.0.000" expanded="true"
                height="82" name="Process Documents from Data" width="90" x="246" y="289">
        <parameter key="add_meta_information" value="false"/>
        <parameter key="keep_text" value="true"/>
        <parameter key="prune_below_absolute" value="2"/>
        <parameter key="prune_above_absolute" value="9999"/>
        <list key="specify_weights"/>
        <process expanded="true">
          <operator activated="true" class="text:tokenize" compatibility="7.0.000" expanded="true"
                    height="68" name="Tokenize" width="90" x="112" y="85"/>
          <operator activated="true" class="text:transform_cases" compatibility="7.0.000" expanded="true"
                    height="68" name="Transform Cases" width="90" x="246" y="85"/>
          <operator activated="true" class="text:filter_stopwords_german" compatibility="7.0.000" expanded="true"
                    height="68" name="Filter Stopwords (German)" width="90" x="380" y="85"/>
          <connect from_port="document" to_op="Tokenize" to_port="document"/>
          <connect from_op="Tokenize" from_port="document"
                   to_op="Transform Cases" to_port="document"/>
          <connect from_op="Transform Cases" from_port="document"
                   to_op="Filter Stopwords (German)" to_port="document"/>
          <connect from_op="Filter Stopwords (German)" from_port="document" to_port="document 1"/>
          <portSpacing port="source_document" spacing="0"/>
          <portSpacing port="sink_document 1" spacing="0"/>
          <portSpacing port="sink_document 2" spacing="0"/>
        </process>
      </operator>
      <operator activated="true" class="data_to_similarity" compatibility="7.0.001" expanded="true"
                height="82" name="Data to Similarity" width="90" x="447" y="340">
        <parameter key="measure_types" value="NumericalMeasures"/>
        <parameter key="numerical_measure" value="CosineSimilarity"/>
      </operator>
      <connect from_op="Retrieve t123_product_import_23032016" from_port="output"
               to_op="Select Attributes" to_port="example set input"/>
      <connect from_op="Select Attributes" from_port="example set output"
               to_op="Split Data" to_port="example set"/>
      <connect from_op="Split Data" from_port="partition 1"
               to_op="Nominal to Text" to_port="example set input"/>
      <connect from_op="Nominal to Text" from_port="example set output"
               to_op="Process Documents from Data" to_port="example set"/>
      <connect from_op="Process Documents from Data" from_port="example set"
               to_op="Data to Similarity" to_port="example set"/>
      <connect from_op="Data to Similarity" from_port="similarity" to_port="result 1"/>
      <connect from_op="Data to Similarity" from_port="example set" to_port="result 2"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
      <portSpacing port="sink_result 3" spacing="0"/>
    </process>
  </operator>
</process>
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner demo process: Cross Distances on hand-made data, then one row
  per request with its nearest reference ids.

  Subprocess:
    out 1: one generated example (attribute1..3 = 1, 2, 3) with a nominal id.
    out 2: six generated examples appended in port order
           (1,2,3) (4,5,6) (7,8,6) (4,8,6) (100,5,6) (100,100,6),
           then given nominal ids.
  Main flow:
    Cross Distances (top-k only, k = 3) takes out 1 as request set and out 2
    as reference set. Aggregate groups the result by "request" and
    concatenates the "document" attribute.

  NOTE(review): numerical_measure is set to KernelEuclideanDistance but
  measure_types is not set in this export, so the numerical measure may not
  be the one actually applied. Confirm in the operator's parameter panel.
-->
<process version="7.0.001">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="6.0.002" expanded="true" name="Process">
    <process expanded="true">
      <operator activated="true" class="subprocess" compatibility="7.0.001" expanded="true"
                height="103" name="Subprocess" width="90" x="112" y="85">
        <process expanded="true">
          <operator activated="true" class="generate_data_user_specification" compatibility="6.4.000" expanded="true"
                    height="68" name="Generate Data by User Specification (3)" width="90" x="179" y="30">
            <list key="attribute_values">
              <parameter key="attribute1" value="1"/>
              <parameter key="attribute2" value="2"/>
              <parameter key="attribute3" value="3"/>
            </list>
            <list key="set_additional_roles"/>
          </operator>
          <operator activated="true" class="generate_data_user_specification" compatibility="6.4.000" expanded="true"
                    height="68" name="Generate Data by User Specification" width="90" x="179" y="165">
            <list key="attribute_values">
              <parameter key="attribute1" value="1"/>
              <parameter key="attribute2" value="2"/>
              <parameter key="attribute3" value="3"/>
            </list>
            <list key="set_additional_roles"/>
          </operator>
          <operator activated="true" class="generate_data_user_specification" compatibility="6.4.000" expanded="true"
                    height="68" name="Generate Data by User Specification (2)" width="90" x="179" y="238">
            <list key="attribute_values">
              <parameter key="attribute1" value="4"/>
              <parameter key="attribute2" value="5"/>
              <parameter key="attribute3" value="6"/>
            </list>
            <list key="set_additional_roles"/>
          </operator>
          <operator activated="true" class="generate_id" compatibility="7.0.001" expanded="true"
                    height="82" name="Generate ID" width="90" x="514" y="30">
            <parameter key="create_nominal_ids" value="true"/>
          </operator>
          <operator activated="true" class="generate_data_user_specification" compatibility="6.4.000" expanded="true"
                    height="68" name="Generate Data by User Specification (4)" width="90" x="179" y="289">
            <list key="attribute_values">
              <parameter key="attribute1" value="7"/>
              <parameter key="attribute2" value="8"/>
              <parameter key="attribute3" value="6"/>
            </list>
            <list key="set_additional_roles"/>
          </operator>
          <operator activated="true" class="generate_data_user_specification" compatibility="6.4.000" expanded="true"
                    height="68" name="Generate Data by User Specification (5)" width="90" x="179" y="340">
            <list key="attribute_values">
              <parameter key="attribute1" value="4"/>
              <parameter key="attribute2" value="8"/>
              <parameter key="attribute3" value="6"/>
            </list>
            <list key="set_additional_roles"/>
          </operator>
          <operator activated="true" class="generate_data_user_specification" compatibility="6.4.000" expanded="true"
                    height="68" name="Generate Data by User Specification (6)" width="90" x="179" y="442">
            <list key="attribute_values">
              <parameter key="attribute1" value="100"/>
              <parameter key="attribute2" value="5"/>
              <parameter key="attribute3" value="6"/>
            </list>
            <list key="set_additional_roles"/>
          </operator>
          <operator activated="true" class="generate_data_user_specification" compatibility="6.4.000" expanded="true"
                    height="68" name="Generate Data by User Specification (7)" width="90" x="179" y="544">
            <list key="attribute_values">
              <parameter key="attribute1" value="100"/>
              <parameter key="attribute2" value="100"/>
              <parameter key="attribute3" value="6"/>
            </list>
            <list key="set_additional_roles"/>
          </operator>
          <operator activated="true" class="append" compatibility="7.0.001" expanded="true"
                    height="187" name="Append" width="90" x="313" y="210"/>
          <operator activated="true" class="generate_id" compatibility="7.0.001" expanded="true"
                    height="82" name="Generate ID (2)" width="90" x="514" y="210">
            <parameter key="create_nominal_ids" value="true"/>
          </operator>
          <connect from_op="Generate Data by User Specification (3)" from_port="output"
                   to_op="Generate ID" to_port="example set input"/>
          <connect from_op="Generate Data by User Specification" from_port="output"
                   to_op="Append" to_port="example set 1"/>
          <connect from_op="Generate Data by User Specification (2)" from_port="output"
                   to_op="Append" to_port="example set 2"/>
          <connect from_op="Generate ID" from_port="example set output" to_port="out 1"/>
          <connect from_op="Generate Data by User Specification (4)" from_port="output"
                   to_op="Append" to_port="example set 3"/>
          <connect from_op="Generate Data by User Specification (5)" from_port="output"
                   to_op="Append" to_port="example set 4"/>
          <connect from_op="Generate Data by User Specification (6)" from_port="output"
                   to_op="Append" to_port="example set 5"/>
          <connect from_op="Generate Data by User Specification (7)" from_port="output"
                   to_op="Append" to_port="example set 6"/>
          <connect from_op="Append" from_port="merged set"
                   to_op="Generate ID (2)" to_port="example set input"/>
          <connect from_op="Generate ID (2)" from_port="example set output" to_port="out 2"/>
          <portSpacing port="source_in 1" spacing="0"/>
          <portSpacing port="sink_out 1" spacing="0"/>
          <portSpacing port="sink_out 2" spacing="162"/>
          <portSpacing port="sink_out 3" spacing="0"/>
        </process>
      </operator>
      <operator activated="true" class="cross_distances" compatibility="7.0.001" expanded="true"
                height="103" name="Cross Distances" width="90" x="313" y="85">
        <parameter key="numerical_measure" value="KernelEuclideanDistance"/>
        <parameter key="only_top_k" value="true"/>
        <parameter key="k" value="3"/>
      </operator>
      <operator activated="true" class="aggregate" compatibility="7.0.001" expanded="true"
                height="82" name="Aggregate" width="90" x="447" y="34">
        <list key="aggregation_attributes">
          <parameter key="document" value="concatenation"/>
        </list>
        <parameter key="group_by_attributes" value="request"/>
      </operator>
      <connect from_op="Subprocess" from_port="out 1"
               to_op="Cross Distances" to_port="request set"/>
      <connect from_op="Subprocess" from_port="out 2"
               to_op="Cross Distances" to_port="reference set"/>
      <connect from_op="Cross Distances" from_port="result set"
               to_op="Aggregate" to_port="example set input"/>
      <connect from_op="Aggregate" from_port="example set output" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="90"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process: similar products within one ETIM class, based on
  cosine similarity of word vectors.
  Steps, in wiring order:
    1. Retrieve t123_product_import_23032016 and keep sku, description, etim,
       manufacturer, teg_prodnumber and short_description.
    2. Trim the etim attribute, then keep examples with etim equal to EC000374.
       "Filter Examples (2)" (manufacturer equals Gira) is deactivated and
       not wired.
    3. Nominal to Text, then Process Documents from Data with absolute pruning
       (below 2, above 9999): Tokenize, Transform Cases,
       Filter Stopwords (German), Stem (Snowball, German).
    4. Multiply feeds the same vectorized set to both inputs of
       Cross Distances (numerical measures, CosineSimilarity, top-k only).
    5. Normalize the "distance" attribute, then Aggregate: group by "request",
       concatenate "document".

  Fixes:
    * The name "Process Documents from Data" was broken across a line wrap
      inside the attribute value. The parser turns that line break into an
      extra space, so the connections referring to the operator no longer
      matched its name. It is written on one line again.
    * The document pipeline had no Tokenize step, so the stopword filter and
      the stemmer received each whole text as a single token. Tokenize is
      now the first inner operator, as in the sibling processes in this
      thread.
-->
<process version="7.0.001">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="7.0.001" expanded="true" name="Process">
    <process expanded="true">
      <operator activated="true" class="retrieve" compatibility="7.0.001" expanded="true"
                height="68" name="Retrieve t123_product_import_23032016" width="90" x="45" y="34">
        <parameter key="repository_entry" value="//Local Repository/data/t123_product_import_23032016"/>
      </operator>
      <operator activated="true" class="select_attributes" compatibility="7.0.001" expanded="true"
                height="82" name="Select Attributes" width="90" x="246" y="34">
        <parameter key="attribute_filter_type" value="subset"/>
        <parameter key="attribute" value="description"/>
        <parameter key="attributes" value="sku|description|etim|manufacturer|teg_prodnumber|short_description"/>
      </operator>
      <operator activated="true" class="trim" compatibility="7.0.001" expanded="true"
                height="82" name="Trim" width="90" x="380" y="34">
        <parameter key="attribute_filter_type" value="single"/>
        <parameter key="attribute" value="etim"/>
      </operator>
      <operator activated="true" class="filter_examples" compatibility="7.0.001" expanded="true"
                height="103" name="Filter Examples" width="90" x="581" y="34">
        <list key="filters_list">
          <parameter key="filters_entry_key" value="etim.equals.EC000374"/>
        </list>
      </operator>
      <operator activated="false" class="filter_examples" compatibility="7.0.001" expanded="true"
                height="103" name="Filter Examples (2)" width="90" x="782" y="34">
        <list key="filters_list">
          <parameter key="filters_entry_key" value="manufacturer.equals.Gira"/>
        </list>
      </operator>
      <operator activated="true" class="nominal_to_text" compatibility="7.0.001" expanded="true"
                height="82" name="Nominal to Text" width="90" x="246" y="238"/>
      <operator activated="true" class="text:process_document_from_data" compatibility="7.0.000" expanded="true"
                height="82" name="Process Documents from Data" width="90" x="246" y="391">
        <parameter key="keep_text" value="true"/>
        <parameter key="prune_method" value="absolute"/>
        <parameter key="prune_below_absolute" value="2"/>
        <parameter key="prune_above_absolute" value="9999"/>
        <list key="specify_weights"/>
        <process expanded="true">
          <operator activated="true" class="text:tokenize" compatibility="7.0.000" expanded="true"
                    height="68" name="Tokenize" width="90" x="179" y="85"/>
          <operator activated="true" class="text:transform_cases" compatibility="7.0.000" expanded="true"
                    height="68" name="Transform Cases" width="90" x="313" y="85"/>
          <operator activated="true" class="text:filter_stopwords_german" compatibility="7.0.000" expanded="true"
                    height="68" name="Filter Stopwords (German)" width="90" x="447" y="85"/>
          <operator activated="true" class="text:stem_snowball" compatibility="7.0.000" expanded="true"
                    height="68" name="Stem (Snowball)" width="90" x="581" y="85">
            <parameter key="language" value="German"/>
          </operator>
          <connect from_port="document" to_op="Tokenize" to_port="document"/>
          <connect from_op="Tokenize" from_port="document"
                   to_op="Transform Cases" to_port="document"/>
          <connect from_op="Transform Cases" from_port="document"
                   to_op="Filter Stopwords (German)" to_port="document"/>
          <connect from_op="Filter Stopwords (German)" from_port="document"
                   to_op="Stem (Snowball)" to_port="document"/>
          <connect from_op="Stem (Snowball)" from_port="document" to_port="document 1"/>
          <portSpacing port="source_document" spacing="0"/>
          <portSpacing port="sink_document 1" spacing="0"/>
          <portSpacing port="sink_document 2" spacing="0"/>
        </process>
      </operator>
      <operator activated="true" class="multiply" compatibility="7.0.001" expanded="true"
                height="103" name="Multiply" width="90" x="447" y="391"/>
      <operator activated="true" class="cross_distances" compatibility="7.0.001" expanded="true"
                height="103" name="Cross Distances" width="90" x="648" y="391">
        <parameter key="measure_types" value="NumericalMeasures"/>
        <parameter key="numerical_measure" value="CosineSimilarity"/>
        <parameter key="only_top_k" value="true"/>
      </operator>
      <operator activated="true" class="normalize" compatibility="7.0.001" expanded="true"
                height="103" name="Normalize" width="90" x="849" y="238">
        <parameter key="attribute_filter_type" value="single"/>
        <parameter key="attribute" value="distance"/>
      </operator>
      <operator activated="true" class="aggregate" compatibility="7.0.001" expanded="true"
                height="82" name="Aggregate" width="90" x="1117" y="238">
        <list key="aggregation_attributes">
          <parameter key="document" value="concatenation"/>
        </list>
        <parameter key="group_by_attributes" value="request"/>
      </operator>
      <connect from_op="Retrieve t123_product_import_23032016" from_port="output"
               to_op="Select Attributes" to_port="example set input"/>
      <connect from_op="Select Attributes" from_port="example set output"
               to_op="Trim" to_port="example set input"/>
      <connect from_op="Trim" from_port="example set output"
               to_op="Filter Examples" to_port="example set input"/>
      <connect from_op="Filter Examples" from_port="example set output"
               to_op="Nominal to Text" to_port="example set input"/>
      <connect from_op="Nominal to Text" from_port="example set output"
               to_op="Process Documents from Data" to_port="example set"/>
      <connect from_op="Process Documents from Data" from_port="example set"
               to_op="Multiply" to_port="input"/>
      <connect from_op="Multiply" from_port="output 1"
               to_op="Cross Distances" to_port="request set"/>
      <connect from_op="Multiply" from_port="output 2"
               to_op="Cross Distances" to_port="reference set"/>
      <connect from_op="Cross Distances" from_port="result set"
               to_op="Normalize" to_port="example set input"/>
      <connect from_op="Normalize" from_port="example set output"
               to_op="Aggregate" to_port="example set input"/>
      <connect from_op="Aggregate" from_port="example set output" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>