<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  The following sentence originally sat on its own line ABOVE the XML declaration.
  Nothing may precede the declaration in a well-formed document, so it is kept
  here verbatim instead:

    "A program to recognize and reward our most engaged community members"

  NOTE(review): this reads like page text unrelated to the process below; confirm
  whether it should be kept at all.
-->
<!--
  Process definition, format version 5.2.008 (the operator classes match the
  RapidMiner process XML format).

  Top-level wiring, as declared by the <connect> elements of the outer process:
    1. "Clarity_XOG_GEL_WSDL" (retrieve) feeds "Process Documents from Data".
    2. The resulting example set feeds "Clustering" (k_means, k = 5).
    3. The cluster model feeds "Extract Cluster Prototypes".

  Result ports:
    result 1 = example set of "Extract Cluster Prototypes"
    result 2 = model of "Extract Cluster Prototypes"
    result 3 = clustered set of "Clustering"
    result 4 = word list of "Process Documents from Data"
-->
<process version="5.2.008">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true"
            class="process"
            compatibility="5.2.008"
            expanded="true"
            name="Process">
    <process expanded="true" height="685" width="1016">

      <!-- Input: loads the repository entry given relative to this process. -->
      <operator activated="true"
                class="retrieve"
                compatibility="5.2.008"
                expanded="true"
                height="60"
                name="Clarity_XOG_GEL_WSDL"
                width="90"
                x="45"
                y="300">
        <parameter key="repository_entry" value="../Data/Clarity_XOG_GEL_WSDL"/>
      </operator>

      <!--
        Document processing. Pruning is absolute with bounds 2 and 9999; the
        original text is kept and no meta information is added. The nested
        process below defines the per-document token pipeline.
      -->
      <operator activated="true"
                class="text:process_document_from_data"
                compatibility="5.2.004"
                expanded="true"
                height="76"
                name="Process Documents from Data"
                width="90"
                x="179"
                y="210">
        <parameter key="add_meta_information" value="false"/>
        <parameter key="keep_text" value="true"/>
        <parameter key="prune_method" value="absolute"/>
        <parameter key="prune_below_absolute" value="2"/>
        <parameter key="prune_above_absolute" value="9999"/>
        <list key="specify_weights"/>
        <process expanded="true" height="550" width="728">

          <!--
            Active chain, in <connect> order:
              Extract Content, Tokenize, Transform Cases,
              Filter Stopwords (English), Replace Tokens,
              Filter Tokens (by Length), then sink port "document 1".
          -->
          <operator activated="true"
                    class="web:extract_html_text_content"
                    compatibility="5.2.003"
                    expanded="true"
                    height="60"
                    name="Extract Content"
                    width="90"
                    x="112"
                    y="30">
            <parameter key="minimum_text_block_length" value="3"/>
          </operator>
          <operator activated="true"
                    class="text:tokenize"
                    compatibility="5.2.004"
                    expanded="true"
                    height="60"
                    name="Tokenize"
                    width="90"
                    x="45"
                    y="120"/>
          <operator activated="true"
                    class="text:transform_cases"
                    compatibility="5.2.004"
                    expanded="true"
                    height="60"
                    name="Transform Cases"
                    width="90"
                    x="45"
                    y="210"/>
          <operator activated="true"
                    class="text:filter_stopwords_english"
                    compatibility="5.2.004"
                    expanded="true"
                    height="60"
                    name="Filter Stopwords (English)"
                    width="90"
                    x="45"
                    y="300"/>

          <!--
            Every dictionary entry maps its key to a single space.
            NOTE(review): the keys " munity" and " munities" start with a space;
            presumably they match what is left of "community"/"communities"
            after the earlier "com" entry has been applied. Confirm before
            "fixing" them. Short keys such as "ca", "hi" and "use" may also
            match inside longer tokens; verify this is intended.
          -->
          <operator activated="true"
                    class="text:replace_tokens"
                    compatibility="5.2.004"
                    expanded="true"
                    height="60"
                    name="Replace Tokens"
                    width="90"
                    x="246"
                    y="300">
            <list key="replace_dictionary">
              <parameter key="chris" value=" "/>
              <parameter key="clarity" value=" "/>
              <parameter key="ca" value=" "/>
              <parameter key="com" value=" "/>
              <parameter key="hi" value=" "/>
              <parameter key=" munity" value=" "/>
              <parameter key=" munities" value=" "/>
              <parameter key="use" value=" "/>
              <parameter key="user" value=" "/>
            </list>
          </operator>

          <!-- Disabled (activated="false") and not referenced by any <connect>. -->
          <operator activated="false"
                    class="text:stem_snowball"
                    compatibility="5.2.004"
                    expanded="true"
                    height="60"
                    name="Stem (Snowball)"
                    width="90"
                    x="581"
                    y="480"/>

          <operator activated="true"
                    class="text:filter_by_length"
                    compatibility="5.2.004"
                    expanded="true"
                    height="60"
                    name="Filter Tokens (by Length)"
                    width="90"
                    x="380"
                    y="300">
            <parameter key="min_chars" value="2"/>
          </operator>

          <!-- Disabled (activated="false") and not referenced by any <connect>. -->
          <operator activated="false"
                    class="text:generate_n_grams_terms"
                    compatibility="5.2.004"
                    expanded="true"
                    height="60"
                    name="Generate n-Grams (Terms)"
                    width="90"
                    x="581"
                    y="390">
            <parameter key="max_length" value="3"/>
          </operator>

          <!-- Wiring of the per-document pipeline. -->
          <connect from_port="document" to_op="Extract Content" to_port="document"/>
          <connect from_op="Extract Content" from_port="document" to_op="Tokenize" to_port="document"/>
          <connect from_op="Tokenize" from_port="document" to_op="Transform Cases" to_port="document"/>
          <connect from_op="Transform Cases" from_port="document" to_op="Filter Stopwords (English)" to_port="document"/>
          <connect from_op="Filter Stopwords (English)" from_port="document" to_op="Replace Tokens" to_port="document"/>
          <connect from_op="Replace Tokens" from_port="document" to_op="Filter Tokens (by Length)" to_port="document"/>
          <connect from_op="Filter Tokens (by Length)" from_port="document" to_port="document 1"/>
          <portSpacing port="source_document" spacing="0"/>
          <portSpacing port="sink_document 1" spacing="0"/>
          <portSpacing port="sink_document 2" spacing="0"/>
        </process>
      </operator>

      <!-- Clustering of the processed example set into k = 5 clusters. -->
      <operator activated="true"
                class="k_means"
                compatibility="5.2.008"
                expanded="true"
                height="76"
                name="Clustering"
                width="90"
                x="313"
                y="165">
        <parameter key="k" value="5"/>
      </operator>

      <!-- Consumes the cluster model; both of its outputs are exposed as results. -->
      <operator activated="true"
                class="extract_prototypes"
                compatibility="5.2.008"
                expanded="true"
                height="76"
                name="Extract Cluster Prototypes"
                width="90"
                x="581"
                y="345"/>

      <!-- Wiring of the outer process and its result ports. -->
      <connect from_op="Clarity_XOG_GEL_WSDL" from_port="output" to_op="Process Documents from Data" to_port="example set"/>
      <connect from_op="Process Documents from Data" from_port="example set" to_op="Clustering" to_port="example set"/>
      <connect from_op="Process Documents from Data" from_port="word list" to_port="result 4"/>
      <connect from_op="Clustering" from_port="cluster model" to_op="Extract Cluster Prototypes" to_port="model"/>
      <connect from_op="Clustering" from_port="clustered set" to_port="result 3"/>
      <connect from_op="Extract Cluster Prototypes" from_port="example set" to_port="result 1"/>
      <connect from_op="Extract Cluster Prototypes" from_port="model" to_port="result 2"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
      <portSpacing port="sink_result 3" spacing="0"/>
      <portSpacing port="sink_result 4" spacing="0"/>
      <portSpacing port="sink_result 5" spacing="0"/>
    </process>
  </operator>
</process>