Error when trying to write SIM

MarlaBot
MarlaBot New Altair Community Member
edited November 5 in Community Q&A
A RapidMiner user wants to know the answer to this question: "Hey everyone. I want to write a SIM (similarity measure object). I tried using "Write Database", but I received an error. I tried other operators such as "Write CSV", but they all failed. The error message I get is "Expected ExampleSet but received SimilarityMeasureObject". Any tips? Thanks. I am attaching the XML process below."
Tagged:

Best Answer

  • varunm1
    varunm1 New Altair Community Member
    Answer ✓
    Hello @up201708850

    You need to connect a Similarity to Data operator after the Data to Similarity operator. This will give you an ExampleSet that can be stored using Write CSV or Write Excel.

Answers

  • up201708850
    up201708850 New Altair Community Member
    <?xml version="1.0" encoding="UTF-8"?><process version="8.0.001">
      <!--
        RapidMiner process posted by the question author.
        Main flow (per the connect elements near the end of the outer process):
        Retrieve dbo.tbPmRmSmpCOLUMBIDAE, Set Role, Select Attributes, Filter Examples,
        Process Documents from Data, Multiply, then Write Database (2) and Data to Similarity.
        A second, independent branch runs Retrieve into WordList to Data.
        NOTE(review): no connect element uses "Data to Similarity" as its from_op, so the
        similarity object it produces is never converted, written, or delivered as a result.
      -->
      <context>
        <input/>
        <output/>
        <macros/>
      </context>
      <operator activated="true" class="process" compatibility="8.0.001" expanded="true" name="Process">
        <parameter key="logfile" value="e0"/>
        <parameter key="resultfile" value="e1"/>
        <process expanded="true">
          <!-- Deactivated (activated="false") and not referenced by any connection below. -->
          <operator activated="false" class="retrieve" compatibility="8.0.001" expanded="true" height="68" name="Retrieve dbo.tbPmRmSmp100" width="90" x="45" y="34">
            <parameter key="repository_entry" value="//DB/SQLEXPRESS01/Example Sets/dbo.tbPmRmSmp100"/>
          </operator>
          <!-- Active data source: its output feeds Set Role. -->
          <operator activated="true" class="retrieve" compatibility="8.0.001" expanded="true" height="68" name="Retrieve dbo.tbPmRmSmpCOLUMBIDAE" width="90" x="112" y="187">
            <parameter key="repository_entry" value="//DB/SQLEXPRESS01/Example Sets/dbo.tbPmRmSmpCOLUMBIDAE"/>
          </operator>
          <!-- Gives the attribute IdDo the target role "label". -->
          <operator activated="true" class="set_role" compatibility="8.0.001" expanded="true" height="82" name="Set Role" width="90" x="313" y="187">
            <parameter key="attribute_name" value="IdDo"/>
            <parameter key="target_role" value="label"/>
            <list key="set_additional_roles"/>
          </operator>
          <!-- Selects the attribute subset named in "attributes" (CdVal and IdCttMdd). -->
          <operator activated="true" class="select_attributes" compatibility="8.0.001" expanded="true" height="82" name="Select Attributes" width="90" x="447" y="187">
            <parameter key="attribute_filter_type" value="subset"/>
            <parameter key="attributes" value="CdVal|IdCttMdd"/>
          </operator>
          <!-- Single filter entry on IdCttMdd; presumably keeps rows where IdCttMdd equals 2 (confirm the .eq. semantics). -->
          <operator activated="true" class="filter_examples" compatibility="8.0.001" expanded="true" height="103" name="Filter Examples" width="90" x="581" y="187">
            <list key="filters_list">
              <parameter key="filters_entry_key" value="IdCttMdd.eq.2"/>
            </list>
          </operator>
          <!--
            Text-processing subprocess. Connected chain inside it:
            Transform Cases, Tokenize, Filter Stopwords (English), Filter Tokens (by Length),
            Stem (Porter), then the "document 1" sink.
            Its "example set" output goes to Multiply and its "word list" output goes to Store.
          -->
          <operator activated="true" class="text:process_document_from_data" compatibility="8.1.000" expanded="true" height="82" name="Process Documents from Data" width="90" x="715" y="187">
            <list key="specify_weights"/>
            <process expanded="true">
              <operator activated="true" class="text:transform_cases" compatibility="8.1.000" expanded="true" height="68" name="Transform Cases" width="90" x="45" y="34">
                <parameter key="transform_to" value="upper case"/>
              </operator>
              <!-- Mode is "specify characters" with "," as the character; NOTE(review): the "expression" value is presumably unused in this mode, confirm. -->
              <operator activated="true" class="text:tokenize" compatibility="8.1.000" expanded="true" height="68" name="Tokenize" width="90" x="179" y="34">
                <parameter key="mode" value="specify characters"/>
                <parameter key="characters" value=","/>
                <parameter key="expression" value="(?is)"/>
              </operator>
              <operator activated="true" class="text:filter_stopwords_english" compatibility="8.1.000" expanded="true" height="68" name="Filter Stopwords (English)" width="90" x="313" y="85"/>
              <!-- Deactivated and not part of the connected chain. -->
              <operator activated="false" class="text:filter_tokens_by_pos" compatibility="8.1.000" expanded="true" height="68" name="Filter Tokens (by POS Tags)" width="90" x="45" y="187"/>
              <operator activated="true" class="text:filter_by_length" compatibility="8.1.000" expanded="true" height="68" name="Filter Tokens (by Length)" width="90" x="447" y="136">
                <parameter key="min_chars" value="3"/>
              </operator>
              <operator activated="true" class="text:stem_porter" compatibility="8.1.000" expanded="true" height="68" name="Stem (Porter)" width="90" x="380" y="34"/>
              <!-- Deactivated and not part of the connected chain. -->
              <operator activated="false" class="text:generate_n_grams_terms" compatibility="8.1.000" expanded="true" height="68" name="Generate n-Grams (Terms)" width="90" x="514" y="238">
                <parameter key="max_length" value="10"/>
              </operator>
              <connect from_port="document" to_op="Transform Cases" to_port="document"/>
              <connect from_op="Transform Cases" from_port="document" to_op="Tokenize" to_port="document"/>
              <connect from_op="Tokenize" from_port="document" to_op="Filter Stopwords (English)" to_port="document"/>
              <connect from_op="Filter Stopwords (English)" from_port="document" to_op="Filter Tokens (by Length)" to_port="document"/>
              <connect from_op="Filter Tokens (by Length)" from_port="document" to_op="Stem (Porter)" to_port="document"/>
              <connect from_op="Stem (Porter)" from_port="document" to_port="document 1"/>
              <portSpacing port="source_document" spacing="0"/>
              <portSpacing port="sink_document 1" spacing="0"/>
              <portSpacing port="sink_document 2" spacing="0"/>
            </process>
          </operator>
          <!-- Receives the "word list" output of Process Documents from Data and stores it under the entry Result01. -->
          <operator activated="true" class="store" compatibility="8.0.001" expanded="true" height="68" name="Store" width="90" x="916" y="289">
            <parameter key="repository_entry" value="Result01"/>
          </operator>
          <!-- Fans the example set out to two consumers: Write Database (2) and Data to Similarity. -->
          <operator activated="true" class="multiply" compatibility="8.0.001" expanded="true" height="103" name="Multiply" width="90" x="916" y="136"/>
          <!-- Receives the example set from Multiply (output 1); targets table "aaa" on connection SQLEXPRESS01 with overwrite_mode "overwrite". -->
          <operator activated="true" class="jdbc_connectors:write_database" compatibility="8.0.001" expanded="true" height="68" name="Write Database (2)" width="90" x="1050" y="136">
            <parameter key="connection" value="SQLEXPRESS01"/>
            <parameter key="table_name" value="aaa"/>
            <parameter key="overwrite_mode" value="overwrite"/>
          </operator>
          <!--
            Receives the example set from Multiply (output 2).
            NOTE(review): none of this operator's output ports is connected in this process.
            The error quoted in the question says the writer expected an ExampleSet, so the
            similarity output presumably has to be converted to an example set before it can be written.
          -->
          <operator activated="true" class="data_to_similarity" compatibility="8.0.001" expanded="true" height="82" name="Data to Similarity" width="90" x="1050" y="238"/>
          <!-- Reads the entry Result01, the same entry the Store operator writes. NOTE(review): no connection links this operator to Store, so confirm that Store runs first. -->
          <operator activated="true" class="retrieve" compatibility="8.0.001" expanded="true" height="68" name="Retrieve" width="90" x="45" y="391">
            <parameter key="repository_entry" value="Result01"/>
          </operator>
          <operator activated="true" class="text:wordlist_to_data" compatibility="8.1.000" expanded="true" height="82" name="WordList to Data" width="90" x="179" y="391"/>
          <!-- Wiring of the outer process. -->
          <connect from_op="Retrieve dbo.tbPmRmSmpCOLUMBIDAE" from_port="output" to_op="Set Role" to_port="example set input"/>
          <connect from_op="Set Role" from_port="example set output" to_op="Select Attributes" to_port="example set input"/>
          <connect from_op="Select Attributes" from_port="example set output" to_op="Filter Examples" to_port="example set input"/>
          <connect from_op="Filter Examples" from_port="example set output" to_op="Process Documents from Data" to_port="example set"/>
          <connect from_op="Process Documents from Data" from_port="example set" to_op="Multiply" to_port="input"/>
          <connect from_op="Process Documents from Data" from_port="word list" to_op="Store" to_port="input"/>
          <connect from_op="Multiply" from_port="output 1" to_op="Write Database (2)" to_port="input"/>
          <connect from_op="Multiply" from_port="output 2" to_op="Data to Similarity" to_port="example set"/>
          <!-- Process results: the "through" port of Write Database (2) and the "word list" port of WordList to Data. -->
          <connect from_op="Write Database (2)" from_port="through" to_port="result 1"/>
          <connect from_op="Retrieve" from_port="output" to_op="WordList to Data" to_port="word list"/>
          <connect from_op="WordList to Data" from_port="word list" to_port="result 2"/>
          <portSpacing port="source_input 1" spacing="0"/>
          <portSpacing port="sink_result 1" spacing="0"/>
          <portSpacing port="sink_result 2" spacing="0"/>
          <portSpacing port="sink_result 3" spacing="0"/>
        </process>
      </operator>
    </process>


  • varunm1
    varunm1 New Altair Community Member
    Answer ✓
    Hello @up201708850

    You need to connect a Similarity to Data operator after the Data to Similarity operator. This will give you an ExampleSet that can be stored using Write CSV or Write Excel.