Stability of Feature Selection

ozgeozyazar
ozgeozyazar New Altair Community Member
edited November 2024 in Community Q&A
Hi !

I have applied attached stability process but I am not sure if I correctly selected log parameters for for jaccard and kuncheva indexes. Could you please help me to correct the process and advice how can I interpret the results of kucheva and jaccard index ?

<?xml version="1.0" encoding="UTF-8"?><process version="8.0.001">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="6.0.002" expanded="true" name="Process">
    <process expanded="true">
      <operator activated="true" class="read_excel" compatibility="8.0.001" expanded="true" height="68" name="Read Excel" width="90" x="179" y="34">
        <parameter key="excel_file" value="C:\Users\AngelsChange\Desktop\SPSS-TEZ\Descriptive 2\MACRO\MACRO_KNN.xlsx"/>
        <parameter key="imported_cell_range" value="A1:AQ1100"/>
        <parameter key="first_row_as_names" value="false"/>
        <list key="annotations">
          <parameter key="0" value="Name"/>
        </list>
        <list key="data_set_meta_data_information">
          <parameter key="0" value="ID.false.integer.attribute"/>
          <parameter key="1" value="DISEASE_DURATION.true.integer.attribute"/>
          <parameter key="2" value="AGE.true.integer.attribute"/>
          <parameter key="3" value="WEIGHT.true.numeric.attribute"/>
          <parameter key="4" value="HEIGHT.true.real.attribute"/>
          <parameter key="5" value="BMI.true.real.attribute"/>
          <parameter key="6" value="FBG.true.integer.attribute"/>
          <parameter key="7" value="PBG.true.numeric.attribute"/>
          <parameter key="8" value="HbA1c.true.numeric.attribute"/>
          <parameter key="9" value="FBG_HbA1c.true.real.attribute"/>
          <parameter key="10" value="PBG_HbA1c.true.numeric.attribute"/>
          <parameter key="11" value="TColl.true.numeric.attribute"/>
          <parameter key="12" value="TG.true.integer.attribute"/>
          <parameter key="13" value="HDLK.true.numeric.attribute"/>
          <parameter key="14" value="LDLK.true.numeric.attribute"/>
          <parameter key="15" value="LDL_HDL.true.numeric.attribute"/>
          <parameter key="16" value="TColl_HDL.true.numeric.attribute"/>
          <parameter key="17" value="Cr.true.numeric.attribute"/>
          <parameter key="18" value="ALB.true.numeric.attribute"/>
          <parameter key="19" value="ALB_CR.true.numeric.attribute"/>
          <parameter key="20" value="GFR.true.numeric.attribute"/>
          <parameter key="21" value="CCI.true.integer.attribute"/>
          <parameter key="22" value="CONTROL_7\.5.true.integer.attribute"/>
          <parameter key="23" value="CONTROL_6.true.integer.attribute"/>
          <parameter key="24" value="CONTROL_6\.5.true.integer.attribute"/>
          <parameter key="25" value="CONTROL_7.true.integer.attribute"/>
          <parameter key="26" value="GENDER.true.integer.attribute"/>
          <parameter key="27" value="BACKGROUND_INFORMATION.true.integer.attribute"/>
          <parameter key="28" value="FAMILY_HEALTH_STORY.true.integer.attribute"/>
          <parameter key="29" value="INSULINE_TREATMENT.true.integer.attribute"/>
          <parameter key="30" value="BMI_DEGREE.true.integer.attribute"/>
          <parameter key="31" value="PATIENTS_STATUS.true.integer.attribute"/>
          <parameter key="32" value="SMOKING_HABIT.true.integer.attribute"/>
          <parameter key="33" value="HYPERTENSION.true.integer.attribute"/>
          <parameter key="34" value="MACRO.true.binominal.label"/>
          <parameter key="35" value="MICRO.true.integer.attribute"/>
          <parameter key="36" value="CODISEASE.true.integer.attribute"/>
          <parameter key="37" value="HBA1C_DEGREE.true.integer.attribute"/>
          <parameter key="38" value="GLUCOSE_LEVEL_RISK_DEGREE.true.integer.attribute"/>
          <parameter key="39" value="LIPID_PROFILE.true.integer.attribute"/>
          <parameter key="40" value="CREATININE_DEGREE.true.integer.attribute"/>
          <parameter key="41" value="ALBUMIN_DEGREE.true.integer.attribute"/>
          <parameter key="42" value="GFR_DEGREE.true.integer.attribute"/>
        </list>
      </operator>
      <operator activated="true" class="concurrency:loop_parameters" compatibility="8.0.001" expanded="true" height="82" name="Loop Parameters (2)" width="90" x="380" y="85">
        <list key="parameters">
          <parameter key="MRMR-FS (2).relevance_redundancy_relation" value="quotient,difference"/>
          <parameter key="Stability (2).sampling_type" value="linear sampling,shuffled sampling,stratified sampling,automatic"/>
          <parameter key="MRMR-FS (2).k" value="[0.0;100.0;10;linear]"/>
        </list>
        <process expanded="true">
          <operator activated="true" class="featselext:feature_selection_stability_evaluator" compatibility="1.1.004" expanded="true" height="103" name="Stability (2)" width="90" x="112" y="136">
            <parameter key="sampling_type" value="automatic"/>
            <process expanded="true">
              <operator activated="true" class="featselext:mrmr_feature_selection" compatibility="1.1.004" expanded="true" height="82" name="MRMR-FS (2)" width="90" x="313" y="187">
                <parameter key="normalize_weights" value="true"/>
                <parameter key="k" value="50"/>
                <parameter key="relevance_redundancy_relation" value="difference"/>
              </operator>
              <connect from_port="exampleset" to_op="MRMR-FS (2)" to_port="example set"/>
              <connect from_op="MRMR-FS (2)" from_port="weights" to_port="weights"/>
              <portSpacing port="source_exampleset" spacing="0"/>
              <portSpacing port="sink_weights" spacing="0"/>
            </process>
          </operator>
          <operator activated="true" class="log" compatibility="8.0.001" expanded="true" height="103" name="Log (2)" width="90" x="313" y="136">
            <parameter key="filename" value="C:\Users\AngelsChange\Desktop\wer.log"/>
            <list key="log">
              <parameter key="jaccard" value="operator.Stability (2).value.robustness"/>
              <parameter key="kuncheva" value="operator.Stability (2).value.consistency"/>
            </list>
          </operator>
          <connect from_port="input 1" to_op="Stability (2)" to_port="exampleset"/>
          <connect from_op="Stability (2)" from_port="robustness" to_op="Log (2)" to_port="through 1"/>
          <connect from_op="Stability (2)" from_port="kuncheva" to_op="Log (2)" to_port="through 2"/>
          <connect from_op="Log (2)" from_port="through 1" to_port="performance"/>
          <connect from_op="Log (2)" from_port="through 2" to_port="output 1"/>
          <portSpacing port="source_input 1" spacing="0"/>
          <portSpacing port="source_input 2" spacing="0"/>
          <portSpacing port="sink_performance" spacing="0"/>
          <portSpacing port="sink_output 1" spacing="0"/>
          <portSpacing port="sink_output 2" spacing="0"/>
        </process>
      </operator>
      <connect from_port="input 1" to_op="Read Excel" to_port="file"/>
      <connect from_op="Read Excel" from_port="output" to_op="Loop Parameters (2)" to_port="input 1"/>
      <connect from_op="Loop Parameters (2)" from_port="output 1" to_port="result 2"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="source_input 2" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
      <portSpacing port="sink_result 3" spacing="0"/>
    </process>
  </operator>
</process>

Answers

  • ozgeozyazar
    ozgeozyazar New Altair Community Member
    If you have an idea please share wth me since I need to complete my thesis and it is the important part :(
  • rfuentealba
    rfuentealba New Altair Community Member
    Hello, @ozgeozyazar

    When I import your process, RapidMiner tells me the following:


    I need more information, as you are working with an old version of RapidMiner, and you haven't provided information on what plugins are you using, etc.

    All the best,

    Rodrigo.