Stability of Feature Selection

ozgeozyazar
ozgeozyazar New Altair Community Member
edited November 2024 in Community Q&A
Hi !

I have applied the attached stability process, but I am not sure whether I selected the log parameters for the Jaccard and Kuncheva indexes correctly. Could you please help me correct the process and advise how I can interpret the results of the Kuncheva and Jaccard indexes?

<?xml version="1.0" encoding="UTF-8"?><process version="8.0.001">
  <!-- RapidMiner process: reads an Excel sheet, then runs a parameter loop around a
       feature-selection stability evaluation (with an inner MRMR-FS operator) and logs two values per run. -->
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="6.0.002" expanded="true" name="Process">
    <process expanded="true">
      <!-- Read Excel: imports cell range A1:AQ1100 from a hard-coded local workbook path.
           The meta data list below declares 43 columns (keys 0 to 42). Each entry appears to follow
           the pattern name.flag.type.role (TODO confirm): ID is the only entry flagged false,
           MACRO (key 34) is the only entry with role "label" (type binominal), and every other
           entry has role "attribute". Row 0 is annotated as "Name" while first_row_as_names is false. -->
      <operator activated="true" class="read_excel" compatibility="8.0.001" expanded="true" height="68" name="Read Excel" width="90" x="179" y="34">
        <parameter key="excel_file" value="C:\Users\AngelsChange\Desktop\SPSS-TEZ\Descriptive 2\MACRO\MACRO_KNN.xlsx"/>
        <parameter key="imported_cell_range" value="A1:AQ1100"/>
        <parameter key="first_row_as_names" value="false"/>
        <list key="annotations">
          <parameter key="0" value="Name"/>
        </list>
        <list key="data_set_meta_data_information">
          <parameter key="0" value="ID.false.integer.attribute"/>
          <parameter key="1" value="DISEASE_DURATION.true.integer.attribute"/>
          <parameter key="2" value="AGE.true.integer.attribute"/>
          <parameter key="3" value="WEIGHT.true.numeric.attribute"/>
          <parameter key="4" value="HEIGHT.true.real.attribute"/>
          <parameter key="5" value="BMI.true.real.attribute"/>
          <parameter key="6" value="FBG.true.integer.attribute"/>
          <parameter key="7" value="PBG.true.numeric.attribute"/>
          <parameter key="8" value="HbA1c.true.numeric.attribute"/>
          <parameter key="9" value="FBG_HbA1c.true.real.attribute"/>
          <parameter key="10" value="PBG_HbA1c.true.numeric.attribute"/>
          <parameter key="11" value="TColl.true.numeric.attribute"/>
          <parameter key="12" value="TG.true.integer.attribute"/>
          <parameter key="13" value="HDLK.true.numeric.attribute"/>
          <parameter key="14" value="LDLK.true.numeric.attribute"/>
          <parameter key="15" value="LDL_HDL.true.numeric.attribute"/>
          <parameter key="16" value="TColl_HDL.true.numeric.attribute"/>
          <parameter key="17" value="Cr.true.numeric.attribute"/>
          <parameter key="18" value="ALB.true.numeric.attribute"/>
          <parameter key="19" value="ALB_CR.true.numeric.attribute"/>
          <parameter key="20" value="GFR.true.numeric.attribute"/>
          <parameter key="21" value="CCI.true.integer.attribute"/>
          <parameter key="22" value="CONTROL_7\.5.true.integer.attribute"/>
          <parameter key="23" value="CONTROL_6.true.integer.attribute"/>
          <parameter key="24" value="CONTROL_6\.5.true.integer.attribute"/>
          <parameter key="25" value="CONTROL_7.true.integer.attribute"/>
          <parameter key="26" value="GENDER.true.integer.attribute"/>
          <parameter key="27" value="BACKGROUND_INFORMATION.true.integer.attribute"/>
          <parameter key="28" value="FAMILY_HEALTH_STORY.true.integer.attribute"/>
          <parameter key="29" value="INSULINE_TREATMENT.true.integer.attribute"/>
          <parameter key="30" value="BMI_DEGREE.true.integer.attribute"/>
          <parameter key="31" value="PATIENTS_STATUS.true.integer.attribute"/>
          <parameter key="32" value="SMOKING_HABIT.true.integer.attribute"/>
          <parameter key="33" value="HYPERTENSION.true.integer.attribute"/>
          <parameter key="34" value="MACRO.true.binominal.label"/>
          <parameter key="35" value="MICRO.true.integer.attribute"/>
          <parameter key="36" value="CODISEASE.true.integer.attribute"/>
          <parameter key="37" value="HBA1C_DEGREE.true.integer.attribute"/>
          <parameter key="38" value="GLUCOSE_LEVEL_RISK_DEGREE.true.integer.attribute"/>
          <parameter key="39" value="LIPID_PROFILE.true.integer.attribute"/>
          <parameter key="40" value="CREATININE_DEGREE.true.integer.attribute"/>
          <parameter key="41" value="ALBUMIN_DEGREE.true.integer.attribute"/>
          <parameter key="42" value="GFR_DEGREE.true.integer.attribute"/>
        </list>
      </operator>
      <!-- Loop Parameters (2): varies three parameters of the nested operators:
           the relevance/redundancy relation of MRMR-FS (2) (quotient, difference),
           the sampling type of Stability (2) (four listed values), and k of MRMR-FS (2)
           using the grid [0.0;100.0;10;linear] (presumably min;max;steps;scale, TODO confirm).
           NOTE(review): the k grid reaches 100 while the Read Excel meta data declares only
           43 columns; confirm that values of k at 0 and above the attribute count are intended. -->
      <operator activated="true" class="concurrency:loop_parameters" compatibility="8.0.001" expanded="true" height="82" name="Loop Parameters (2)" width="90" x="380" y="85">
        <list key="parameters">
          <parameter key="MRMR-FS (2).relevance_redundancy_relation" value="quotient,difference"/>
          <parameter key="Stability (2).sampling_type" value="linear sampling,shuffled sampling,stratified sampling,automatic"/>
          <parameter key="MRMR-FS (2).k" value="[0.0;100.0;10;linear]"/>
        </list>
        <process expanded="true">
          <!-- Stability (2): stability evaluator from the featselext extension. Its inner process
               feeds the incoming example set to MRMR-FS (2) and returns that operator's weights.
               The sampling_type, k and relevance_redundancy_relation values set here are the same
               parameters listed in the enclosing loop, so they are presumably overridden on each
               iteration (verify). -->
          <operator activated="true" class="featselext:feature_selection_stability_evaluator" compatibility="1.1.004" expanded="true" height="103" name="Stability (2)" width="90" x="112" y="136">
            <parameter key="sampling_type" value="automatic"/>
            <process expanded="true">
              <operator activated="true" class="featselext:mrmr_feature_selection" compatibility="1.1.004" expanded="true" height="82" name="MRMR-FS (2)" width="90" x="313" y="187">
                <parameter key="normalize_weights" value="true"/>
                <parameter key="k" value="50"/>
                <parameter key="relevance_redundancy_relation" value="difference"/>
              </operator>
              <connect from_port="exampleset" to_op="MRMR-FS (2)" to_port="example set"/>
              <connect from_op="MRMR-FS (2)" from_port="weights" to_port="weights"/>
              <portSpacing port="source_exampleset" spacing="0"/>
              <portSpacing port="sink_weights" spacing="0"/>
            </process>
          </operator>
          <!-- Log (2): writes to a hard-coded local log file. Column "jaccard" is bound to the
               Stability (2) value "robustness" and column "kuncheva" to the value "consistency".
               NOTE(review): the connections below use Stability (2) output ports named
               "robustness" and "kuncheva", whereas the logged value names are "robustness" and
               "consistency"; confirm against the extension that both value names exist and map
               to the Jaccard and Kuncheva indexes as the column names suggest. -->
          <operator activated="true" class="log" compatibility="8.0.001" expanded="true" height="103" name="Log (2)" width="90" x="313" y="136">
            <parameter key="filename" value="C:\Users\AngelsChange\Desktop\wer.log"/>
            <list key="log">
              <parameter key="jaccard" value="operator.Stability (2).value.robustness"/>
              <parameter key="kuncheva" value="operator.Stability (2).value.consistency"/>
            </list>
          </operator>
          <!-- Wiring inside the loop: input 1 goes to Stability (2); both Stability (2) outputs are
               passed through Log (2), then through 1 feeds the loop's performance sink and
               through 2 feeds output 1. -->
          <connect from_port="input 1" to_op="Stability (2)" to_port="exampleset"/>
          <connect from_op="Stability (2)" from_port="robustness" to_op="Log (2)" to_port="through 1"/>
          <connect from_op="Stability (2)" from_port="kuncheva" to_op="Log (2)" to_port="through 2"/>
          <connect from_op="Log (2)" from_port="through 1" to_port="performance"/>
          <connect from_op="Log (2)" from_port="through 2" to_port="output 1"/>
          <portSpacing port="source_input 1" spacing="0"/>
          <portSpacing port="source_input 2" spacing="0"/>
          <portSpacing port="sink_performance" spacing="0"/>
          <portSpacing port="sink_output 1" spacing="0"/>
          <portSpacing port="sink_output 2" spacing="0"/>
        </process>
      </operator>
      <!-- Top-level wiring: process input 1 is connected to the "file" port of Read Excel, whose
           output feeds the loop. Only the loop's output 1 is delivered (to result 2); no
           connection targets result 1 or result 3. -->
      <connect from_port="input 1" to_op="Read Excel" to_port="file"/>
      <connect from_op="Read Excel" from_port="output" to_op="Loop Parameters (2)" to_port="input 1"/>
      <connect from_op="Loop Parameters (2)" from_port="output 1" to_port="result 2"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="source_input 2" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
      <portSpacing port="sink_result 3" spacing="0"/>
    </process>
  </operator>
</process>

Answers

  • ozgeozyazar
    ozgeozyazar New Altair Community Member
    If you have an idea, please share it with me, since I need to complete my thesis and this is an important part :(
  • rfuentealba
    rfuentealba New Altair Community Member
    Hello, @ozgeozyazar

    When I import your process, RapidMiner tells me the following:


    I need more information, as you are working with an old version of RapidMiner and you haven't provided information on which plugins you are using, etc.

    All the best,

    Rodrigo.

Welcome!

It looks like you're new here. Sign in or register to get started.

Welcome!

It looks like you're new here. Sign in or register to get started.