How do I perform consistency-based feature selection in RapidMiner Studio?

LookkuyeeLookkuyee Member Posts: 1 Newbie
I'm a student and I have to do a project about data mining and consistency-based feature selection.
But I don't know how to perform consistency-based feature selection in RapidMiner Studio.
So I came here to ask. Thanks in advance for your help.

Answers

  • SGolbertSGolbert RapidMiner Certified Analyst, Member Posts: 225   Unicorn

    It was hard to find, but the operator that you need is available through the Weka Extension. It's called Performance (Consistency).

    Here is a sample process using the Optimize Selection (Evolutionary) operator:
    <?xml version="1.0" encoding="UTF-8"?>
    <process version="9.1.000">
      <context>
        <input/>
        <output/>
        <macros/>
      </context>
      <!-- Root operator: holds the top-level process (Retrieve, then Optimize Selection). -->
      <operator activated="true"
                class="process"
                compatibility="6.0.002"
                expanded="true"
                name="Root"
                origin="GENERATED_TUTORIAL">
        <parameter key="logverbosity" value="init"/>
        <parameter key="random_seed" value="2000"/>
        <parameter key="send_mail" value="never"/>
        <parameter key="notification_email" value=""/>
        <parameter key="process_duration_for_mail" value="30"/>
        <parameter key="encoding" value="SYSTEM"/>
        <process expanded="true">
          <!-- Reads the repository entry //Samples/data/Titanic Training. -->
          <operator activated="true"
                    class="retrieve"
                    compatibility="9.1.000"
                    expanded="true"
                    height="68"
                    name="Retrieve Titanic Training"
                    width="90"
                    x="112"
                    y="34">
            <parameter key="repository_entry" value="//Samples/data/Titanic Training"/>
          </operator>
          <!-- Feature selection operator; its nested process must deliver a value on the "performance" port. -->
          <operator activated="true"
                    class="optimize_selection_evolutionary"
                    compatibility="9.1.000"
                    expanded="true"
                    height="103"
                    name="Optimize Selection (Evolutionary)"
                    origin="GENERATED_TUTORIAL"
                    width="90"
                    x="380"
                    y="34">
            <parameter key="use_exact_number_of_attributes" value="false"/>
            <parameter key="restrict_maximum" value="false"/>
            <parameter key="min_number_of_attributes" value="1"/>
            <parameter key="max_number_of_attributes" value="1"/>
            <parameter key="exact_number_of_attributes" value="1"/>
            <parameter key="initialize_with_input_weights" value="false"/>
            <parameter key="population_size" value="5"/>
            <parameter key="maximum_number_of_generations" value="30"/>
            <parameter key="use_early_stopping" value="false"/>
            <parameter key="generations_without_improval" value="2"/>
            <parameter key="normalize_weights" value="true"/>
            <parameter key="use_local_random_seed" value="false"/>
            <parameter key="local_random_seed" value="1992"/>
            <parameter key="user_result_individual_selection" value="false"/>
            <parameter key="show_population_plotter" value="false"/>
            <parameter key="plot_generations" value="10"/>
            <parameter key="constraint_draw_range" value="false"/>
            <parameter key="draw_dominated_points" value="true"/>
            <parameter key="maximal_fitness" value="Infinity"/>
            <parameter key="selection_scheme" value="tournament"/>
            <parameter key="tournament_size" value="0.25"/>
            <parameter key="start_temperature" value="1.0"/>
            <parameter key="dynamic_selection_pressure" value="true"/>
            <parameter key="keep_best_individual" value="true"/>
            <parameter key="save_intermediate_weights" value="false"/>
            <parameter key="intermediate_weights_generations" value="10"/>
            <parameter key="p_initialize" value="0.5"/>
            <parameter key="p_mutation" value="-1.0"/>
            <parameter key="p_crossover" value="0.5"/>
            <parameter key="crossover_type" value="uniform"/>
            <process expanded="true">
              <!-- Split validation with a relative split ratio of 0.7; contains a training and a testing subprocess. -->
              <operator activated="true"
                        class="split_validation"
                        compatibility="9.1.000"
                        expanded="true"
                        height="124"
                        name="Validation"
                        origin="GENERATED_TUTORIAL"
                        width="90"
                        x="313"
                        y="30">
                <parameter key="create_complete_model" value="false"/>
                <parameter key="split" value="relative"/>
                <parameter key="split_ratio" value="0.7"/>
                <parameter key="training_set_size" value="100"/>
                <parameter key="test_set_size" value="-1"/>
                <parameter key="sampling_type" value="automatic"/>
                <parameter key="use_local_random_seed" value="false"/>
                <parameter key="local_random_seed" value="1992"/>
                <!-- Training subprocess: Naive Bayes on the "training" port, model passed to the "model" sink. -->
                <process expanded="true">
                  <operator activated="true"
                            class="naive_bayes"
                            compatibility="9.1.000"
                            expanded="true"
                            height="82"
                            name="Naive Bayes"
                            width="90"
                            x="179"
                            y="34">
                    <parameter key="laplace_correction" value="true"/>
                  </operator>
                  <connect from_port="training" to_op="Naive Bayes" to_port="training set"/>
                  <connect from_op="Naive Bayes" from_port="model" to_port="model"/>
                  <portSpacing port="source_training" spacing="0"/>
                  <portSpacing port="sink_model" spacing="0"/>
                  <portSpacing port="sink_through 1" spacing="0"/>
                </process>
                <!-- Testing subprocess: apply the model to the test set, then feed the labelled data to the Weka consistency performance operator. -->
                <process expanded="true">
                  <operator activated="true"
                            class="apply_model"
                            compatibility="7.1.001"
                            expanded="true"
                            height="82"
                            name="Apply Model"
                            origin="GENERATED_TUTORIAL"
                            width="90"
                            x="45"
                            y="30">
                    <list key="application_parameters"/>
                    <parameter key="create_view" value="false"/>
                  </operator>
                  <!-- Operator class comes from the Weka extension (class prefix "weka:"). -->
                  <operator activated="true"
                            class="weka:performance_consistency"
                            compatibility="7.3.000"
                            expanded="true"
                            height="82"
                            name="Performance (2)"
                            width="90"
                            x="246"
                            y="34"/>
                  <connect from_port="model" to_op="Apply Model" to_port="model"/>
                  <connect from_port="test set" to_op="Apply Model" to_port="unlabelled data"/>
                  <connect from_op="Apply Model" from_port="labelled data" to_op="Performance (2)" to_port="example set"/>
                  <connect from_op="Performance (2)" from_port="performance" to_port="averagable 1"/>
                  <portSpacing port="source_model" spacing="0"/>
                  <portSpacing port="source_test set" spacing="0"/>
                  <portSpacing port="source_through 1" spacing="0"/>
                  <portSpacing port="sink_averagable 1" spacing="0"/>
                  <portSpacing port="sink_averagable 2" spacing="0"/>
                </process>
              </operator>
              <!-- The validation result on "averagable 1" becomes the "performance" output of the selection subprocess. -->
              <connect from_port="example set" to_op="Validation" to_port="training"/>
              <connect from_op="Validation" from_port="averagable 1" to_port="performance"/>
              <portSpacing port="source_example set" spacing="0"/>
              <portSpacing port="source_through 1" spacing="0"/>
              <portSpacing port="sink_performance" spacing="36"/>
            </process>
          </operator>
          <!-- Top-level wiring: data into the selection operator; selected example set and performance to the results. -->
          <connect from_op="Retrieve Titanic Training" from_port="output" to_op="Optimize Selection (Evolutionary)" to_port="example set in"/>
          <connect from_op="Optimize Selection (Evolutionary)" from_port="example set out" to_port="result 1"/>
          <connect from_op="Optimize Selection (Evolutionary)" from_port="performance" to_port="result 2"/>
          <portSpacing port="source_input 1" spacing="0"/>
          <portSpacing port="sink_result 1" spacing="0"/>
          <portSpacing port="sink_result 2" spacing="18"/>
          <portSpacing port="sink_result 3" spacing="0"/>
        </process>
      </operator>
    </process>


    Regards,
    Sebastian

    sgenzerLookkuyee
Sign In or Register to comment.