RapidMiner

How to combine example set in IO Object Collection

SOLVED
Contributor II

How to combine example set in IO Object Collection

I couldn't combine the example sets shown in each IO Object Collection from Loop Attributes. I tried using the Loop Collection, Remember, and Recall operators, but it did not work. The process XML is attached; I hope someone can help me with this. Thanks.

<?xml version="1.0" encoding="UTF-8"?>
<!--
  RapidMiner process (version 7.5.001) attached to the question above.

  Outline, as wired by the <connect> elements:
    1. Retrieve "Samples/data/number of tourists".
    2. Loop Values over the COUNTRY attribute (macro: loop_value). Inside each iteration:
       a. Filter Examples (4) keeps rows matching COUNTRY.equals.%{loop_value}.
       b. Set Role gives YEAR the "id" role.
       c. Loop Attributes (2) runs Differentiate (2) and then Select Attributes (3)
          for each attribute in the listed subset (macro: loop_attribute).
       d. Multiply feeds that output to Select (index 1, stored by Remember (2) as "data")
          and to Loop Collection (3).
       e. Inside Loop Collection (3), Branch tests %{iteration}==1: the first sub-process
          passes its input through; the second joins the input with the recalled "data"
          set and stores the join result under "data" again.
       f. Recall (2) returns the stored "data" set as the iteration output.

  Editorial note: the "-" tree-view markers left by the browser export were removed and
  the regular_expression value was entity-escaped so that this document is well-formed XML.
-->
<process version="7.5.001">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator name="Process" expanded="true" compatibility="7.5.001" class="process" activated="true">
    <parameter value="init" key="logverbosity"/>
    <parameter value="2001" key="random_seed"/>
    <parameter value="never" key="send_mail"/>
    <parameter value="" key="notification_email"/>
    <parameter value="30" key="process_duration_for_mail"/>
    <parameter value="SYSTEM" key="encoding"/>
    <process expanded="true">
      <operator name="Retrieve number of tourists" expanded="true" compatibility="7.5.001" class="retrieve" activated="true" y="34" x="45" width="90" height="68">
        <parameter value="Samples/data/number of tourists" key="repository_entry"/>
      </operator>
      <operator name="Loop Values" expanded="true" compatibility="7.5.001" class="loop_values" activated="true" y="34" x="179" width="90" height="82">
        <parameter value="COUNTRY" key="attribute"/>
        <parameter value="loop_value" key="iteration_macro"/>
        <process expanded="true">
          <operator name="Filter Examples (4)" expanded="true" compatibility="7.5.001" class="filter_examples" activated="true" y="34" x="45" width="90" height="103">
            <parameter value="" key="parameter_expression"/>
            <parameter value="custom_filters" key="condition_class"/>
            <parameter value="false" key="invert_filter"/>
            <list key="filters_list">
              <parameter value="COUNTRY.equals.%{loop_value}" key="filters_entry_key"/>
            </list>
            <parameter value="true" key="filters_logic_and"/>
            <parameter value="true" key="filters_check_metadata"/>
          </operator>
          <operator name="Recall (2)" expanded="true" compatibility="7.5.001" class="recall" activated="true" y="238" x="715" width="90" height="68">
            <parameter value="data" key="name"/>
            <parameter value="ExampleSet" key="io_object"/>
            <parameter value="true" key="remove_from_store"/>
          </operator>
          <operator name="Set Role" expanded="true" compatibility="7.5.001" class="set_role" activated="true" y="34" x="179" width="90" height="82">
            <parameter value="YEAR" key="attribute_name"/>
            <parameter value="id" key="target_role"/>
            <list key="set_additional_roles"/>
          </operator>
          <operator name="Loop Attributes (2)" expanded="true" compatibility="7.5.001" class="concurrency:loop_attributes" activated="true" y="34" x="313" width="90" height="82">
            <parameter value="subset" key="attribute_filter_type"/>
            <parameter value="" key="attribute"/>
            <parameter value="01-12-F|01-12-M|13-19-F|13-19-M|20-29-F|20-29-M|30-39-F|30-39-M|40-49-F|40-49-M|50-59-F|50-59-M|60-65-F|60-65-M|66-F|66-M" key="attributes"/>
            <parameter value="false" key="use_except_expression"/>
            <parameter value="attribute_value" key="value_type"/>
            <parameter value="false" key="use_value_type_exception"/>
            <parameter value="time" key="except_value_type"/>
            <parameter value="attribute_block" key="block_type"/>
            <parameter value="false" key="use_block_type_exception"/>
            <parameter value="value_matrix_row_start" key="except_block_type"/>
            <parameter value="false" key="invert_selection"/>
            <parameter value="true" key="include_special_attributes"/>
            <parameter value="loop_attribute" key="attribute_name_macro"/>
            <parameter value="false" key="reuse_results"/>
            <parameter value="true" key="enable_parallel_execution"/>
            <process expanded="true">
              <operator name="Differentiate (2)" expanded="true" compatibility="7.4.000" class="series:differentiate_example_set" activated="true" y="34" x="112" width="90" height="82">
                <parameter value="%{loop_attribute}" key="attribute_name"/>
                <parameter value="difference" key="change_mode"/>
                <parameter value="1" key="lag"/>
                <parameter value="true" key="keep_original_attribute"/>
              </operator>
              <operator name="Select Attributes (3)" expanded="true" compatibility="7.5.001" class="select_attributes" activated="true" y="34" x="246" width="90" height="82">
                <parameter value="no_missing_values" key="attribute_filter_type"/>
                <parameter value="66-F" key="attribute"/>
                <parameter value="" key="attributes"/>
                <!-- The quote, ampersand and angle brackets are entity-escaped; the parsed value is the original character class. -->
                <parameter value="[-!&quot;#$%&amp;'()*+,./:;&lt;=&gt;?@\[\\\]_`{|}~]" key="regular_expression"/>
                <parameter value="true" key="use_except_expression"/>
                <parameter value="numeric" key="value_type"/>
                <parameter value="false" key="use_value_type_exception"/>
                <parameter value="time" key="except_value_type"/>
                <parameter value="attribute_block" key="block_type"/>
                <parameter value="false" key="use_block_type_exception"/>
                <parameter value="value_matrix_row_start" key="except_block_type"/>
                <parameter value="true" key="invert_selection"/>
                <parameter value="false" key="include_special_attributes"/>
              </operator>
              <connect to_port="example set input" to_op="Differentiate (2)" from_port="input 1"/>
              <connect to_port="example set input" to_op="Select Attributes (3)" from_port="example set output" from_op="Differentiate (2)"/>
              <connect to_port="output 1" from_port="example set output" from_op="Select Attributes (3)"/>
              <portSpacing spacing="0" port="source_input 1"/>
              <portSpacing spacing="0" port="source_input 2"/>
              <portSpacing spacing="0" port="sink_output 1"/>
              <portSpacing spacing="0" port="sink_output 2"/>
            </process>
          </operator>
          <operator name="Multiply" expanded="true" compatibility="7.5.001" class="multiply" activated="true" y="85" x="447" width="90" height="103"/>
          <operator name="Loop Collection (3)" expanded="true" compatibility="7.5.001" class="loop_collection" activated="true" y="238" x="581" width="90" height="82">
            <parameter value="true" key="set_iteration_macro"/>
            <parameter value="iteration" key="macro_name"/>
            <parameter value="1" key="macro_start_value"/>
            <parameter value="false" key="unfold"/>
            <process expanded="true">
              <operator name="Branch" expanded="true" compatibility="7.5.001" class="branch" activated="true" y="34" x="246" width="90" height="82">
                <parameter value="expression" key="condition_type"/>
                <parameter value="%{iteration}==1" key="expression"/>
                <parameter value="ANOVAMatrix" key="io_object"/>
                <parameter value="true" key="return_inner_output"/>
                <!-- First sub-process: passes the condition input straight to the output. -->
                <process expanded="true">
                  <connect to_port="input 1" from_port="condition"/>
                  <portSpacing spacing="0" port="source_condition"/>
                  <portSpacing spacing="0" port="source_input 1"/>
                  <portSpacing spacing="0" port="sink_input 1"/>
                  <portSpacing spacing="0" port="sink_input 2"/>
                </process>
                <!-- Second sub-process: joins the condition input with the recalled "data" set and stores the result. -->
                <process expanded="true">
                  <operator name="Recall" expanded="true" compatibility="7.5.001" class="recall" activated="true" y="238" x="45" width="90" height="68">
                    <parameter value="data" key="name"/>
                    <parameter value="ExampleSet" key="io_object"/>
                    <parameter value="true" key="remove_from_store"/>
                  </operator>
                  <operator name="Join" expanded="true" compatibility="7.5.001" class="join" activated="true" y="34" x="112" width="90" height="82">
                    <parameter value="true" key="remove_double_attributes"/>
                    <parameter value="inner" key="join_type"/>
                    <parameter value="true" key="use_id_attribute_as_key"/>
                    <list key="key_attributes"/>
                    <parameter value="false" key="keep_both_join_attributes"/>
                  </operator>
                  <operator name="Remember" expanded="true" compatibility="7.5.001" class="remember" activated="true" y="85" x="246" width="90" height="68">
                    <parameter value="data" key="name"/>
                    <parameter value="ExampleSet" key="io_object"/>
                    <parameter value="1" key="store_which"/>
                    <parameter value="true" key="remove_from_process"/>
                  </operator>
                  <connect to_port="left" to_op="Join" from_port="condition"/>
                  <connect to_port="right" to_op="Join" from_port="result" from_op="Recall"/>
                  <connect to_port="store" to_op="Remember" from_port="join" from_op="Join"/>
                  <connect to_port="input 1" from_port="stored" from_op="Remember"/>
                  <portSpacing spacing="0" port="source_condition"/>
                  <portSpacing spacing="0" port="source_input 1"/>
                  <portSpacing spacing="0" port="sink_input 1"/>
                  <portSpacing spacing="0" port="sink_input 2"/>
                </process>
              </operator>
              <connect to_port="condition" to_op="Branch" from_port="single"/>
              <connect to_port="output 1" from_port="input 1" from_op="Branch"/>
              <portSpacing spacing="0" port="source_single"/>
              <portSpacing spacing="0" port="sink_output 1"/>
              <portSpacing spacing="0" port="sink_output 2"/>
            </process>
          </operator>
          <operator name="Select" expanded="true" compatibility="7.5.001" class="select" activated="true" y="85" x="581" width="90" height="68">
            <parameter value="1" key="index"/>
            <parameter value="false" key="unfold"/>
          </operator>
          <operator name="Remember (2)" expanded="true" compatibility="7.5.001" class="remember" activated="true" y="85" x="715" width="90" height="68">
            <parameter value="data" key="name"/>
            <parameter value="ExampleSet" key="io_object"/>
            <parameter value="1" key="store_which"/>
            <parameter value="true" key="remove_from_process"/>
          </operator>
          <connect to_port="example set input" to_op="Filter Examples (4)" from_port="example set"/>
          <connect to_port="example set input" to_op="Set Role" from_port="example set output" from_op="Filter Examples (4)"/>
          <connect to_port="out 1" from_port="result" from_op="Recall (2)"/>
          <connect to_port="input 1" to_op="Loop Attributes (2)" from_port="example set output" from_op="Set Role"/>
          <connect to_port="input" to_op="Multiply" from_port="output 1" from_op="Loop Attributes (2)"/>
          <connect to_port="collection" to_op="Select" from_port="output 1" from_op="Multiply"/>
          <connect to_port="collection" to_op="Loop Collection (3)" from_port="output 2" from_op="Multiply"/>
          <connect to_port="store" to_op="Remember (2)" from_port="selected" from_op="Select"/>
          <portSpacing spacing="0" port="source_example set"/>
          <portSpacing spacing="0" port="sink_out 1"/>
          <portSpacing spacing="0" port="sink_out 2"/>
        </process>
      </operator>
      <connect to_port="example set" to_op="Loop Values" from_port="output" from_op="Retrieve number of tourists"/>
      <connect to_port="result 1" from_port="out 1" from_op="Loop Values"/>
      <portSpacing spacing="0" port="source_input 1"/>
      <portSpacing spacing="0" port="sink_result 1"/>
      <portSpacing spacing="0" port="sink_result 2"/>
    </process>
  </operator>
</process>
2 REPLIES
Moderator
Solution
Accepted by topic author hmhsing
‎05-19-2017 06:03 AM

Re: How to combine example set in IO Object Collection

Contributor II

Re: How to combine example set in IO Object Collection

Thanks for your help. Since I used two loops (Loop Values and then Loop Attributes in the subprocess), I needed two Loop Collection operators (one with Join, the other with Append inside the loop) to combine all the example sets together. It finally works; thanks again.