🎉 🎉. RAPIDMINER 9.8 IS OUT!!! 🎉 🎉

RapidMiner 9.8 continues to innovate in data science collaboration, connectivity and governance

CLICK HERE TO DOWNLOAD

Predicting Parameter with Clustering

phonigsphonigs Member Posts: 1 Newbie
Hello Community,

I haven't found any similar question.

I am trying to build an application that can help me predict parameters for machines.
The machine performs many different processes, which have different parameters. The parameters change with the process type and with the diameters and material of the workpiece.

As a database we can use the parameters of all parts in production (about 10,000 parameter sets).
When a new piece has to be processed, all these parameters have to be created.
To start with, we have some piece and process data, such as quality, diameters, materials and some more. All this information is also included in the parameter sets.


My idea is now: all the existing parameters get clustered. The clusters should depict the processes.
Then take the data set to predict, look at which cluster the set belongs to, and then generate the missing parameters from the data in this cluster.

I have built a process from which I get some data out.
I used random clustering and Apply Model, and I got some data out which is not too bad. But the input data have changed too.

Does anyone have a better idea how I can solve this?



This is what I have got so far.
I tried to get a verification through cluster distances.


<?xml version="1.0" encoding="UTF-8"?>
<!--
  RapidMiner process (version 9.8.000).

  Restored from a browser XML tree view: the leading '-' collapse markers in
  front of container elements were removed and the unclosed <br> tags in the
  annotations were closed, so the document is well-formed again. All operator
  parameters, connections and annotation texts are unchanged.

  Wiring overview (taken from the <connect> elements below):
    * Predict_Data_Set1 is preprocessed and fanned out by "Multiply" to
      Clustering, Generate ID (2), Generate ID (3), Set Role (2) and the
      reference port of Cross Distances.
    * Parameter_Set is preprocessed the same way, gets ids, is joined with the
      id-tagged copy of the first branch and passed to Apply Model together
      with the cluster model.
    * The Apply Model output goes to result 1, Join (2) and the request port
      of Cross Distances.
    * Two Set Role / Discretize / Performance chains produce result 2 and
      result 3; Cross Distances produces result 4; result 5 is the appended
      data set.
-->
<process version="9.8.000">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator name="Process" expanded="true" compatibility="9.8.000" class="process" activated="true">
    <parameter value="init" key="logverbosity"/>
    <parameter value="2001" key="random_seed"/>
    <parameter value="never" key="send_mail"/>
    <parameter value="" key="notification_email"/>
    <parameter value="30" key="process_duration_for_mail"/>
    <parameter value="SYSTEM" key="encoding"/>
    <process expanded="true">

      <!-- Branch 1: load Predict_Data_Set1 and keep only the listed attributes. -->
      <operator name="Retrieve Predict_Data_Set1" expanded="true" compatibility="9.8.000" class="retrieve" activated="true" y="34" x="45" width="90" height="68">
        <parameter value="//Local Repository/processes/Predict_Data_Set1" key="repository_entry"/>
      </operator>
      <operator name="Select Attributes" expanded="true" compatibility="9.8.000" class="select_attributes" activated="true" y="34" x="179" width="90" height="82">
        <parameter value="subset" key="attribute_filter_type"/>
        <parameter value="" key="attribute"/>
        <parameter value="Außendurchmesser|Borddurchmesser|Druck|Eingriffsbreite|Eingriffstiefe|Form|Laufbahndurchmesser|Schleifscheibe Durchmesser|Schleifvorgang|Verschleiß WZ|Vor/Fertig|Werkstoff|Winkel|WKST Spindelgeschwindigkeit|WKZT Spindelgeschwindigkeit|Zustelltiefe" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="attribute_value" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="time" key="except_value_type"/>
        <parameter value="attribute_block" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_matrix_row_start" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
      </operator>

      <!-- Remap the values of "Schleifvorgang".
           NOTE(review): the targets are 0, 1 and 3 (2 is skipped); confirm this is intended. -->
      <operator name="Map SVG" expanded="true" compatibility="9.8.000" class="map" activated="true" y="136" x="179" width="90" height="82">
        <parameter value="single" key="attribute_filter_type"/>
        <parameter value="Schleifvorgang" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="attribute_value" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="time" key="except_value_type"/>
        <parameter value="attribute_block" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_matrix_row_start" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
        <list key="value_mappings">
          <parameter value="0" key="Laufbahn"/>
          <parameter value="1" key="Außen"/>
          <parameter value="3" key="Bord"/>
        </list>
        <parameter value="false" key="consider_regular_expressions"/>
        <parameter value="false" key="add_default_mapping"/>
      </operator>

      <!-- Remap the values of "Vor/Fertig"; both "Vor" and "Vor " (trailing space) map to 0. -->
      <operator name="Map VrFrt" expanded="true" compatibility="9.8.000" class="map" activated="true" y="238" x="179" width="90" height="82">
        <parameter value="single" key="attribute_filter_type"/>
        <parameter value="Vor/Fertig" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="attribute_value" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="time" key="except_value_type"/>
        <parameter value="attribute_block" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_matrix_row_start" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
        <list key="value_mappings">
          <parameter value="0" key="Vor"/>
          <parameter value="1" key="Fertig"/>
          <parameter value="0" key="Vor "/>
        </list>
        <parameter value="false" key="consider_regular_expressions"/>
        <parameter value="false" key="add_default_mapping"/>
      </operator>

      <!-- Remap the values of "Werkstoff". -->
      <operator name="Map WKST" expanded="true" compatibility="9.8.000" class="map" activated="true" y="340" x="179" width="90" height="82">
        <parameter value="single" key="attribute_filter_type"/>
        <parameter value="Werkstoff" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="attribute_value" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="time" key="except_value_type"/>
        <parameter value="attribute_block" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_matrix_row_start" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
        <list key="value_mappings">
          <parameter value="0" key="C6204"/>
          <parameter value="1" key="C6535"/>
          <parameter value="2" key="C6534"/>
        </list>
        <parameter value="false" key="consider_regular_expressions"/>
        <parameter value="false" key="add_default_mapping"/>
      </operator>

      <!-- Remap the values of "Form". -->
      <operator name="Map FRM" expanded="true" compatibility="9.8.000" class="map" activated="true" y="442" x="179" width="90" height="82">
        <parameter value="single" key="attribute_filter_type"/>
        <parameter value="Form" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="attribute_value" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="time" key="except_value_type"/>
        <parameter value="attribute_block" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_matrix_row_start" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
        <list key="value_mappings">
          <parameter value="0" key="Rund"/>
          <parameter value="1" key="Bilop"/>
          <parameter value="2" key="Trilop"/>
        </list>
        <parameter value="false" key="consider_regular_expressions"/>
        <parameter value="false" key="add_default_mapping"/>
      </operator>

      <!-- Dummy-code all nominal attributes, then fan the result out to five consumers. -->
      <operator name="Nominal to Numerical" expanded="true" compatibility="9.8.000" class="nominal_to_numerical" activated="true" y="442" x="313" width="90" height="103">
        <parameter value="false" key="return_preprocessing_model"/>
        <parameter value="false" key="create_view"/>
        <parameter value="all" key="attribute_filter_type"/>
        <parameter value="" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="nominal" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="file_path" key="except_value_type"/>
        <parameter value="single_value" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="single_value" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
        <parameter value="dummy coding" key="coding_type"/>
        <parameter value="false" key="use_comparison_groups"/>
        <list key="comparison_groups"/>
        <parameter value="all 0 and warning" key="unexpected_value_handling"/>
        <parameter value="false" key="use_underscore_in_name"/>
      </operator>
      <operator name="Multiply" expanded="true" compatibility="9.8.000" class="multiply" activated="true" y="493" x="447" width="90" height="166"/>

      <!-- Id-tagged copy of branch 1 that feeds the left port of Join (2). -->
      <operator name="Generate ID (3)" expanded="true" compatibility="9.8.000" class="generate_id" activated="true" y="1258" x="715" width="90" height="82">
        <parameter value="false" key="create_nominal_ids"/>
        <parameter value="0" key="offset"/>
      </operator>

      <!-- k-means with k = 70 and max_runs = 10, fitted on output 1 of Multiply.
           Only the cluster model port is connected; it is distributed by Multiply (3). -->
      <operator name="Clustering" expanded="true" compatibility="9.8.000" class="concurrency:k_means" activated="true" y="493" x="849" width="90" height="82">
        <parameter value="true" key="add_cluster_attribute"/>
        <parameter value="true" key="add_as_label"/>
        <parameter value="false" key="remove_unlabeled"/>
        <parameter value="70" key="k"/>
        <parameter value="10" key="max_runs"/>
        <parameter value="true" key="determine_good_start_values"/>
        <parameter value="BregmanDivergences" key="measure_types"/>
        <parameter value="MixedEuclideanDistance" key="mixed_measure"/>
        <parameter value="NominalDistance" key="nominal_measure"/>
        <parameter value="EuclideanDistance" key="numerical_measure"/>
        <parameter value="SquaredEuclideanDistance" key="divergence"/>
        <parameter value="radial" key="kernel_type"/>
        <parameter value="1.0" key="kernel_gamma"/>
        <parameter value="1.0" key="kernel_sigma1"/>
        <parameter value="0.0" key="kernel_sigma2"/>
        <parameter value="2.0" key="kernel_sigma3"/>
        <parameter value="3.0" key="kernel_degree"/>
        <parameter value="1.0" key="kernel_shift"/>
        <parameter value="1.0" key="kernel_a"/>
        <parameter value="0.0" key="kernel_b"/>
        <parameter value="100" key="max_optimization_steps"/>
        <parameter value="false" key="use_local_random_seed"/>
        <parameter value="1992" key="local_random_seed"/>
      </operator>
      <operator name="Multiply (3)" expanded="true" compatibility="9.8.000" class="multiply" activated="true" y="493" x="1184" width="90" height="124"/>

      <!-- Branch 2: load Parameter_Set and apply the same attribute selection,
           value mappings and dummy coding as branch 1. -->
      <operator name="Retrieve Parameter_Set" expanded="true" compatibility="9.8.000" class="retrieve" activated="true" y="748" x="45" width="90" height="68">
        <parameter value="//Local Repository/processes/Parameter_Set" key="repository_entry"/>
      </operator>
      <operator name="Select Attributes (2)" expanded="true" compatibility="9.8.000" class="select_attributes" activated="true" y="748" x="179" width="90" height="82">
        <parameter value="subset" key="attribute_filter_type"/>
        <parameter value="" key="attribute"/>
        <parameter value="Außendurchmesser|Borddurchmesser|Druck|Eingriffsbreite|Eingriffstiefe|Form|Laufbahndurchmesser|Schleifscheibe Durchmesser|Schleifvorgang|Verschleiß WZ|Vor/Fertig|Werkstoff|Winkel|WKST Spindelgeschwindigkeit|WKZT Spindelgeschwindigkeit|Zustelltiefe" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="attribute_value" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="time" key="except_value_type"/>
        <parameter value="attribute_block" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_matrix_row_start" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
      </operator>

      <!-- Same "Schleifvorgang" mapping as Map SVG.
           NOTE(review): targets are 0, 1 and 3 (2 is skipped); confirm this is intended. -->
      <operator name="Map SVG (2)" expanded="true" compatibility="9.8.000" class="map" activated="true" y="850" x="179" width="90" height="82">
        <parameter value="single" key="attribute_filter_type"/>
        <parameter value="Schleifvorgang" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="attribute_value" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="time" key="except_value_type"/>
        <parameter value="attribute_block" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_matrix_row_start" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
        <list key="value_mappings">
          <parameter value="0" key="Laufbahn"/>
          <parameter value="1" key="Außen"/>
          <parameter value="3" key="Bord"/>
        </list>
        <parameter value="false" key="consider_regular_expressions"/>
        <parameter value="false" key="add_default_mapping"/>
      </operator>
      <operator name="Map VrFrt (2)" expanded="true" compatibility="9.8.000" class="map" activated="true" y="952" x="179" width="90" height="82">
        <parameter value="single" key="attribute_filter_type"/>
        <parameter value="Vor/Fertig" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="attribute_value" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="time" key="except_value_type"/>
        <parameter value="attribute_block" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_matrix_row_start" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
        <list key="value_mappings">
          <parameter value="0" key="Vor"/>
          <parameter value="1" key="Fertig"/>
          <parameter value="0" key="Vor "/>
        </list>
        <parameter value="false" key="consider_regular_expressions"/>
        <parameter value="false" key="add_default_mapping"/>
      </operator>
      <operator name="Map WKST (2)" expanded="true" compatibility="9.8.000" class="map" activated="true" y="1054" x="179" width="90" height="82">
        <parameter value="single" key="attribute_filter_type"/>
        <parameter value="Werkstoff" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="attribute_value" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="time" key="except_value_type"/>
        <parameter value="attribute_block" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_matrix_row_start" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
        <list key="value_mappings">
          <parameter value="0" key="C6204"/>
          <parameter value="1" key="C6535"/>
          <parameter value="2" key="C6534"/>
        </list>
        <parameter value="false" key="consider_regular_expressions"/>
        <parameter value="false" key="add_default_mapping"/>
      </operator>
      <operator name="Map FRM (2)" expanded="true" compatibility="9.8.000" class="map" activated="true" y="1156" x="179" width="90" height="82">
        <parameter value="single" key="attribute_filter_type"/>
        <parameter value="Form" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="attribute_value" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="time" key="except_value_type"/>
        <parameter value="attribute_block" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_matrix_row_start" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
        <list key="value_mappings">
          <parameter value="0" key="Rund"/>
          <parameter value="1" key="Bilop"/>
          <parameter value="2" key="Trilop"/>
        </list>
        <parameter value="false" key="consider_regular_expressions"/>
        <parameter value="false" key="add_default_mapping"/>
      </operator>
      <operator name="Nominal to Numerical (2)" expanded="true" compatibility="9.8.000" class="nominal_to_numerical" activated="true" y="1156" x="380" width="90" height="103">
        <parameter value="false" key="return_preprocessing_model"/>
        <parameter value="false" key="create_view"/>
        <parameter value="all" key="attribute_filter_type"/>
        <parameter value="" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="nominal" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="file_path" key="except_value_type"/>
        <parameter value="single_value" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="single_value" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="false" key="include_special_attributes"/>
        <parameter value="dummy coding" key="coding_type"/>
        <parameter value="false" key="use_comparison_groups"/>
        <list key="comparison_groups"/>
        <parameter value="all 0 and warning" key="unexpected_value_handling"/>
        <parameter value="false" key="use_underscore_in_name"/>
      </operator>

      <!-- Prediction: "Generate ID" tags branch 2 (right side of Join) and
           "Generate ID (2)" tags output 2 of Multiply (left side of Join).
           NOTE(review): both id columns are generated independently with offset 0,
           so the right join on the id attribute presumably pairs rows of the two
           data sets by position only; confirm that this pairing is intended. -->
      <operator name="Generate ID" expanded="true" compatibility="9.8.000" class="generate_id" activated="true" y="901" x="916" width="90" height="82">
        <parameter value="false" key="create_nominal_ids"/>
        <parameter value="0" key="offset"/>
      </operator>
      <operator name="Generate ID (2)" expanded="true" compatibility="9.8.000" class="generate_id" activated="true" y="799" x="916" width="90" height="82">
        <parameter value="false" key="create_nominal_ids"/>
        <parameter value="0" key="offset"/>
      </operator>
      <operator name="Join" expanded="true" compatibility="9.8.000" class="concurrency:join" activated="true" y="850" x="1050" width="90" height="82">
        <parameter value="true" key="remove_double_attributes"/>
        <parameter value="right" key="join_type"/>
        <parameter value="true" key="use_id_attribute_as_key"/>
        <list key="key_attributes"/>
        <parameter value="false" key="keep_both_join_attributes"/>
      </operator>

      <!-- Apply the cluster model to the joined set; Multiply (2) sends the result
           to result 1, Join (2) and the request port of Cross Distances. -->
      <operator name="Apply Model" expanded="true" compatibility="9.8.000" class="apply_model" activated="true" y="850" x="1251" width="90" height="82">
        <list key="application_parameters"/>
        <parameter value="false" key="create_view"/>
      </operator>
      <operator name="Multiply (2)" expanded="true" compatibility="9.8.000" class="multiply" activated="true" y="850" x="1452" width="90" height="124"/>

      <!-- Distances between the Apply Model output (request set) and output 5 of
           Multiply (reference set); delivered as result 4. -->
      <operator name="Cross Distances" expanded="true" compatibility="9.8.000" class="cross_distances" activated="true" y="493" x="1653" width="90" height="103">
        <parameter value="MixedMeasures" key="measure_types"/>
        <parameter value="MixedEuclideanDistance" key="mixed_measure"/>
        <parameter value="NominalDistance" key="nominal_measure"/>
        <parameter value="EuclideanDistance" key="numerical_measure"/>
        <parameter value="GeneralizedIDivergence" key="divergence"/>
        <parameter value="radial" key="kernel_type"/>
        <parameter value="1.0" key="kernel_gamma"/>
        <parameter value="1.0" key="kernel_sigma1"/>
        <parameter value="0.0" key="kernel_sigma2"/>
        <parameter value="2.0" key="kernel_sigma3"/>
        <parameter value="3.0" key="kernel_degree"/>
        <parameter value="1.0" key="kernel_shift"/>
        <parameter value="1.0" key="kernel_a"/>
        <parameter value="0.0" key="kernel_b"/>
        <parameter value="false" key="only_top_k"/>
        <parameter value="10" key="k"/>
        <parameter value="nearest" key="search_for"/>
        <parameter value="false" key="compute_similarities"/>
      </operator>

      <!-- Performance test on the data set: Generate ID (3) output (left) is right-joined
           with the Apply Model output (right).
           NOTE(review): Append has only "example set 1" connected, so it presumably
           passes the joined set through unchanged; confirm whether a second input
           is missing. -->
      <operator name="Join (2)" expanded="true" compatibility="9.8.000" class="concurrency:join" activated="true" y="1258" x="849" width="90" height="82">
        <parameter value="true" key="remove_double_attributes"/>
        <parameter value="right" key="join_type"/>
        <parameter value="true" key="use_id_attribute_as_key"/>
        <list key="key_attributes"/>
        <parameter value="false" key="keep_both_join_attributes"/>
      </operator>
      <operator name="Append" expanded="true" compatibility="9.8.000" class="append" activated="true" y="1258" x="983" width="90" height="82">
        <parameter value="double_array" key="datamanagement"/>
        <parameter value="auto" key="data_management"/>
        <parameter value="all" key="merge_type"/>
      </operator>
      <operator name="Multiply (4)" expanded="true" compatibility="9.8.000" class="multiply" activated="true" y="1258" x="1117" width="90" height="103"/>
      <operator name="Set Role" expanded="true" compatibility="9.8.000" class="set_role" activated="true" y="1258" x="1251" width="90" height="82">
        <parameter value="Eingriffsbreite" key="attribute_name"/>
        <parameter value="prediction" key="target_role"/>
        <list key="set_additional_roles"/>
      </operator>
      <operator name="Discretize" expanded="true" compatibility="9.8.000" class="discretize_by_size" activated="true" y="1258" x="1385" width="90" height="103">
        <parameter value="false" key="return_preprocessing_model"/>
        <parameter value="false" key="create_view"/>
        <parameter value="regular_expression" key="attribute_filter_type"/>
        <parameter value="" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="Eingriffsbreite" key="regular_expression"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="numeric" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="real" key="except_value_type"/>
        <parameter value="value_series" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_series_end" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="true" key="include_special_attributes"/>
        <parameter value="20" key="size_of_bins"/>
        <parameter value="decreasing" key="sorting_direction"/>
        <parameter value="long" key="range_name_type"/>
        <parameter value="true" key="automatic_number_of_digits"/>
        <parameter value="-1" key="number_of_digits"/>
      </operator>
      <operator name="Performance" expanded="true" compatibility="9.8.000" class="cluster_distance_performance" activated="true" y="1258" x="1519" width="90" height="103">
        <parameter value="Avg. within centroid distance" key="main_criterion"/>
        <parameter value="false" key="main_criterion_only"/>
        <parameter value="false" key="normalize"/>
        <parameter value="false" key="maximize"/>
      </operator>

      <!-- Performance test on output 4 of Multiply.
           NOTE(review): this example set comes straight from Multiply and never passes
           through Apply Model or the clustered-set output of Clustering; confirm that
           it carries the cluster assignment Performance (2) needs. -->
      <operator name="Set Role (2)" expanded="true" compatibility="9.8.000" class="set_role" activated="true" y="1462" x="782" width="90" height="82">
        <parameter value="Eingriffsbreite" key="attribute_name"/>
        <parameter value="prediction" key="target_role"/>
        <list key="set_additional_roles"/>
      </operator>
      <operator name="Discretize (2)" expanded="true" compatibility="9.8.000" class="discretize_by_size" activated="true" y="1462" x="916" width="90" height="103">
        <parameter value="false" key="return_preprocessing_model"/>
        <parameter value="false" key="create_view"/>
        <parameter value="regular_expression" key="attribute_filter_type"/>
        <parameter value="" key="attribute"/>
        <parameter value="" key="attributes"/>
        <parameter value="Eingriffsbreite" key="regular_expression"/>
        <parameter value="false" key="use_except_expression"/>
        <parameter value="numeric" key="value_type"/>
        <parameter value="false" key="use_value_type_exception"/>
        <parameter value="real" key="except_value_type"/>
        <parameter value="value_series" key="block_type"/>
        <parameter value="false" key="use_block_type_exception"/>
        <parameter value="value_series_end" key="except_block_type"/>
        <parameter value="false" key="invert_selection"/>
        <parameter value="true" key="include_special_attributes"/>
        <parameter value="20" key="size_of_bins"/>
        <parameter value="decreasing" key="sorting_direction"/>
        <parameter value="long" key="range_name_type"/>
        <parameter value="true" key="automatic_number_of_digits"/>
        <parameter value="-1" key="number_of_digits"/>
      </operator>
      <operator name="Performance (2)" expanded="true" compatibility="9.8.000" class="cluster_distance_performance" activated="true" y="1462" x="1050" width="90" height="103">
        <parameter value="Avg. within centroid distance" key="main_criterion"/>
        <parameter value="false" key="main_criterion_only"/>
        <parameter value="false" key="normalize"/>
        <parameter value="false" key="maximize"/>
      </operator>

      <!-- Wiring between the operators above and the process result ports. -->
      <connect to_port="example set input" to_op="Select Attributes" from_port="output" from_op="Retrieve Predict_Data_Set1"/>
      <connect to_port="example set input" to_op="Map SVG" from_port="example set output" from_op="Select Attributes"/>
      <connect to_port="example set input" to_op="Map VrFrt" from_port="example set output" from_op="Map SVG"/>
      <connect to_port="example set input" to_op="Map WKST" from_port="example set output" from_op="Map VrFrt"/>
      <connect to_port="example set input" to_op="Map FRM" from_port="example set output" from_op="Map WKST"/>
      <connect to_port="example set input" to_op="Nominal to Numerical" from_port="example set output" from_op="Map FRM"/>
      <connect to_port="input" to_op="Multiply" from_port="example set output" from_op="Nominal to Numerical"/>
      <connect to_port="example set" to_op="Clustering" from_port="output 1" from_op="Multiply"/>
      <connect to_port="example set input" to_op="Generate ID (2)" from_port="output 2" from_op="Multiply"/>
      <connect to_port="example set input" to_op="Generate ID (3)" from_port="output 3" from_op="Multiply"/>
      <connect to_port="example set input" to_op="Set Role (2)" from_port="output 4" from_op="Multiply"/>
      <connect to_port="reference set" to_op="Cross Distances" from_port="output 5" from_op="Multiply"/>
      <connect to_port="left" to_op="Join (2)" from_port="example set output" from_op="Generate ID (3)"/>
      <connect to_port="input" to_op="Multiply (3)" from_port="cluster model" from_op="Clustering"/>
      <connect to_port="model" to_op="Apply Model" from_port="output 1" from_op="Multiply (3)"/>
      <connect to_port="cluster model" to_op="Performance (2)" from_port="output 2" from_op="Multiply (3)"/>
      <connect to_port="cluster model" to_op="Performance" from_port="output 3" from_op="Multiply (3)"/>
      <connect to_port="example set input" to_op="Select Attributes (2)" from_port="output" from_op="Retrieve Parameter_Set"/>
      <connect to_port="example set input" to_op="Map SVG (2)" from_port="example set output" from_op="Select Attributes (2)"/>
      <connect to_port="example set input" to_op="Map VrFrt (2)" from_port="example set output" from_op="Map SVG (2)"/>
      <connect to_port="example set input" to_op="Map WKST (2)" from_port="example set output" from_op="Map VrFrt (2)"/>
      <connect to_port="example set input" to_op="Map FRM (2)" from_port="example set output" from_op="Map WKST (2)"/>
      <connect to_port="example set input" to_op="Nominal to Numerical (2)" from_port="example set output" from_op="Map FRM (2)"/>
      <connect to_port="example set input" to_op="Generate ID" from_port="example set output" from_op="Nominal to Numerical (2)"/>
      <connect to_port="right" to_op="Join" from_port="example set output" from_op="Generate ID"/>
      <connect to_port="left" to_op="Join" from_port="example set output" from_op="Generate ID (2)"/>
      <connect to_port="unlabelled data" to_op="Apply Model" from_port="join" from_op="Join"/>
      <connect to_port="input" to_op="Multiply (2)" from_port="labelled data" from_op="Apply Model"/>
      <connect to_port="result 1" from_port="output 1" from_op="Multiply (2)"/>
      <connect to_port="right" to_op="Join (2)" from_port="output 2" from_op="Multiply (2)"/>
      <connect to_port="request set" to_op="Cross Distances" from_port="output 3" from_op="Multiply (2)"/>
      <connect to_port="result 4" from_port="result set" from_op="Cross Distances"/>
      <connect to_port="example set 1" to_op="Append" from_port="join" from_op="Join (2)"/>
      <connect to_port="input" to_op="Multiply (4)" from_port="merged set" from_op="Append"/>
      <connect to_port="example set input" to_op="Set Role" from_port="output 1" from_op="Multiply (4)"/>
      <connect to_port="result 5" from_port="output 2" from_op="Multiply (4)"/>
      <connect to_port="example set input" to_op="Discretize" from_port="example set output" from_op="Set Role"/>
      <connect to_port="example set" to_op="Performance" from_port="example set output" from_op="Discretize"/>
      <connect to_port="result 2" from_port="performance" from_op="Performance"/>
      <connect to_port="example set input" to_op="Discretize (2)" from_port="example set output" from_op="Set Role (2)"/>
      <connect to_port="example set" to_op="Performance (2)" from_port="example set output" from_op="Discretize (2)"/>
      <connect to_port="result 3" from_port="performance" from_op="Performance (2)"/>
      <portSpacing spacing="0" port="source_input 1"/>
      <portSpacing spacing="0" port="sink_result 1"/>
      <portSpacing spacing="0" port="sink_result 2"/>
      <portSpacing spacing="0" port="sink_result 3"/>
      <portSpacing spacing="0" port="sink_result 4"/>
      <portSpacing spacing="0" port="sink_result 5"/>
      <portSpacing spacing="0" port="sink_result 6"/>

      <!-- Canvas annotations. They hold text content, so each stays on a single line. -->
      <description y="700" x="10" width="562" height="638" resized="true" colored="false" color="yellow" align="right">Input Predictiondata</description>
      <description y="10" x="10" width="563" height="687" resized="true" colored="true" color="purple" align="right">Input 1 Basicdata/ Learningdata</description>
      <description y="1424" x="581" width="1175" height="262" resized="true" colored="true" color="blue" align="right">Performancetest Prediction</description>
      <description y="1162" x="582" width="1175" height="257" resized="true" colored="true" color="gray" align="right">Perfomancetest Dataset<br/></description>
      <description y="696" x="582" width="1172" height="454" resized="true" colored="true" color="red" align="right">Prediction<br/></description>
      <description y="434" x="585" width="976" height="256" resized="true" colored="true" color="green" align="right">Training Data<br/></description>
      <description y="434" x="1576" width="176" height="250" resized="true" colored="true" color="orange" align="center">Validation data</description>
    </process>
  </operator>
</process>

Answers

  • mschmitzmschmitz Administrator, Moderator, Employee, RapidMiner Certified Analyst, RapidMiner Certified Expert, University Professor Posts: 2,822  RM Data Scientist
    the process you posted here is malformatted. Please use the code (and spoiler) option to post it.

    Use case wise: I would strongly recommend rethinking the idea of clustering here. You can of course do it. In this case you would do something like: What did other people do in this situation? And recommend this setting.

    What one often does is to predict the quality for given parameters and inputs. You can then try to optimize the settings of your machine to get optimal quality under given properties.

    Cheers,
    Martin
    - Head of Data Science Services at RapidMiner -
    Dortmund, Germany
Sign In or Register to comment.