How to apply batch model to non batched data in rapidminer - batch-processing

I have created a model using batched validation. Is there a way to apply this model to non-batched data?
Here is the sample process I created:
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process: Retrieve distmodel3, Set Role, Validation (batch_x_validation), Write Model.
  The training side of the validation uses k-NN (the W-J48 operator is deactivated);
  the testing side applies the model and computes classification performance.
-->
<process version="7.0.001">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="7.0.001" expanded="true" name="Process">
    <parameter key="logverbosity" value="init"/>
    <parameter key="random_seed" value="2001"/>
    <parameter key="send_mail" value="never"/>
    <parameter key="notification_email" value=""/>
    <parameter key="process_duration_for_mail" value="30"/>
    <parameter key="encoding" value="SYSTEM"/>
    <process expanded="true">
      <operator activated="true" class="retrieve" compatibility="7.0.001" expanded="true" height="68" name="Retrieve distmodel3" width="90" x="45" y="136">
        <parameter key="repository_entry" value="../data/distmodel3"/>
      </operator>
      <!--
        Role assignment: "Letter" is the label, "Feat1".."Feat8" and "Gender" are regular attributes.
        NOTE(review): both "batchid" and "Frame" are given the "batch" role here; confirm which
        attribute is meant to drive the batch split.
      -->
      <operator activated="true" class="set_role" compatibility="7.0.001" expanded="true" height="82" name="Set Role" width="90" x="246" y="187">
        <parameter key="attribute_name" value="batchid"/>
        <parameter key="target_role" value="batch"/>
        <list key="set_additional_roles">
          <parameter key="Letter" value="label"/>
          <parameter key="Frame" value="batch"/>
          <parameter key="Feat1" value="regular"/>
          <parameter key="Feat2" value="regular"/>
          <parameter key="Feat3" value="regular"/>
          <parameter key="Feat4" value="regular"/>
          <parameter key="Feat5" value="regular"/>
          <parameter key="Feat6" value="regular"/>
          <parameter key="Feat7" value="regular"/>
          <parameter key="Feat8" value="regular"/>
          <parameter key="Gender" value="regular"/>
        </list>
      </operator>
      <operator activated="true" class="batch_x_validation" compatibility="7.0.001" expanded="true" height="124" name="Validation" width="90" x="380" y="85">
        <parameter key="create_complete_model" value="false"/>
        <parameter key="average_performances_only" value="true"/>
        <!-- Training subprocess: only k-NN is connected; W-J48 is present but deactivated. -->
        <process expanded="true">
          <operator activated="false" class="weka:W-J48" compatibility="7.0.000" expanded="true" height="82" name="W-J48" width="90" x="112" y="34">
            <parameter key="U" value="true"/>
            <parameter key="C" value="0.25"/>
            <parameter key="M" value="2.0"/>
            <parameter key="R" value="false"/>
            <parameter key="B" value="true"/>
            <parameter key="S" value="false"/>
            <parameter key="L" value="false"/>
            <parameter key="A" value="false"/>
          </operator>
          <operator activated="true" class="k_nn" compatibility="7.0.001" expanded="true" height="82" name="k-NN" width="90" x="112" y="187">
            <parameter key="k" value="3"/>
            <parameter key="weighted_vote" value="false"/>
            <parameter key="measure_types" value="MixedMeasures"/>
            <parameter key="mixed_measure" value="MixedEuclideanDistance"/>
            <parameter key="nominal_measure" value="NominalDistance"/>
            <parameter key="numerical_measure" value="EuclideanDistance"/>
            <parameter key="divergence" value="GeneralizedIDivergence"/>
            <parameter key="kernel_type" value="radial"/>
            <parameter key="kernel_gamma" value="1.0"/>
            <parameter key="kernel_sigma1" value="1.0"/>
            <parameter key="kernel_sigma2" value="0.0"/>
            <parameter key="kernel_sigma3" value="2.0"/>
            <parameter key="kernel_degree" value="3.0"/>
            <parameter key="kernel_shift" value="1.0"/>
            <parameter key="kernel_a" value="1.0"/>
            <parameter key="kernel_b" value="0.0"/>
          </operator>
          <connect from_port="training" to_op="k-NN" to_port="training set"/>
          <connect from_op="k-NN" from_port="model" to_port="model"/>
          <portSpacing port="source_training" spacing="0"/>
          <portSpacing port="sink_model" spacing="0"/>
          <portSpacing port="sink_through 1" spacing="0"/>
        </process>
        <!-- Testing subprocess: apply the model to the test set and measure classification performance. -->
        <process expanded="true">
          <operator activated="true" class="apply_model" compatibility="7.0.001" expanded="true" height="82" name="Apply Model" width="90" x="45" y="34">
            <list key="application_parameters"/>
            <parameter key="create_view" value="false"/>
          </operator>
          <operator activated="true" class="performance_classification" compatibility="7.0.001" expanded="true" height="82" name="Performance" width="90" x="179" y="34">
            <parameter key="main_criterion" value="first"/>
            <parameter key="accuracy" value="true"/>
            <parameter key="classification_error" value="true"/>
            <parameter key="kappa" value="true"/>
            <parameter key="weighted_mean_recall" value="false"/>
            <parameter key="weighted_mean_precision" value="false"/>
            <parameter key="spearman_rho" value="false"/>
            <parameter key="kendall_tau" value="false"/>
            <parameter key="absolute_error" value="false"/>
            <parameter key="relative_error" value="false"/>
            <parameter key="relative_error_lenient" value="false"/>
            <parameter key="relative_error_strict" value="false"/>
            <parameter key="normalized_absolute_error" value="false"/>
            <parameter key="root_mean_squared_error" value="false"/>
            <parameter key="root_relative_squared_error" value="false"/>
            <parameter key="squared_error" value="false"/>
            <parameter key="correlation" value="false"/>
            <parameter key="squared_correlation" value="false"/>
            <parameter key="cross-entropy" value="false"/>
            <parameter key="margin" value="false"/>
            <parameter key="soft_margin_loss" value="false"/>
            <parameter key="logistic_loss" value="false"/>
            <parameter key="skip_undefined_labels" value="true"/>
            <parameter key="use_example_weights" value="true"/>
            <list key="class_weights"/>
          </operator>
          <connect from_port="model" to_op="Apply Model" to_port="model"/>
          <connect from_port="test set" to_op="Apply Model" to_port="unlabelled data"/>
          <connect from_op="Apply Model" from_port="labelled data" to_op="Performance" to_port="labelled data"/>
          <connect from_op="Performance" from_port="performance" to_port="averagable 1"/>
          <portSpacing port="source_model" spacing="0"/>
          <portSpacing port="source_test set" spacing="0"/>
          <portSpacing port="source_through 1" spacing="0"/>
          <portSpacing port="sink_averagable 1" spacing="0"/>
          <portSpacing port="sink_averagable 2" spacing="0"/>
        </process>
      </operator>
      <!-- The model output of the Validation operator is written to a local file. -->
      <operator activated="true" class="legacy:write_model" compatibility="7.0.001" expanded="true" height="68" name="Write Model" width="90" x="514" y="187">
        <parameter key="model_file" value="C:\Users\Hans\Documents\ModelFile.mod"/>
        <parameter key="overwrite_existing_file" value="true"/>
        <parameter key="output_type" value="XML Zipped"/>
      </operator>
      <connect from_op="Retrieve distmodel3" from_port="output" to_op="Set Role" to_port="example set input"/>
      <connect from_op="Set Role" from_port="example set output" to_op="Validation" to_port="training"/>
      <connect from_op="Validation" from_port="model" to_op="Write Model" to_port="input"/>
      <connect from_op="Validation" from_port="training" to_port="result 1"/>
      <connect from_op="Validation" from_port="averagable 1" to_port="result 2"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
      <portSpacing port="sink_result 3" spacing="0"/>
    </process>
  </operator>
</process>
///////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////////

The Batch Validation operator uses an attribute to split the training example set. Because this attribute is explicitly given the batch role, it is a special attribute, which means it is not used when building the model; classification models use only regular attributes to predict a class label. The model should therefore work on an example set that does not contain an attribute with the batch role. If the model is applied to an example set in which the batch attribute has been set to the regular role, the outcome depends on the model type: the prediction may simply not depend on that attribute, or the model may not work at all.

Related

How to choose testcases available in testng.xml to execute from jenkins UI

I want to run one or more of the testcases listed in my testng.xml file from the Jenkins UI.
In my testng file there are only three testcases, and I have distributed them across different OSes and browsers.
Below is the testng.xml code
<!-- Chrome_Browser on Mac OS: one test entry per test-case class (Testcase1..Testcase3) -->
<test name="ChromeMacTestcase1" preserve-order="true">
  <parameter name="browser" value="chrome"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Mac OS X 10.9"/>
  <classes>
    <class name="com.testCases.Testcase1"/>
  </classes>
</test>
<test name="ChromeMacTestcase2" preserve-order="true">
  <parameter name="browser" value="chrome"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Mac OS X 10.9"/>
  <classes>
    <class name="com.testCases.Testcase2"/>
  </classes>
</test>
<test name="ChromeMacTestcase3" preserve-order="true">
  <parameter name="browser" value="chrome"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Mac OS X 10.9"/>
  <classes>
    <class name="com.testCases.Testcase3"/>
  </classes>
</test>
<!-- Chrome_Browser on Windows OS: one test entry per test-case class (Testcase1..Testcase3) -->
<test name="ChromeWinTestcase1" preserve-order="true">
  <parameter name="browser" value="chrome"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Windows 10"/>
  <classes>
    <class name="com.testCases.Testcase1"/>
  </classes>
</test>
<test name="ChromeWinTestcase2" preserve-order="true">
  <parameter name="browser" value="chrome"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Windows 10"/>
  <classes>
    <class name="com.testCases.Testcase2"/>
  </classes>
</test>
<test name="ChromeWinTestcase3" preserve-order="true">
  <parameter name="browser" value="chrome"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Windows 10"/>
  <classes>
    <class name="com.testCases.Testcase3"/>
  </classes>
</test>
<!--
  Firefox_Browser on Mac OS: one test entry per test-case class (Testcase1..Testcase3).
  The "browser" parameter is "firefox" so these tests do not repeat the Chrome runs.
  NOTE(review): "version" is still 54 as in the Chrome tests; confirm the intended Firefox version.
-->
<test name="FirefoxMacTestcase1" preserve-order="true">
  <parameter name="browser" value="firefox"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Mac OS X 10.9"/>
  <classes>
    <class name="com.testCases.Testcase1"/>
  </classes>
</test>
<test name="FirefoxMacTestcase2" preserve-order="true">
  <parameter name="browser" value="firefox"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Mac OS X 10.9"/>
  <classes>
    <class name="com.testCases.Testcase2"/>
  </classes>
</test>
<test name="FirefoxMacTestcase3" preserve-order="true">
  <parameter name="browser" value="firefox"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Mac OS X 10.9"/>
  <classes>
    <class name="com.testCases.Testcase3"/>
  </classes>
</test>
<!--
  Firefox_Browser on Windows OS: one test entry per test-case class (Testcase1..Testcase3).
  The "browser" parameter is "firefox" so these tests do not repeat the Chrome runs.
  NOTE(review): "version" is still 54 as in the Chrome tests; confirm the intended Firefox version.
-->
<test name="FirefoxWinTestcase1" preserve-order="true">
  <parameter name="browser" value="firefox"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Windows 10"/>
  <classes>
    <class name="com.testCases.Testcase1"/>
  </classes>
</test>
<test name="FirefoxWinTestcase2" preserve-order="true">
  <parameter name="browser" value="firefox"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Windows 10"/>
  <classes>
    <class name="com.testCases.Testcase2"/>
  </classes>
</test>
<test name="FirefoxWinTestcase3" preserve-order="true">
  <parameter name="browser" value="firefox"/>
  <parameter name="version" value="54"/>
  <parameter name="platform" value="Windows 10"/>
  <classes>
    <class name="com.testCases.Testcase3"/>
  </classes>
</test>
Basically the following things I want to perform from jenkins UI.
First I want to select Browser and OS.
Second I want to run all the testcases based on selected browser and OS
Third, I want to run only two testcases (Testcase1 and Testcase2) based on the selected browser and OS.
How to pass these parameters from Jenkins to testng.xml and run the testcases as per selected options from Jenkins UI?

OrientDB Cluster Configuration Using VM

I am trying to form an OrientDB cluster with orientdb-enterprise-2.2.3, using VMs hosted on a local server. The VMs run Fedora 18. I have attached the orientdb-server-config.xml and hazelcast.xml files.
orientdb-server-config.xml
<?xml version="1.0" encoding="UTF-8" standalone="yes"?>
<!-- OrientDB server configuration: plugin handlers, network sockets/protocols/listeners, users, properties. -->
<orient-server>
  <!-- Server plugins; the Hazelcast (distributed) plugin is switched on through the ${distributed} variable. -->
  <handlers>
    <handler class="com.orientechnologies.orient.graph.handler.OGraphServerHandler">
      <parameters>
        <parameter value="true" name="enabled"/>
        <parameter value="50" name="graph.pool.max"/>
      </parameters>
    </handler>
    <handler class="com.orientechnologies.orient.server.hazelcast.OHazelcastPlugin">
      <parameters>
        <parameter value="${distributed}" name="enabled"/>
        <parameter value="${ORIENTDB_HOME}/config/default-distributed-db-config.json" name="configuration.db.default"/>
        <parameter value="${ORIENTDB_HOME}/config/hazelcast.xml" name="configuration.hazelcast"/>
      </parameters>
    </handler>
    <handler class="com.orientechnologies.orient.server.handler.OJMXPlugin">
      <parameters>
        <parameter value="false" name="enabled"/>
        <parameter value="true" name="profilerManaged"/>
      </parameters>
    </handler>
    <handler class="com.orientechnologies.orient.server.handler.OAutomaticBackup">
      <parameters>
        <parameter value="false" name="enabled"/>
        <parameter value="${ORIENTDB_HOME}/config/automatic-backup.json" name="config"/>
      </parameters>
    </handler>
    <handler class="com.orientechnologies.orient.server.handler.OServerSideScriptInterpreter">
      <parameters>
        <parameter value="true" name="enabled"/>
        <parameter value="SQL" name="allowedLanguages"/>
      </parameters>
    </handler>
  </handlers>
  <network>
    <!-- TLS socket factories named "ssl" and "https"; the listeners below reference socket="default". -->
    <sockets>
      <socket implementation="com.orientechnologies.orient.server.network.OServerTLSSocketFactory" name="ssl">
        <parameters>
          <parameter value="false" name="network.ssl.clientAuth"/>
          <parameter value="config/cert/orientdb.ks" name="network.ssl.keyStore"/>
          <parameter value="password" name="network.ssl.keyStorePassword"/>
          <parameter value="config/cert/orientdb.ks" name="network.ssl.trustStore"/>
          <parameter value="password" name="network.ssl.trustStorePassword"/>
        </parameters>
      </socket>
      <socket implementation="com.orientechnologies.orient.server.network.OServerTLSSocketFactory" name="https">
        <parameters>
          <parameter value="false" name="network.ssl.clientAuth"/>
          <parameter value="config/cert/orientdb.ks" name="network.ssl.keyStore"/>
          <parameter value="password" name="network.ssl.keyStorePassword"/>
          <parameter value="config/cert/orientdb.ks" name="network.ssl.trustStore"/>
          <parameter value="password" name="network.ssl.trustStorePassword"/>
        </parameters>
      </socket>
    </sockets>
    <protocols>
      <protocol implementation="com.orientechnologies.orient.server.network.protocol.binary.ONetworkProtocolBinary" name="binary"/>
      <protocol implementation="com.orientechnologies.orient.server.network.protocol.http.ONetworkProtocolHttpDb" name="http"/>
    </protocols>
    <!-- Binary listener on ports 2424-2430 and HTTP listener on ports 2480-2490, both bound to 0.0.0.0. -->
    <listeners>
      <listener protocol="binary" socket="default" port-range="2424-2430" ip-address="0.0.0.0"/>
      <listener protocol="http" socket="default" port-range="2480-2490" ip-address="0.0.0.0">
        <commands>
          <command implementation="com.orientechnologies.orient.server.network.protocol.http.command.get.OServerCommandGetStaticContent"
                   pattern="GET|www GET|studio/ GET| GET|*.htm GET|*.html GET|*.xml GET|*.jpeg GET|*.jpg GET|*.png GET|*.gif GET|*.js GET|*.css GET|*.swf GET|*.ico GET|*.txt GET|*.otf GET|*.pjs GET|*.svg GET|*.json GET|*.woff GET|*.woff2 GET|*.ttf GET|*.svgz"
                   stateful="false">
            <parameters>
              <entry value="Cache-Control: no-cache, no-store, max-age=0, must-revalidate\r\nPragma: no-cache" name="http.cache:*.htm *.html"/>
              <entry value="Cache-Control: max-age=120" name="http.cache:default"/>
            </parameters>
          </command>
          <command implementation="com.orientechnologies.orient.graph.server.command.OServerCommandGetGephi" pattern="GET|gephi/*" stateful="false"/>
        </commands>
        <parameters>
          <parameter value="utf-8" name="network.http.charset"/>
          <parameter value="true" name="network.http.jsonResponseError"/>
        </parameters>
      </listener>
    </listeners>
  </network>
  <storages/>
  <!-- Server users; passwords are stored here in plain text. -->
  <users>
    <user resources="*" password="root" name="root"/>
    <user resources="connect,server.listDatabases,server.dblist" password="guest" name="guest"/>
  </users>
  <properties>
    <entry value="1" name="db.pool.min"/>
    <entry value="50" name="db.pool.max"/>
    <entry value="true" name="profiler.enabled"/>
  </properties>
  <isAfterFirstTime>true</isAfterFirstTime>
</orient-server>
hazelcast.xml
<?xml version="1.0" encoding="UTF-8"?>
<!-- Hazelcast cluster configuration: group credentials, multicast-based join, executor pool size. -->
<hazelcast xsi:schemaLocation="http://www.hazelcast.com/schema/config hazelcast-config-3.3.xsd"
           xmlns="http://www.hazelcast.com/schema/config"
           xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
  <group>
    <name>orientdb</name>
    <password>orientdb</password>
  </group>
  <network>
    <!-- Starts at port 2434 with auto-increment enabled. -->
    <port auto-increment="true">2434</port>
    <join>
      <!-- Node discovery via multicast group 235.1.1.1 on port 2434. -->
      <multicast enabled="true">
        <multicast-group>235.1.1.1</multicast-group>
        <multicast-port>2434</multicast-port>
      </multicast>
    </join>
  </network>
  <executor-service>
    <pool-size>16</pool-size>
  </executor-service>
</hazelcast>
But the two nodes are not getting connected in the cluster. I am trying the multicast join for clustering. The individual servers are working fine.
What might be the issue with the multicast clustering?
Hi Deep Mistry, check your iptables firewall configuration, as the ports might be blocked by the firewall.

WSO2 ESB 4.7.0 UI does not allow editing any further after a JMS consumer is created

I have the following JMS consumer proxy service defined:
<proxy xmlns="http://ws.apache.org/ns/synapse"
       name="DefiDealerProxy"
       transports="jms"
       statistics="enable"
       trace="enable"
       startOnLoad="true">
  <!-- JMS consumer proxy: durable topic subscription filtered by a message selector; the in-sequence only sets OUT_ONLY. -->
  <target>
    <inSequence>
      <property name="OUT_ONLY" value="true" scope="default" type="STRING"/>
    </inSequence>
  </target>
  <parameter name="transport.jms.ConnectionFactory">myTopicConnectionFactory</parameter>
  <parameter name="transport.jms.Destination">activemq.topic.sync</parameter>
  <parameter name="transport.jms.DestinationType">topic</parameter>
  <parameter name="transport.jms.MessageSelector">ACTION = 'Save' AND ENTITY = 'dealer'</parameter>
  <parameter name="transport.jms.SubscriptionDurable">true</parameter>
  <parameter name="transport.jms.DurableSubscriberName">My Subscriber</parameter>
  <parameter name="transport.jms.ContentType">
    <rules>
      <jmsProperty>contentType</jmsProperty>
      <default>application/xml</default>
    </rules>
  </parameter>
</proxy>
And here is my axis2.xml configuration:
<!-- JMS transport listener with three ActiveMQ connection factories: a topic factory, a queue factory, and the default (queue). -->
<transportReceiver name="jms" class="org.apache.axis2.transport.jms.JMSListener">
  <!-- Topic connection factory referenced by name from proxy services. -->
  <parameter name="myTopicConnectionFactory" locked="false">
    <parameter name="java.naming.factory.initial" locked="false">org.apache.activemq.jndi.ActiveMQInitialContextFactory</parameter>
    <parameter name="java.naming.provider.url" locked="false">failover:tcp://localhost:61616</parameter>
    <parameter name="transport.jms.UserName">user</parameter>
    <parameter name="transport.jms.Password">password</parameter>
    <parameter name="transport.jms.ConnectionFactoryJNDIName" locked="false">TopicConnectionFactory</parameter>
    <parameter name="transport.jms.ConnectionFactoryType" locked="false">topic</parameter>
    <parameter name="transport.jms.DurableSubscriberClientID" locked="false">myHomePC</parameter>
  </parameter>
  <!-- Queue connection factory. -->
  <parameter name="myQueueConnectionFactory" locked="false">
    <parameter name="java.naming.factory.initial" locked="false">org.apache.activemq.jndi.ActiveMQInitialContextFactory</parameter>
    <parameter name="java.naming.provider.url" locked="false">failover:tcp://localhost:61616</parameter>
    <parameter name="transport.jms.UserName">user</parameter>
    <parameter name="transport.jms.Password">password</parameter>
    <parameter name="transport.jms.ConnectionFactoryJNDIName" locked="false">QueueConnectionFactory</parameter>
    <parameter name="transport.jms.ConnectionFactoryType" locked="false">queue</parameter>
    <parameter name="transport.jms.DurableSubscriberClientID" locked="false">myHomePC</parameter>
  </parameter>
  <!-- Factory named "default"; same settings as the queue factory above. -->
  <parameter name="default" locked="false">
    <parameter name="java.naming.factory.initial" locked="false">org.apache.activemq.jndi.ActiveMQInitialContextFactory</parameter>
    <parameter name="java.naming.provider.url" locked="false">failover:tcp://localhost:61616</parameter>
    <parameter name="transport.jms.UserName">user</parameter>
    <parameter name="transport.jms.Password">password</parameter>
    <parameter name="transport.jms.ConnectionFactoryJNDIName" locked="false">QueueConnectionFactory</parameter>
    <parameter name="transport.jms.ConnectionFactoryType" locked="false">queue</parameter>
    <parameter name="transport.jms.DurableSubscriberClientID" locked="false">myHomePC</parameter>
  </parameter>
</transportReceiver>
Once I create the proxy service in source mode and save it, it successfully connects to the ActiveMQ broker and receives messages as expected. However, I cannot edit the proxy service again in design or source mode, as the UI completely changes upon clicking the Edit button. I have been facing this issue in ESB 4.6 and 4.7. Has anyone else faced this issue? Any help will be appreciated.
It seems that the single quotes inside the <parameter name="transport.jms.MessageSelector">ACTION = 'Save' AND ENTITY = 'dealer'</parameter> line are causing the issue.
I was able to get an editable proxy service using the following configuration.
<proxy xmlns="http://ws.apache.org/ns/synapse" name="DefiDealerProxy" transports="jms" statistics="enable" trace="enable" startOnLoad="true">
  <!--
    Variant of the JMS consumer proxy without single quotes in the message selector.
    NOTE(review): in JMS selector syntax string literals are normally single-quoted; the unquoted
    Save and dealer are presumably parsed as identifiers. Confirm the selector still matches the
    intended messages.
    NOTE(review): transport.jms.SubscriptionDurable is not set here, although DurableSubscriberName
    is. Confirm whether the subscription is still meant to be durable.
  -->
  <target>
    <inSequence>
      <property name="OUT_ONLY" value="true" scope="default" type="STRING"/>
    </inSequence>
  </target>
  <parameter name="transport.jms.ContentType">
    <rules>
      <jmsProperty>contentType</jmsProperty>
      <default>application/xml</default>
    </rules>
  </parameter>
  <parameter name="transport.jms.MessageSelector">ACTION=Save AND ENTITY = dealer</parameter>
  <parameter name="transport.jms.ConnectionFactory">myTopicConnectionFactory</parameter>
  <parameter name="transport.jms.DestinationType">topic</parameter>
  <parameter name="transport.jms.Destination">activemq.topic.sync</parameter>
  <parameter name="transport.jms.DurableSubscriberName">My Subscriber</parameter>
  <description/>
</proxy>

RapidMiner : Where/how is the Store (Model) operator connected in this process flow

I have created a process flow within RapidMiner that utilizes some loops. I'm not exactly sure where my Store Model operator should be connected in order to save the model parameters derived through this process so that they can be used in a new process.
The attached example has my data replaced with some sample data, however the rest of the process is what I have for my actual data set.
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process: the Sonar sample data goes through a preprocessing chain (Numerical to Binominal,
  Set Role, Normalize, Nominal to Numerical, Replace Missing Values, ICA) and then into Forward Selection,
  which wraps a 5-fold X-Validation around Naive Bayes.
-->
<process version="5.3.012">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="5.3.012" expanded="true" name="Process">
    <process expanded="true">
      <!-- Data loading and preprocessing chain. -->
      <operator activated="true" class="retrieve" compatibility="5.3.012" expanded="true" height="60" name="Retrieve Sonar" width="90" x="45" y="30">
        <parameter key="repository_entry" value="//Samples/data/Sonar"/>
      </operator>
      <operator activated="true" class="numerical_to_binominal" compatibility="5.3.012" expanded="true" height="76" name="Numerical to Binominal" width="90" x="179" y="30">
        <parameter key="attribute_filter_type" value="single"/>
        <parameter key="attribute" value="20_OV_COVER"/>
      </operator>
      <operator activated="true" class="set_role" compatibility="5.3.012" expanded="true" height="76" name="Set Role" width="90" x="45" y="120">
        <parameter key="attribute_name" value="class"/>
        <parameter key="target_role" value="label"/>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="normalize" compatibility="5.3.012" expanded="true" height="94" name="Normalize" width="90" x="179" y="120"/>
      <operator activated="true" class="nominal_to_numerical" compatibility="5.3.012" expanded="true" height="94" name="Nominal to Numerical (2)" width="90" x="45" y="210">
        <list key="comparison_groups"/>
      </operator>
      <operator activated="true" class="replace_missing_values" compatibility="5.3.012" expanded="true" height="94" name="Replace Missing Values" width="90" x="179" y="210">
        <list key="columns"/>
      </operator>
      <operator activated="true" class="independent_component_analysis" compatibility="5.3.012" expanded="true" height="94" name="ICA" width="90" x="313" y="210">
        <parameter key="number_of_components" value="700"/>
      </operator>
      <!-- Feature selection: each candidate attribute set is scored by the nested validation. -->
      <operator activated="true" class="optimize_selection_forward" compatibility="5.3.012" expanded="true" height="94" name="Forward Selection" width="90" x="514" y="75">
        <parameter key="maximal_number_of_attributes" value="100"/>
        <parameter key="speculative_rounds" value="10"/>
        <process expanded="true">
          <operator activated="true" class="x_validation" compatibility="5.3.012" expanded="true" height="112" name="Validation" width="90" x="112" y="30">
            <parameter key="number_of_validations" value="5"/>
            <!-- Training subprocess: Naive Bayes learner. -->
            <process expanded="true">
              <operator activated="true" class="naive_bayes" compatibility="5.3.012" expanded="true" height="76" name="Naive Bayes" width="90" x="112" y="30"/>
              <connect from_port="training" to_op="Naive Bayes" to_port="training set"/>
              <connect from_op="Naive Bayes" from_port="model" to_port="model"/>
              <portSpacing port="source_training" spacing="0"/>
              <portSpacing port="sink_model" spacing="0"/>
              <portSpacing port="sink_through 1" spacing="0"/>
            </process>
            <!-- Testing subprocess: apply the model and compute performance. -->
            <process expanded="true">
              <operator activated="true" class="apply_model" compatibility="5.3.012" expanded="true" height="76" name="Apply Model" width="90" x="45" y="30">
                <list key="application_parameters"/>
              </operator>
              <operator activated="true" class="performance" compatibility="5.3.012" expanded="true" height="76" name="Performance" width="90" x="276" y="30"/>
              <connect from_port="model" to_op="Apply Model" to_port="model"/>
              <connect from_port="test set" to_op="Apply Model" to_port="unlabelled data"/>
              <connect from_op="Apply Model" from_port="labelled data" to_op="Performance" to_port="labelled data"/>
              <connect from_op="Performance" from_port="performance" to_port="averagable 1"/>
              <portSpacing port="source_model" spacing="0"/>
              <portSpacing port="source_test set" spacing="0"/>
              <portSpacing port="source_through 1" spacing="0"/>
              <portSpacing port="sink_averagable 1" spacing="0"/>
              <portSpacing port="sink_averagable 2" spacing="0"/>
            </process>
          </operator>
          <connect from_port="example set" to_op="Validation" to_port="training"/>
          <connect from_op="Validation" from_port="averagable 1" to_port="performance"/>
          <portSpacing port="source_example set" spacing="0"/>
          <portSpacing port="sink_performance" spacing="0"/>
        </process>
      </operator>
      <!-- Wiring of the top-level chain; ICA and Forward Selection outputs are delivered as results 1 to 5. -->
      <connect from_op="Retrieve Sonar" from_port="output" to_op="Numerical to Binominal" to_port="example set input"/>
      <connect from_op="Numerical to Binominal" from_port="example set output" to_op="Set Role" to_port="example set input"/>
      <connect from_op="Set Role" from_port="example set output" to_op="Normalize" to_port="example set input"/>
      <connect from_op="Normalize" from_port="example set output" to_op="Nominal to Numerical (2)" to_port="example set input"/>
      <connect from_op="Nominal to Numerical (2)" from_port="example set output" to_op="Replace Missing Values" to_port="example set input"/>
      <connect from_op="Replace Missing Values" from_port="example set output" to_op="ICA" to_port="example set input"/>
      <connect from_op="ICA" from_port="example set output" to_op="Forward Selection" to_port="example set"/>
      <connect from_op="ICA" from_port="original" to_port="result 1"/>
      <connect from_op="ICA" from_port="preprocessing model" to_port="result 2"/>
      <connect from_op="Forward Selection" from_port="example set" to_port="result 3"/>
      <connect from_op="Forward Selection" from_port="attribute weights" to_port="result 4"/>
      <connect from_op="Forward Selection" from_port="performance" to_port="result 5"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="18"/>
      <portSpacing port="sink_result 2" spacing="0"/>
      <portSpacing port="sink_result 3" spacing="0"/>
      <portSpacing port="sink_result 4" spacing="0"/>
      <portSpacing port="sink_result 5" spacing="0"/>
      <portSpacing port="sink_result 6" spacing="0"/>
    </process>
  </operator>
</process>
The forward selection operator outputs a set of weights and these can be used to select the attributes that the operator found to give the best performance. The first thing to do therefore is to use these weights with the Select by Weight operator to give the example set that was used to build the model.
From there you could simply rebuild the model with this example set outside the Forward Selection operator. If you additionally wanted to get an estimate of the performance on unseen data you could use a Validation block on all the data but if not then simply using the model operator would create the model you need.
When I tried it, the estimated performance I got was different from the one produced by the Forward Selection operator, because the partitioning in the validation block is different owing to different random number seeds. It is also the case that the Validation block inside the Forward Selection gives an average performance over several models, one built per validation partition (the process above sets number_of_validations to 5). These models could all be different, so there is no one true model that can be saved.
Hope that helps.
regards
Andrew

RapidMiner - range by occurence

I want to filter my results (document occurrences) down to the most frequent ones (the 10 most popular of them). How do I do that?
One way would be to use a sort operator followed by a filter. For example, sorting and filtering the sample Iris dataset by a1:
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!-- RapidMiner process: retrieve the Iris sample data, sort by a1 in decreasing order, keep examples 1 to 10. -->
<process version="5.2.008">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="5.2.008" expanded="true" name="Process">
    <process expanded="true" height="417" width="675">
      <operator activated="true" class="retrieve" compatibility="5.2.008" expanded="true" height="60" name="Retrieve" width="90" x="45" y="30">
        <parameter key="repository_entry" value="//Samples/data/Iris"/>
      </operator>
      <!-- Largest a1 values first, so the range filter below keeps the top of the list. -->
      <operator activated="true" class="sort" compatibility="5.2.008" expanded="true" height="76" name="Sort" width="90" x="179" y="30">
        <parameter key="attribute_name" value="a1"/>
        <parameter key="sorting_direction" value="decreasing"/>
      </operator>
      <operator activated="true" class="filter_example_range" compatibility="5.2.008" expanded="true" height="76" name="Filter Example Range" width="90" x="313" y="30">
        <parameter key="first_example" value="1"/>
        <parameter key="last_example" value="10"/>
      </operator>
      <connect from_op="Retrieve" from_port="output" to_op="Sort" to_port="example set input"/>
      <connect from_op="Sort" from_port="example set output" to_op="Filter Example Range" to_port="example set input"/>
      <connect from_op="Filter Example Range" from_port="example set output" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>