Pages: [1]
  Print  
Author Topic: SOLVED: Performance Vector not showing / visible  (Read 422 times)
casnl
Newbie
*
Posts: 5


« on: October 23, 2013, 10:11:43 AM »

Hi,

Fairly new to RM, I followed a couple tutorials. However neither the tutorials nor this forum could help me fix this issue. I followed this http://www.corequant.com/?p=1 tutorial step by step for Sentiment Analysis. Using RM 5.3.013 with (obviously) text processing extension. I never get the expected output, i.e. the Performance Vector. I am able to save the model and vector and apply it to unlabeled data; which yields results. However I want to know the performance of my model; what am I missing here? Why am I not getting any performance output?

My process:
Code:
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<process version="5.3.013">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="5.3.013" expanded="true" name="Process">
    <process expanded="true">
      <operator activated="true" class="text:process_document_from_file" compatibility="5.3.002" expanded="true" height="76" name="Process Documents from Files" width="90" x="112" y="30">
        <list key="text_directories">
          <parameter key="negative" value="/Users/casvanandel/Dropbox/Thesis/Data/review_polarity/txt_sentoken/neg"/>
          <parameter key="positive" value="/Users/casvanandel/Dropbox/Thesis/Data/review_polarity/txt_sentoken/pos"/>
        </list>
        <parameter key="prune_method" value="percentual"/>
        <parameter key="prune_above_percent" value="95.0"/>
        <process expanded="true">
          <operator activated="true" class="text:tokenize" compatibility="5.3.002" expanded="true" height="60" name="Tokenize" width="90" x="112" y="75"/>
          <operator activated="true" class="text:filter_by_length" compatibility="5.3.002" expanded="true" height="60" name="Filter Tokens (by Length)" width="90" x="216" y="162"/>
          <operator activated="true" class="text:stem_porter" compatibility="5.3.002" expanded="true" height="60" name="Stem (Porter)" width="90" x="292" y="247"/>
          <operator activated="true" class="text:filter_stopwords_english" compatibility="5.3.002" expanded="true" height="60" name="Filter Stopwords (English)" width="90" x="421" y="338"/>
          <connect from_port="document" to_op="Tokenize" to_port="document"/>
          <connect from_op="Tokenize" from_port="document" to_op="Filter Tokens (by Length)" to_port="document"/>
          <connect from_op="Filter Tokens (by Length)" from_port="document" to_op="Stem (Porter)" to_port="document"/>
          <connect from_op="Stem (Porter)" from_port="document" to_op="Filter Stopwords (English)" to_port="document"/>
          <connect from_op="Filter Stopwords (English)" from_port="document" to_port="document 1"/>
          <portSpacing port="source_document" spacing="0"/>
          <portSpacing port="sink_document 1" spacing="0"/>
          <portSpacing port="sink_document 2" spacing="0"/>
        </process>
      </operator>
      <operator activated="true" class="x_validation" compatibility="5.3.013" expanded="true" height="112" name="Validation" width="90" x="313" y="30">
        <process expanded="true">
          <operator activated="true" class="support_vector_machine_linear" compatibility="5.3.013" expanded="true" height="76" name="SVM (Linear)" width="90" x="112" y="30"/>
          <connect from_port="training" to_op="SVM (Linear)" to_port="training set"/>
          <connect from_op="SVM (Linear)" from_port="model" to_port="model"/>
          <portSpacing port="source_training" spacing="0"/>
          <portSpacing port="sink_model" spacing="0"/>
          <portSpacing port="sink_through 1" spacing="0"/>
        </process>
        <process expanded="true">
          <operator activated="true" class="apply_model" compatibility="5.3.013" expanded="true" height="76" name="Apply Model" width="90" x="51" y="56">
            <list key="application_parameters"/>
          </operator>
          <operator activated="true" class="performance" compatibility="5.3.013" expanded="true" height="76" name="Performance" width="90" x="99" y="165"/>
          <connect from_port="model" to_op="Apply Model" to_port="model"/>
          <connect from_port="test set" to_op="Apply Model" to_port="unlabelled data"/>
          <connect from_op="Apply Model" from_port="labelled data" to_op="Performance" to_port="labelled data"/>
          <connect from_op="Performance" from_port="performance" to_port="averagable 1"/>
          <portSpacing port="source_model" spacing="0"/>
          <portSpacing port="source_test set" spacing="0"/>
          <portSpacing port="source_through 1" spacing="0"/>
          <portSpacing port="sink_averagable 1" spacing="0"/>
          <portSpacing port="sink_averagable 2" spacing="0"/>
        </process>
      </operator>
      <operator activated="true" class="store" compatibility="5.3.013" expanded="true" height="60" name="Store (2)" width="90" x="447" y="165">
        <parameter key="repository_entry" value="//Local Repository/pd_model"/>
      </operator>
      <operator activated="true" class="store" compatibility="5.3.013" expanded="true" height="60" name="Store" width="90" x="112" y="165">
        <parameter key="repository_entry" value="//Local Repository/pd_word"/>
      </operator>
      <operator activated="false" class="retrieve" compatibility="5.3.013" expanded="true" height="60" name="Retrieve (2)" width="90" x="313" y="255">
        <parameter key="repository_entry" value="pd_model"/>
      </operator>
      <operator activated="false" class="retrieve" compatibility="5.3.013" expanded="true" height="60" name="Retrieve" width="90" x="45" y="255">
        <parameter key="repository_entry" value="pd_word"/>
      </operator>
      <operator activated="false" class="text:process_document_from_file" compatibility="5.3.002" expanded="true" height="76" name="Process Documents from Files (2)" width="90" x="179" y="345">
        <list key="text_directories">
          <parameter key="tbd" value="/yourdirectoy/txt_sentoken/tbd"/>
        </list>
        <parameter key="prune_method" value="percentual"/>
        <parameter key="prune_above_percent" value="95.0"/>
        <process expanded="true">
          <operator activated="false" class="text:tokenize" compatibility="5.3.002" expanded="true" name="Tokenize (2)"/>
          <operator activated="false" class="text:filter_by_length" compatibility="5.3.002" expanded="true" name="Filter Tokens (2)"/>
          <operator activated="false" class="text:stem_porter" compatibility="5.3.002" expanded="true" name="Stem (2)"/>
          <operator activated="false" class="text:filter_stopwords_english" compatibility="5.3.002" expanded="true" name="Filter Stopwords (2)"/>
          <connect from_port="document" to_op="Tokenize (2)" to_port="document"/>
          <connect from_op="Tokenize (2)" from_port="document" to_op="Filter Tokens (2)" to_port="document"/>
          <connect from_op="Filter Tokens (2)" from_port="document" to_op="Stem (2)" to_port="document"/>
          <connect from_op="Stem (2)" from_port="document" to_op="Filter Stopwords (2)" to_port="document"/>
          <connect from_op="Filter Stopwords (2)" from_port="document" to_port="document 1"/>
          <portSpacing port="source_document" spacing="0"/>
          <portSpacing port="sink_document 1" spacing="0"/>
          <portSpacing port="sink_document 2" spacing="0"/>
        </process>
      </operator>
      <operator activated="false" class="apply_model" compatibility="5.3.013" expanded="true" height="76" name="Apply Model (2)" width="90" x="514" y="300">
        <list key="application_parameters"/>
      </operator>
      <connect from_op="Process Documents from Files" from_port="example set" to_op="Validation" to_port="training"/>
      <connect from_op="Process Documents from Files" from_port="word list" to_op="Store" to_port="input"/>
      <connect from_op="Validation" from_port="model" to_op="Store (2)" to_port="input"/>
      <connect from_op="Store (2)" from_port="through" to_port="result 1"/>
      <connect from_op="Retrieve (2)" from_port="output" to_op="Apply Model (2)" to_port="model"/>
      <connect from_op="Retrieve" from_port="output" to_op="Process Documents from Files (2)" to_port="word list"/>
      <connect from_op="Process Documents from Files (2)" from_port="example set" to_op="Apply Model (2)" to_port="unlabelled data"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>

Thanks in advance.
« Last Edit: October 23, 2013, 11:38:43 AM by casnl » Logged
Marco Boeck
Administrator
Hero Member
*****
Posts: 879


WWW
« Reply #1 on: October 23, 2013, 10:30:31 AM »

Hi,

there is a slight piece missing on the screenshot of the tutorial: You need to connect the "ave" port of the 'Validation' operator to the process result ports, as you did with the "mod" port.

Regards,
Marco
Logged

Join us in Boston for the RapidMiner World conference!

RapidMiner Studio 6 | RapidMiner Studio 6 Q&A
casnl
Newbie
*
Posts: 5


« Reply #2 on: October 23, 2013, 11:38:24 AM »

You really are a hero-member. Thanks a lot.
Logged
Pages: [1]
  Print  
 
Jump to: