在RapidMiner中创建一个帕累托图

时间:2016-06-10 20:12:05

标签: rapidminer

我无法绘制简单的帕累托图表。

我的数据如下:

enter image description here

当我尝试创建帕累托图(Pareto chart)时,得到的只是一片空白,而且我也无法为"Count Value"选择任何值:

enter image description here

我在这里遗漏了什么?我的样本数据以如下XML流程的形式给出:

<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process definition (process version 5.3.015) used as sample data
  for the question above. It defines nine data-generating operators, each with
  a "category" value and an "Incidents" value, and wires all of them into one
  Append operator whose "merged set" output is connected to "result 1".
-->
<process version="5.3.015">
  <!-- Process context: no inputs, outputs or macros are declared. -->
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="5.3.015" expanded="true" name="Process">
    <process expanded="true">
      <!--
        Nine "Generate Data by User Specification" operators follow. Each one
        sets two attribute values: "category" (a quoted string) and "Incidents"
        (a number). NOTE(review): presumably each operator yields a single
        example; confirm against the RapidMiner operator documentation.
        The x/y/width/height attributes look like canvas layout coordinates.
      -->
      <!-- category "black", Incidents 10 -->
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification" width="90" x="447" y="75">
        <list key="attribute_values">
          <parameter key="category" value="&quot;black&quot;"/>
          <parameter key="Incidents" value="10"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <!-- category "blue", Incidents 2 -->
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (2)" width="90" x="447" y="390">
        <list key="attribute_values">
          <parameter key="category" value="&quot;blue&quot;"/>
          <parameter key="Incidents" value="2"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <!-- category "green", Incidents 7 -->
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (3)" width="90" x="447" y="210">
        <list key="attribute_values">
          <parameter key="category" value="&quot;green&quot;"/>
          <parameter key="Incidents" value="7"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <!-- category "white", Incidents 8 -->
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (4)" width="90" x="447" y="165">
        <list key="attribute_values">
          <parameter key="category" value="&quot;white&quot;"/>
          <parameter key="Incidents" value="8"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <!-- category "red", Incidents 2 -->
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (5)" width="90" x="447" y="300">
        <list key="attribute_values">
          <parameter key="category" value="&quot;red&quot;"/>
          <parameter key="Incidents" value="2"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <!-- category "Yellow", Incidents 1 (capitalised, unlike the first five categories) -->
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (6)" width="90" x="447" y="480">
        <list key="attribute_values">
          <parameter key="category" value="&quot;Yellow&quot;"/>
          <parameter key="Incidents" value="1"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <!-- category "Gray", Incidents 1 -->
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (7)" width="90" x="447" y="705">
        <list key="attribute_values">
          <parameter key="category" value="&quot;Gray&quot;"/>
          <parameter key="Incidents" value="1"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <!-- category "Navy", Incidents 1 -->
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (8)" width="90" x="447" y="840">
        <list key="attribute_values">
          <parameter key="category" value="&quot;Navy&quot;"/>
          <parameter key="Incidents" value="1"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <!-- category "Purple", Incidents 1 -->
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (9)" width="90" x="447" y="570">
        <list key="attribute_values">
          <parameter key="category" value="&quot;Purple&quot;"/>
          <parameter key="Incidents" value="1"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <!-- Append operator: target of the nine generator outputs wired below. -->
      <operator activated="true" class="append" compatibility="5.3.015" expanded="true" height="220" name="Append" width="90" x="715" y="120"/>
      <!--
        Wiring of each generator's "output" port to an Append "example set N" port.
        The operator numbering does not match the port numbering (for example,
        operator (2) feeds "example set 5" and operator (7) feeds "example set 9").
        NOTE(review): presumably the order of the appended examples follows the
        port numbers rather than the operator names; verify if order matters.
      -->
      <connect from_op="Generate Data by User Specification" from_port="output" to_op="Append" to_port="example set 1"/>
      <connect from_op="Generate Data by User Specification (2)" from_port="output" to_op="Append" to_port="example set 5"/>
      <connect from_op="Generate Data by User Specification (3)" from_port="output" to_op="Append" to_port="example set 4"/>
      <connect from_op="Generate Data by User Specification (4)" from_port="output" to_op="Append" to_port="example set 2"/>
      <connect from_op="Generate Data by User Specification (5)" from_port="output" to_op="Append" to_port="example set 3"/>
      <connect from_op="Generate Data by User Specification (6)" from_port="output" to_op="Append" to_port="example set 6"/>
      <connect from_op="Generate Data by User Specification (7)" from_port="output" to_op="Append" to_port="example set 9"/>
      <connect from_op="Generate Data by User Specification (8)" from_port="output" to_op="Append" to_port="example set 7"/>
      <connect from_op="Generate Data by User Specification (9)" from_port="output" to_op="Append" to_port="example set 8"/>
      <!-- No to_op on this connection: the merged set goes to the port "result 1" (presumably the enclosing process's result port). -->
      <connect from_op="Append" from_port="merged set" to_port="result 1"/>
      <!-- Layout spacing for the ports named "source_input 1", "sink_result 1" and "sink_result 2". -->
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>

1 个答案:

答案 0 :(得分:0)

我找到了一个变通办法(感谢Andrew),不过它只适用于这个示例集。

我必须先对数据进行“解聚合”(de-aggregate),并为每个样本添加一个取值相同的新的多名义(polynominal)属性。

然后我就可以创建帕累托图:按“category”属性分组,并将计数列(count column)设置为这个新属性。

enter image description here

导致此图表:

enter image description here

当我使用我的数据集执行此操作时,我得到此图表:

enter image description here

我想,由于帕累托图无法进行配置,当分组属性中有很多不同的取值时,显示效果确实很糟糕。