在 RapidMiner 中创建帕累托图

Creating a pareto chart in RapidMiner

我无法绘制简单的帕累托图。

我的数据如下:

当我尝试创建帕累托图时,得到的是一片空白,而且也无法选择 "Count Value" 的值:

我在这里遗漏了什么? 我的示例数据以如下 XML 流程的形式给出:

<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process definition (process version 5.3.015) that assembles a
  small sample data set for the Pareto chart question.

  Nine "generate_data_user_specification" operators each define two attribute
  values: "category" (a quoted string literal) and "Incidents" (a number):
    black=10, blue=2, green=7, white=8, red=2,
    Yellow=1, Gray=1, Navy=1, Purple=1
  An "append" operator receives all nine outputs, and its "merged set" port is
  connected to the port "result 1".
-->
<process version="5.3.015">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="5.3.015" expanded="true" name="Process">
    <process expanded="true">
      <!-- Data sources: one operator per category value. Each one sets only "category" and "Incidents" and declares no additional roles. -->
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification" width="90" x="447" y="75">
        <list key="attribute_values">
          <parameter key="category" value="&quot;black&quot;"/>
          <parameter key="Incidents" value="10"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (2)" width="90" x="447" y="390">
        <list key="attribute_values">
          <parameter key="category" value="&quot;blue&quot;"/>
          <parameter key="Incidents" value="2"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (3)" width="90" x="447" y="210">
        <list key="attribute_values">
          <parameter key="category" value="&quot;green&quot;"/>
          <parameter key="Incidents" value="7"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (4)" width="90" x="447" y="165">
        <list key="attribute_values">
          <parameter key="category" value="&quot;white&quot;"/>
          <parameter key="Incidents" value="8"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (5)" width="90" x="447" y="300">
        <list key="attribute_values">
          <parameter key="category" value="&quot;red&quot;"/>
          <parameter key="Incidents" value="2"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (6)" width="90" x="447" y="480">
        <list key="attribute_values">
          <parameter key="category" value="&quot;Yellow&quot;"/>
          <parameter key="Incidents" value="1"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (7)" width="90" x="447" y="705">
        <list key="attribute_values">
          <parameter key="category" value="&quot;Gray&quot;"/>
          <parameter key="Incidents" value="1"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (8)" width="90" x="447" y="840">
        <list key="attribute_values">
          <parameter key="category" value="&quot;Navy&quot;"/>
          <parameter key="Incidents" value="1"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <operator activated="true" class="generate_data_user_specification" compatibility="5.3.015" expanded="true" height="60" name="Generate Data by User Specification (9)" width="90" x="447" y="570">
        <list key="attribute_values">
          <parameter key="category" value="&quot;Purple&quot;"/>
          <parameter key="Incidents" value="1"/>
        </list>
        <list key="set_additional_roles"/>
      </operator>
      <!-- Collects the nine generated outputs on its input ports "example set 1" through "example set 9" and exposes them on "merged set". -->
      <operator activated="true" class="append" compatibility="5.3.015" expanded="true" height="220" name="Append" width="90" x="715" y="120"/>
      <!--
        Wiring of the generators into Append. The input port numbers do not
        follow the operator numbering (for example, operator (2) feeds
        "example set 5" and operator (7) feeds "example set 9").
        NOTE(review): presumably the port number decides the row order of the
        merged set - confirm before relying on that order.
      -->
      <connect from_op="Generate Data by User Specification" from_port="output" to_op="Append" to_port="example set 1"/>
      <connect from_op="Generate Data by User Specification (2)" from_port="output" to_op="Append" to_port="example set 5"/>
      <connect from_op="Generate Data by User Specification (3)" from_port="output" to_op="Append" to_port="example set 4"/>
      <connect from_op="Generate Data by User Specification (4)" from_port="output" to_op="Append" to_port="example set 2"/>
      <connect from_op="Generate Data by User Specification (5)" from_port="output" to_op="Append" to_port="example set 3"/>
      <connect from_op="Generate Data by User Specification (6)" from_port="output" to_op="Append" to_port="example set 6"/>
      <connect from_op="Generate Data by User Specification (7)" from_port="output" to_op="Append" to_port="example set 9"/>
      <connect from_op="Generate Data by User Specification (8)" from_port="output" to_op="Append" to_port="example set 7"/>
      <connect from_op="Generate Data by User Specification (9)" from_port="output" to_op="Append" to_port="example set 8"/>
      <!-- No to_op is given here; presumably "result 1" is the result port of the enclosing process - confirm. -->
      <connect from_op="Append" from_port="merged set" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>

所以我找到了一个解决方法(感谢 Andrew),它只适用于这个示例集。

我必须先对数据进行"反聚合"(de-aggregate),并为每个示例添加一个取值相同的新多标称(polynominal)属性。

然后我就可以创建帕累托图: 按 'category' 分组,并将计数列设置为这个新属性。

由此得到如下图表:

当我对我的数据集执行此操作时,我得到了这张图表:

我觉得,如果帕累托图无法进行配置,那么当分组类别中包含很多不同取值时,图表效果会非常糟糕。