Export Clustered Set Data To Report
passmaster16
New Altair Community Member
I am trying to export a k-means clustered set to a report using the Generate Report and Report operators, but all I end up with is an empty Excel file. What am I doing wrong? Do I have to convert the clustered set to another format before exporting? The process XML is below.
Thanks!
Josh
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!--
  RapidMiner process: reads the CALLDESC text column from a database, runs it
  through the Text extension operators (tokenize, transform cases, filter by
  length, filter stopwords), clusters the result with k-means and hands the
  clustered set to the Generate Report / Report operators.
-->
<process version="5.2.006">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="5.2.006" expanded="true" name="Process">
    <process expanded="true" height="595" width="547">
      <operator activated="true" class="read_database" compatibility="5.2.006" expanded="true" height="60" name="Read Database" width="90" x="45" y="30">
        <parameter key="connection" value="HEAT Oracle"/>
        <!-- The SQL's double quotes and comparison operators are written as
             entities; raw " and < are not allowed inside a double-quoted
             attribute value and would make the file unparseable. -->
        <parameter key="query" value="SELECT &quot;CALLDESC&quot; FROM &quot;CALLLOG&quot; WHERE ((&quot;RECVDDATE&quot;&gt;='2012-05-01') AND (&quot;CALLSOURCE&quot;&lt;&gt;'PTS'))"/>
        <enumeration key="parameters"/>
      </operator>
      <operator activated="true" class="text:process_document_from_data" compatibility="5.2.002" expanded="true" height="76" name="Process Documents from Data" width="90" x="179" y="30">
        <parameter key="add_meta_information" value="false"/>
        <parameter key="keep_text" value="true"/>
        <parameter key="prune_below_rank" value="5.0"/>
        <parameter key="prune_above_rank" value="5.0"/>
        <list key="specify_weights"/>
        <!-- Inner per-document chain: Tokenize, Transform Cases,
             Filter Tokens (by Length), Filter Stopwords (Dictionary). -->
        <process expanded="true" height="519" width="902">
          <operator activated="true" class="text:tokenize" compatibility="5.2.002" expanded="true" height="60" name="Tokenize" width="90" x="112" y="120"/>
          <operator activated="true" class="text:transform_cases" compatibility="5.2.002" expanded="true" height="60" name="Transform Cases" width="90" x="179" y="255"/>
          <operator activated="true" class="text:filter_by_length" compatibility="5.2.002" expanded="true" height="60" name="Filter Tokens (by Length)" width="90" x="514" y="165">
            <parameter key="min_chars" value="2"/>
            <parameter key="max_chars" value="999"/>
          </operator>
          <operator activated="true" class="text:filter_stopwords_dictionary" compatibility="5.2.002" expanded="true" height="76" name="Filter Stopwords (Dictionary)" width="90" x="585" y="30">
            <parameter key="file" value="C:\Program Files\Rapid-I\RapidMiner5\stopwordlist.txt"/>
          </operator>
          <connect from_port="document" to_op="Tokenize" to_port="document"/>
          <connect from_op="Tokenize" from_port="document" to_op="Transform Cases" to_port="document"/>
          <connect from_op="Transform Cases" from_port="document" to_op="Filter Tokens (by Length)" to_port="document"/>
          <connect from_op="Filter Tokens (by Length)" from_port="document" to_op="Filter Stopwords (Dictionary)" to_port="document"/>
          <connect from_op="Filter Stopwords (Dictionary)" from_port="document" to_port="document 1"/>
          <portSpacing port="source_document" spacing="36"/>
          <portSpacing port="sink_document 1" spacing="0"/>
          <portSpacing port="sink_document 2" spacing="0"/>
        </process>
      </operator>
      <operator activated="true" class="k_means" compatibility="5.2.006" expanded="true" height="76" name="Clustering" width="90" x="313" y="210">
        <parameter key="k" value="60"/>
        <parameter key="max_runs" value="5"/>
      </operator>
      <!-- Report target: format is Excel, so excel_output_file is the path in
           play; the report is registered under the name "test". -->
      <operator activated="true" class="reporting:generate_report" compatibility="5.1.000" expanded="true" height="76" name="Generate Report" width="90" x="380" y="345">
        <parameter key="report_name" value="test"/>
        <parameter key="format" value="Excel"/>
        <parameter key="pdf_output_file" value="C:\Documents and Settings\Bilskyj\Desktop\test.pdf"/>
        <parameter key="excel_output_file" value="C:\Documents and Settings\Bilskyj\Desktop\test.xls"/>
        <parameter key="pdf_template_file" value="no file selected"/>
        <parameter key="image_template_file" value="no file selected"/>
        <parameter key="section_one_font" value="courier"/>
        <parameter key="section_two_font" value="courier"/>
        <parameter key="section_three_font" value="courier"/>
        <parameter key="section_four_font" value="courier"/>
        <parameter key="section_five_font" value="courier"/>
        <parameter key="text_content_font" value="courier"/>
      </operator>
      <!-- NOTE(review): only report_name is set and the parameters list is
           empty. Presumably this operator still has to be configured through
           its Configure Report dialog before it writes any content; confirm
           against the Reporting extension documentation. -->
      <operator activated="true" class="reporting:report" compatibility="5.1.000" expanded="true" height="60" name="Report" width="90" x="380" y="525">
        <parameter key="report_name" value="test"/>
        <list key="parameters"/>
      </operator>
      <connect from_op="Read Database" from_port="output" to_op="Process Documents from Data" to_port="example set"/>
      <connect from_op="Process Documents from Data" from_port="example set" to_op="Clustering" to_port="example set"/>
      <connect from_op="Clustering" from_port="clustered set" to_op="Generate Report" to_port="through 1"/>
      <connect from_op="Generate Report" from_port="through 1" to_op="Report" to_port="reportable in"/>
      <connect from_op="Report" from_port="reportable out" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>
Tagged:
0
Answers
-
Hi Josh,
did you configure the Report operator correctly with the Configure Report button?
Best, Marius
Hi Marius,
Marius wrote:
Hi Josh,
did you configure the Report operator correctly with the Configure Report button?
Best, Marius
Well, when I click the Configure Report button, nothing happens, so maybe that is what's wrong. It should bring up a wizard to configure the operator, but nothing ever comes up after clicking the button. Is there any way to correct this?
Thanks!
Josh
Hm, the Reporting Extension seems to be broken in RapidMiner 5.2.6. We have already fixed it, and it will work with the next release of RapidMiner. Until then, we have to ask you to downgrade to RapidMiner 5.2.3 (which is the version available to the public directly before 5.2.6).
Best, Marius