Problem with XPath query? Processing documents from web
Hi there,
I am trying to extract documents from a movie review site. When I run the process below, I get 0 results and can't figure out the problem. Can anyone help? Thanks.
<?xml version="1.0" encoding="UTF-8"?>
<!--
  RapidMiner process: a Loop operator wraps "Process Documents from Web",
  which fetches a single review page, cuts it into segments with an XPath
  query (Cut Document) and is meant to pull the paragraph text out of each
  segment (Extract Information).

  Changes relative to the pasted original:
    * removed the HTML <br> paste artifacts, which made the file not well-formed;
    * repaired the Extract Information XPath, which read "//h:p/text|)".
-->
<process version="9.0.003">
  <context>
    <input/>
    <output/>
    <macros/>
  </context>
  <operator activated="true" class="process" compatibility="6.0.002" expanded="true" name="Process">
    <process expanded="true">
      <!-- The loop body uses a fixed URL, so each of the 10 iterations requests the same page. -->
      <operator activated="true" class="concurrency:loop" compatibility="9.0.003" expanded="true" height="82" name="Loop" width="90" x="313" y="238">
        <parameter key="number_of_iterations" value="10"/>
        <process expanded="true">
          <operator activated="true" class="web:process_web_modern" compatibility="9.0.000" expanded="true" height="68" name="Process Documents from Web" width="90" x="179" y="85">
            <parameter key="url" value="https://www.rottentomatoes.com/m/chef_2014/reviews/"/>
            <list key="crawling_rules"/>
            <process expanded="true">
              <!--
                Splits the fetched page into one segment per matched table row.
                NOTE(review): the "namespaces" list is empty, so the "h:" prefix is
                presumably predefined by the extension for XHTML; confirm.
                NOTE(review): if the converted page places rows under a tbody element,
                the direct child step "/h:tr" will match nothing; verify against the
                actual page markup.
              -->
              <operator activated="true" class="text:cut_document" compatibility="8.1.000" expanded="true" height="68" name="Cut Document" width="90" x="246" y="34">
                <parameter key="query_type" value="XPath"/>
                <list key="string_machting_queries"/>
                <list key="regular_expression_queries"/>
                <list key="regular_region_queries"/>
                <list key="xpath_queries">
                  <parameter key="seg" value="//h:table[@class='table table-striped']/h:tr"/>
                </list>
                <list key="namespaces"/>
                <list key="index_queries"/>
                <list key="jsonpath_queries"/>
                <!-- Each segment is passed straight through to the output without further processing. -->
                <process expanded="true">
                  <connect from_port="segment" to_port="document 1"/>
                  <portSpacing port="source_segment" spacing="0"/>
                  <portSpacing port="sink_document 1" spacing="0"/>
                  <portSpacing port="sink_document 2" spacing="0"/>
                </process>
              </operator>
              <!--
                NOTE(review): no <connect> element in this subprocess references
                "Extract Information", so as wired it receives no document and its
                "text" attribute is never produced. It most likely belongs inside the
                Cut Document subprocess (segment to Extract Information to document 1);
                confirm and rewire in the RapidMiner designer.
              -->
              <operator activated="true" class="text:extract_information" compatibility="8.1.000" expanded="true" height="68" name="Extract Information" width="90" x="447" y="34">
                <parameter key="query_type" value="XPath"/>
                <list key="string_machting_queries"/>
                <list key="regular_expression_queries"/>
                <list key="regular_region_queries"/>
                <list key="xpath_queries">
                  <!-- text() is the XPath node test for text nodes; the original "text|)" was not a valid expression. -->
                  <parameter key="text" value="//h:p/text()"/>
                </list>
                <list key="namespaces"/>
                <list key="index_queries"/>
                <list key="jsonpath_queries"/>
              </operator>
              <connect from_port="document" to_op="Cut Document" to_port="document"/>
              <connect from_op="Cut Document" from_port="documents" to_port="document 1"/>
              <portSpacing port="source_document" spacing="0"/>
              <portSpacing port="sink_document 1" spacing="0"/>
              <portSpacing port="sink_document 2" spacing="0"/>
            </process>
          </operator>
          <connect from_op="Process Documents from Web" from_port="example set" to_port="output 1"/>
          <portSpacing port="source_input 1" spacing="0"/>
          <portSpacing port="sink_output 1" spacing="0"/>
          <portSpacing port="sink_output 2" spacing="0"/>
        </process>
      </operator>
      <connect from_op="Loop" from_port="output 1" to_port="result 1"/>
      <portSpacing port="source_input 1" spacing="0"/>
      <portSpacing port="sink_result 1" spacing="0"/>
      <portSpacing port="sink_result 2" spacing="0"/>
    </process>
  </operator>
</process>