| <?xml version="1.0" encoding="UTF-8"?> |
| <!-- |
| |
| Licensed to the Apache Software Foundation (ASF) under one or more |
| contributor license agreements. See the NOTICE file distributed with |
| this work for additional information regarding copyright ownership. |
| The ASF licenses this file to You under the Apache License, Version 2.0 |
| (the "License"); you may not use this file except in compliance with |
| the License. You may obtain a copy of the License at |
| |
| http://www.apache.org/licenses/LICENSE-2.0 |
| |
| Unless required by applicable law or agreed to in writing, software |
| distributed under the License is distributed on an "AS IS" BASIS, |
| WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| See the License for the specific language governing permissions and |
| limitations under the License. |
| |
| --> |
| <pipeline> |
| <!-- Pipeline metadata for 0034-unique-rows: name, type and status, transform performance capture settings (capture is off), and created/modified stamps. --> |
| <info> |
| <name>0034-unique-rows</name> |
| <name_sync_with_filename>Y</name_sync_with_filename> |
| <description/> |
| <extended_description/> |
| <pipeline_version/> |
| <pipeline_type>Normal</pipeline_type> |
| <pipeline_status>0</pipeline_status> |
| <parameters> |
| </parameters> |
| <capture_transform_performance>N</capture_transform_performance> |
| <transform_performance_capturing_delay>1000</transform_performance_capturing_delay> |
| <transform_performance_capturing_size_limit>100</transform_performance_capturing_size_limit> |
| <created_user>-</created_user> |
| <created_date>2021/07/13 21:09:00.016</created_date> |
| <modified_user>-</modified_user> |
| <modified_date>2021/07/13 21:09:00.016</modified_date> |
| <key_for_session_key>H4sIAAAAAAAAAAMAAAAAAAAAAAA=</key_for_session_key> |
| <is_key_private>N</is_key_private> |
| </info> |
| <notepads> |
| <notepad> |
| <note>Warning: rows are sorted in case-insensitive order, while the dataset is in case-sensitive order</note> |
| <xloc>112</xloc> |
| <yloc>32</yloc> |
| <width>437</width> |
| <heigth>26</heigth> |
| <fontname>Segoe UI</fontname> |
| <fontsize>9</fontsize> |
| <fontbold>N</fontbold> |
| <fontitalic>N</fontitalic> |
| <fontcolorred>14</fontcolorred> |
| <fontcolorgreen>58</fontcolorgreen> |
| <fontcolorblue>90</fontcolorblue> |
| <backgroundcolorred>201</backgroundcolorred> |
| <backgroundcolorgreen>232</backgroundcolorgreen> |
| <backgroundcolorblue>251</backgroundcolorblue> |
| <bordercolorred>14</bordercolorred> |
| <bordercolorgreen>58</bordercolorgreen> |
| <bordercolorblue>90</bordercolorblue> |
| </notepad> |
| </notepads> |
| <!-- Hops (all enabled): "Data grid" to "sort", "sort" to "Unique rows", and "Unique rows" to both "Result" and "Duplicate row". --> |
| <order> |
| <hop> |
| <from>Data grid</from> |
| <to>sort</to> |
| <enabled>Y</enabled> |
| </hop> |
| <hop> |
| <from>sort</from> |
| <to>Unique rows</to> |
| <enabled>Y</enabled> |
| </hop> |
| <hop> |
| <from>Unique rows</from> |
| <to>Result</to> |
| <enabled>Y</enabled> |
| </hop> |
| <hop> |
| <from>Unique rows</from> |
| <to>Duplicate row</to> |
| <enabled>Y</enabled> |
| </hop> |
| </order> |
| <!-- Inline input data: 12 rows with two String fields (Field_A, Field_B) and one Integer field (Field_C). --> |
| <!-- Values vary in letter case (ABCD/abcd, Z/z) and several rows are repeated, in unsorted order. --> |
| <transform> |
| <name>Data grid</name> |
| <type>DataGrid</type> |
| <description/> |
| <distribute>Y</distribute> |
| <custom_distribution/> |
| <copies>1</copies> |
| <partitioning> |
| <method>none</method> |
| <schema_name/> |
| </partitioning> |
| <fields> |
| <field> |
| <set_empty_string>N</set_empty_string> |
| <length>-1</length> |
| <name>Field_A</name> |
| <precision>-1</precision> |
| <type>String</type> |
| </field> |
| <field> |
| <set_empty_string>N</set_empty_string> |
| <length>-1</length> |
| <name>Field_B</name> |
| <precision>-1</precision> |
| <type>String</type> |
| </field> |
| <field> |
| <set_empty_string>N</set_empty_string> |
| <length>-1</length> |
| <name>Field_C</name> |
| <precision>-1</precision> |
| <type>Integer</type> |
| </field> |
| </fields> |
| <data> |
| <line> |
| <item>ABCD</item> |
| <item>Z</item> |
| <item>1</item> |
| </line> |
| <line> |
| <item>ABCD</item> |
| <item>Z</item> |
| <item>2</item> |
| </line> |
| <line> |
| <item>ABCD</item> |
| <item>z</item> |
| <item>2</item> |
| </line> |
| <line> |
| <item>ABCD</item> |
| <item>z</item> |
| <item>6</item> |
| </line> |
| <line> |
| <item>abcd</item> |
| <item>X</item> |
| <item>9</item> |
| </line> |
| <line> |
| <item>abcd</item> |
| <item>X</item> |
| <item>9</item> |
| </line> |
| <line> |
| <item>EFG</item> |
| <item>X</item> |
| <item>8</item> |
| </line> |
| <line> |
| <item>EFG</item> |
| <item>Z</item> |
| <item>1</item> |
| </line> |
| <line> |
| <item>ABCD</item> |
| <item>Z</item> |
| <item>2</item> |
| </line> |
| <line> |
| <item>ABCD</item> |
| <item>z</item> |
| <item>2</item> |
| </line> |
| <line> |
| <item>EFG</item> |
| <item>X</item> |
| <item>6</item> |
| </line> |
| <line> |
| <item>EFG</item> |
| <item>Z</item> |
| <item>8</item> |
| </line> |
| </data> |
| <attributes/> |
| <GUI> |
| <xloc>112</xloc> |
| <yloc>112</yloc> |
| </GUI> |
| </transform> |
| <!-- Dummy transform "Duplicate row": target of a hop from "Unique rows" and the configured error-handling target for that transform. --> |
| <transform> |
| <name>Duplicate row</name> |
| <type>Dummy</type> |
| <description/> |
| <distribute>Y</distribute> |
| <custom_distribution/> |
| <copies>1</copies> |
| <partitioning> |
| <method>none</method> |
| <schema_name/> |
| </partitioning> |
| <attributes/> |
| <GUI> |
| <xloc>368</xloc> |
| <yloc>240</yloc> |
| </GUI> |
| </transform> |
| <!-- Dummy transform "Result": target of the hop from "Unique rows" that is not the error-handling target. --> |
| <transform> |
| <name>Result</name> |
| <type>Dummy</type> |
| <description/> |
| <distribute>Y</distribute> |
| <custom_distribution/> |
| <copies>1</copies> |
| <partitioning> |
| <method>none</method> |
| <schema_name/> |
| </partitioning> |
| <attributes/> |
| <GUI> |
| <xloc>496</xloc> |
| <yloc>112</yloc> |
| </GUI> |
| </transform> |
| <!-- Unique transform: compares on Field_A (case_insensitive Y) and Field_B (case_insensitive N). --> |
| <!-- Row counting is enabled with count field CounterField; duplicate rejection is enabled with error description ErrorDescription. --> |
| <transform> |
| <name>Unique rows</name> |
| <type>Unique</type> |
| <description/> |
| <distribute>Y</distribute> |
| <custom_distribution/> |
| <copies>1</copies> |
| <partitioning> |
| <method>none</method> |
| <schema_name/> |
| </partitioning> |
| <count_rows>Y</count_rows> |
| <count_field>CounterField</count_field> |
| <reject_duplicate_row>Y</reject_duplicate_row> |
| <error_description>ErrorDescription</error_description> |
| <fields> |
| <field> |
| <name>Field_A</name> |
| <case_insensitive>Y</case_insensitive> |
| </field> |
| <field> |
| <name>Field_B</name> |
| <case_insensitive>N</case_insensitive> |
| </field> |
| </fields> |
| <attributes/> |
| <GUI> |
| <xloc>368</xloc> |
| <yloc>112</yloc> |
| </GUI> |
| </transform> |
| <!-- SortRows transform: sorts ascending on Field_A, Field_B, then Field_C, with case_sensitive N and the collator disabled on every field. --> |
| <!-- NOTE(review): "Unique rows" compares Field_B with case_insensitive N while this sort uses case_sensitive N for Field_B; presumably deliberate for this test (see the notepad warning), confirm before changing. --> |
| <transform> |
| <name>sort</name> |
| <type>SortRows</type> |
| <description/> |
| <distribute>Y</distribute> |
| <custom_distribution/> |
| <copies>1</copies> |
| <partitioning> |
| <method>none</method> |
| <schema_name/> |
| </partitioning> |
| <directory>${java.io.tmpdir}</directory> |
| <prefix>out</prefix> |
| <sort_size>1000000</sort_size> |
| <free_memory/> |
| <compress>N</compress> |
| <compress_variable/> |
| <unique_rows>N</unique_rows> |
| <fields> |
| <field> |
| <name>Field_A</name> |
| <ascending>Y</ascending> |
| <case_sensitive>N</case_sensitive> |
| <collator_enabled>N</collator_enabled> |
| <collator_strength>0</collator_strength> |
| <presorted>N</presorted> |
| </field> |
| <field> |
| <name>Field_B</name> |
| <ascending>Y</ascending> |
| <case_sensitive>N</case_sensitive> |
| <collator_enabled>N</collator_enabled> |
| <collator_strength>0</collator_strength> |
| <presorted>N</presorted> |
| </field> |
| <field> |
| <name>Field_C</name> |
| <ascending>Y</ascending> |
| <case_sensitive>N</case_sensitive> |
| <collator_enabled>N</collator_enabled> |
| <collator_strength>0</collator_strength> |
| <presorted>N</presorted> |
| </field> |
| </fields> |
| <attributes/> |
| <GUI> |
| <xloc>240</xloc> |
| <yloc>112</yloc> |
| </GUI> |
| </transform> |
| <!-- Error handling is enabled from source transform "Unique rows" to target transform "Duplicate row"; all value-name and limit elements are left empty. --> |
| <transform_error_handling> |
| <error> |
| <source_transform>Unique rows</source_transform> |
| <target_transform>Duplicate row</target_transform> |
| <is_enabled>Y</is_enabled> |
| <nr_valuename/> |
| <descriptions_valuename/> |
| <fields_valuename/> |
| <codes_valuename/> |
| <max_errors/> |
| <max_pct_errors/> |
| <min_pct_rows/> |
| </error> |
| </transform_error_handling> |
| <attributes/> |
| </pipeline> |