<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Remove duplicate row based on all column match before inserting to DB in Talend Studio</title>
    <link>https://community.qlik.com/t5/Talend-Studio/Remove-duplicate-row-based-on-all-column-match-before-inserting/m-p/2265999#M45360</link>
    <description>&lt;P&gt;I need to remove all duplicate records from a file before it gets inserted into the DB. In my case, a record is a duplicate only if all of its columns have the same values. Example: the first two records below are considered duplicates, but the third one is not. Here there are 5 columns, but there could be more (10, 20).&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;ip&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;host_name&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;os_name&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;os_version&lt;/P&gt;
&lt;P&gt;1.1.1.1&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; abc.com&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; Windows&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;8&lt;/P&gt;
&lt;P&gt;1.1.1.1&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; abc.com&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; Windows&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;8&lt;/P&gt;
&lt;P&gt;1.1.1.1&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; abc.com&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;Linux&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;5.6&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;I need to insert the records into the Redshift DB after de-duplication is done.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Sat, 16 Nov 2024 02:22:31 GMT</pubDate>
    <dc:creator>kaps1602</dc:creator>
    <dc:date>2024-11-16T02:22:31Z</dc:date>
    <item>
      <title>Remove duplicate row based on all column match before inserting to DB</title>
      <link>https://community.qlik.com/t5/Talend-Studio/Remove-duplicate-row-based-on-all-column-match-before-inserting/m-p/2265999#M45360</link>
      <description>&lt;P&gt;I need to remove all duplicate records from a file before it gets inserted into the DB. In my case, a record is a duplicate only if all of its columns have the same values. Example: the first two records below are considered duplicates, but the third one is not. Here there are 5 columns, but there could be more (10, 20).&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;ip&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;host_name&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;os_name&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;os_version&lt;/P&gt;
&lt;P&gt;1.1.1.1&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; abc.com&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; Windows&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;8&lt;/P&gt;
&lt;P&gt;1.1.1.1&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; abc.com&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; Windows&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;8&lt;/P&gt;
&lt;P&gt;1.1.1.1&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; abc.com&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;Linux&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;5.6&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;I need to insert the records into the Redshift DB after de-duplication is done.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sat, 16 Nov 2024 02:22:31 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Talend-Studio/Remove-duplicate-row-based-on-all-column-match-before-inserting/m-p/2265999#M45360</guid>
      <dc:creator>kaps1602</dc:creator>
      <dc:date>2024-11-16T02:22:31Z</dc:date>
    </item>
    <item>
      <title>Re: Remove duplicate row based on all column match before inserting to DB</title>
      <link>https://community.qlik.com/t5/Talend-Studio/Remove-duplicate-row-based-on-all-column-match-before-inserting/m-p/2266000#M45361</link>
      <description>Use tUniqRow and select all fields as keys</description>
      <pubDate>Wed, 20 May 2020 22:12:17 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Talend-Studio/Remove-duplicate-row-based-on-all-column-match-before-inserting/m-p/2266000#M45361</guid>
      <dc:creator>TRF</dc:creator>
      <dc:date>2020-05-20T22:12:17Z</dc:date>
    </item>
  </channel>
</rss>

