<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Data Prep &amp; Duplicates in Data Quality</title>
    <link>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258604#M1302</link>
    <description>&lt;P&gt;yes you can apply it to a column but keep in mind your external link should be duplicate.&lt;/P&gt;</description>
    <pubDate>Mon, 03 Sep 2018 05:33:23 GMT</pubDate>
    <dc:creator>aashish_21nov</dc:creator>
    <dc:date>2018-09-03T05:33:23Z</dc:date>
    <item>
      <title>Data Prep &amp; Duplicates</title>
      <link>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258601#M1299</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;
&lt;P&gt;Using the Data Prep tool, I am trying to find duplicates within a column. Is there a way to find those that are an exact match as well as those that are a close match (similar to how Excel duplicates and fuzzy match work)?&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sat, 16 Nov 2024 07:43:53 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258601#M1299</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2024-11-16T07:43:53Z</dc:date>
    </item>
    <item>
      <title>Re: Data Prep &amp; Duplicates</title>
      <link>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258602#M1300</link>
      <description>&lt;P&gt;tUniqRow will provide a list of all duplicate records.&lt;/P&gt;</description>
      <pubDate>Mon, 03 Sep 2018 05:04:02 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258602#M1300</guid>
      <dc:creator>aashish_21nov</dc:creator>
      <dc:date>2018-09-03T05:04:02Z</dc:date>
    </item>
    <item>
      <title>Re: Data Prep &amp; Duplicates</title>
      <link>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258603#M1301</link>
      <description>&lt;P&gt;Hi Aashish,&lt;/P&gt;&lt;P&gt;Is tUniqRow used in the Talend Data Prep tool? I don't see how I can select this and apply it to a column.&lt;/P&gt;&lt;P&gt;Regards&lt;/P&gt;</description>
      <pubDate>Mon, 03 Sep 2018 05:08:29 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258603#M1301</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2018-09-03T05:08:29Z</dc:date>
    </item>
    <item>
      <title>Re: Data Prep &amp; Duplicates</title>
      <link>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258604#M1302</link>
      <description>&lt;P&gt;yes you can apply it to a column but keep in mind your external link should be duplicate.&lt;/P&gt;</description>
      <pubDate>Mon, 03 Sep 2018 05:33:23 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258604#M1302</guid>
      <dc:creator>aashish_21nov</dc:creator>
      <dc:date>2018-09-03T05:33:23Z</dc:date>
    </item>
    <item>
      <title>Re: Data Prep &amp; Duplicates</title>
      <link>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258605#M1303</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt; 
&lt;P&gt;&amp;nbsp;&lt;/P&gt; 
&lt;P&gt;tUniqueRow is not available in Talend Data Preparation, it solely exists in Talend Studio.&lt;/P&gt; 
&lt;P&gt;&amp;nbsp;&lt;/P&gt; 
&lt;P&gt;So far in Data Prep, there is no equivalent to tUniqueRow, but addressing deduplication is part of the roadmap. A few things can already help with spotting and resolving duplicates:&lt;/P&gt; 
&lt;UL&gt; 
 &lt;LI&gt;The charts on the bottom right will show the most common values. Therefore, exact matches (if any) will&amp;nbsp;show up&amp;nbsp;at the top of the chart. See&amp;nbsp;&lt;A href="https://help.talend.com/reader/n~7tYndHPhSgSAN0bpenIA/rTPaBMcsHltniefJI2Caaw" target="_blank" rel="nofollow noopener noreferrer"&gt;https://help.talend.com/reader/n~7tYndHPhSgSAN0bpenIA/rTPaBMcsHltniefJI2Caaw&lt;/A&gt; for more details.&lt;/LI&gt; 
 &lt;LI&gt;The function "find and group similar text" performs text clustering&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;with fuzzy matching. See&amp;nbsp;&lt;A href="https://help.talend.com/reader/087PIlN0I5BrDxt9016xRA/RVQQzV9CAYXQVh1m6DYWkA" target="_blank" rel="nofollow noopener noreferrer"&gt;https://help.talend.com/reader/087PIlN0I5BrDxt9016xRA/RVQQzV9CAYXQVh1m6DYWkA&lt;/A&gt;&lt;/LI&gt; 
&lt;/UL&gt; 
&lt;P&gt;Regards,&lt;/P&gt; 
&lt;P&gt;&amp;nbsp;&lt;/P&gt; 
&lt;P&gt;Gwendal&lt;/P&gt;</description>
      <pubDate>Mon, 03 Sep 2018 07:52:39 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258605#M1303</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2018-09-03T07:52:39Z</dc:date>
    </item>
    <item>
      <title>Re: Data Prep &amp; Duplicates</title>
      <link>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258606#M1304</link>
      <description>Thanks Gwendal,&lt;BR /&gt;Is there an idea of when this would be in place - I've seen mention of this in some posts in 2016/2017?&lt;BR /&gt;Regards,&lt;BR /&gt;Darren</description>
      <pubDate>Mon, 03 Sep 2018 21:10:07 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258606#M1304</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2018-09-03T21:10:07Z</dc:date>
    </item>
    <item>
      <title>Re: Data Prep &amp; Duplicates</title>
      <link>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258607#M1305</link>
      <description>&lt;P&gt;Hi Darren,&lt;/P&gt; 
&lt;P&gt;&amp;nbsp;&lt;/P&gt; 
&lt;P&gt;That is&amp;nbsp;something which&amp;nbsp;will be addressed in the course of next year.&lt;/P&gt; 
&lt;P&gt;&amp;nbsp;&lt;/P&gt; 
&lt;P&gt;Regards,&lt;/P&gt; 
&lt;P&gt;&amp;nbsp;&lt;/P&gt; 
&lt;P&gt;Gwendal&lt;/P&gt;</description>
      <pubDate>Wed, 05 Sep 2018 11:06:40 GMT</pubDate>
      <guid>https://community.qlik.com/t5/Data-Quality/Data-Prep-Duplicates/m-p/2258607#M1305</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2018-09-05T11:06:40Z</dc:date>
    </item>
  </channel>
</rss>

