<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Recommended data quality test suite for Hive / Pig / Oozie in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98038#M11549</link>
    <description>&lt;P&gt;Hi&lt;/P&gt;&lt;P&gt;I am looking for best practices around data quality testing for Hive / Pig / Oozie based ETL. &lt;/P&gt;&lt;P&gt;The client is looking at tools like Data flux data quality for Hadoop. &lt;/P&gt;&lt;P&gt;If there are any alternative recommendations, please update this question. &lt;/P&gt;</description>
    <pubDate>Fri, 16 Sep 2022 09:51:36 GMT</pubDate>
    <dc:creator>pbalasundaram</dc:creator>
    <dc:date>2022-09-16T09:51:36Z</dc:date>
    <item>
      <title>Recommended data quality test suite for Hive / Pig / Oozie</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98038#M11549</link>
      <description>&lt;P&gt;Hi&lt;/P&gt;&lt;P&gt;I am looking for best practices around data quality testing for Hive / Pig / Oozie based ETL. &lt;/P&gt;&lt;P&gt;The client is looking at tools like Data flux data quality for Hadoop. &lt;/P&gt;&lt;P&gt;If there are any alternative recommendations, please update this question. &lt;/P&gt;</description>
      <pubDate>Fri, 16 Sep 2022 09:51:36 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98038#M11549</guid>
      <dc:creator>pbalasundaram</dc:creator>
      <dc:date>2022-09-16T09:51:36Z</dc:date>
    </item>
    <item>
      <title>Re: Recommended data quality test suite for Hive / Pig / Oozie</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98039#M11550</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/435/pbalasundaram.html" nodeid="435"&gt;@pbalasundaram&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A target="_blank" href="https://www.trifacta.com/"&gt;https://www.trifacta.com/&lt;/A&gt;   - It can be used for data quality checks during cleansing &lt;/P&gt;&lt;P&gt;&lt;A target="_blank" href="http://vis.stanford.edu/wrangler/"&gt;http://vis.stanford.edu/wrangler/&lt;/A&gt;  - open source version of trifacta&lt;/P&gt;&lt;P&gt;&lt;A target="_blank" href="https://www.talend.com/resource/data-quality-tools.html"&gt;https://www.talend.com/resource/data-quality-tools.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A target="_blank" href="https://www.ataccama.com/products/big-data-platform-for-hadoop/big-data-engine"&gt;https://www.ataccama.com/products/big-data-platform-for-hadoop/big-data-engine&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 08 Dec 2015 04:36:10 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98039#M11550</guid>
      <dc:creator>nsabharwal</dc:creator>
      <dc:date>2015-12-08T04:36:10Z</dc:date>
    </item>
    <item>
      <title>Re: Recommended data quality test suite for Hive / Pig / Oozie</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98040#M11551</link>
      <description>&lt;P&gt;Hi Neeraj - Trifacta seems to be a data wrangling tool; does it also provide data quality measures OOTB? &lt;/P&gt;</description>
      <pubDate>Tue, 08 Dec 2015 04:49:42 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98040#M11551</guid>
      <dc:creator>pbalasundaram</dc:creator>
      <dc:date>2015-12-08T04:49:42Z</dc:date>
    </item>
    <item>
      <title>Re: Recommended data quality test suite for Hive / Pig / Oozie</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98041#M11552</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/435/pbalasundaram.html" nodeid="435"&gt;@pbalasundaram&lt;/A&gt; I have heard that it can be used for the quality while wrangling.&lt;/P&gt;&lt;P&gt;&lt;A target="_blank" href="https://www.trifacta.com/wp-content/uploads/2014/01/Trifacta_DataTransformValue_WP.pdf"&gt;https://www.trifacta.com/wp-content/uploads/2014/01/Trifacta_DataTransformValue_WP.pdf&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 08 Dec 2015 04:58:18 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98041#M11552</guid>
      <dc:creator>nsabharwal</dc:creator>
      <dc:date>2015-12-08T04:58:18Z</dc:date>
    </item>
    <item>
      <title>Re: Recommended data quality test suite for Hive / Pig / Oozie</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98042#M11553</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/435/pbalasundaram.html" nodeid="435"&gt;@pbalasundaram&lt;/A&gt; are you still having issues with this? Can you accept the best answer or provide your own solution?&lt;/P&gt;</description>
      <pubDate>Wed, 03 Feb 2016 23:48:51 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98042#M11553</guid>
      <dc:creator>aervits</dc:creator>
      <dc:date>2016-02-03T23:48:51Z</dc:date>
    </item>
    <item>
      <title>Re: Recommended data quality test suite for Hive / Pig / Oozie</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98043#M11554</link>
      <description>&lt;P&gt;Hi Neeraj, for data quality testing, is there a model script developed in Pig or Spark, rather than using a tool? Thanks.&lt;/P&gt;</description>
      <pubDate>Wed, 25 May 2016 11:41:17 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/98043#M11554</guid>
      <dc:creator>Eukrev</dc:creator>
      <dc:date>2016-05-25T11:41:17Z</dc:date>
    </item>
    <item>
      <title>Re: Recommended data quality test suite for Hive / Pig / Oozie</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/307120#M11555</link>
      <description>&lt;P&gt;2020 update: what are the preferred data quality tools compatible with CDH for Hive, HBase and Solr? Our team is looking at Apache Griffin.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Regards,&amp;nbsp;&lt;BR /&gt;Nithya Koka&lt;/P&gt;</description>
      <pubDate>Mon, 07 Dec 2020 19:36:20 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-data-quality-test-suite-for-Hive-Pig-Oozie/m-p/307120#M11555</guid>
      <dc:creator>KokaN</dc:creator>
      <dc:date>2020-12-07T19:36:20Z</dc:date>
    </item>
  </channel>
</rss>

