<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Remove Duplicate Record values without cache services in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343243#M233881</link>
    <description>&lt;P&gt;Not sure if this is the best way but try using QueryRecord and create one dynamic property to funnel the data into where your query will look like this:&lt;/P&gt;&lt;P&gt;Select distinct * from FLOWFILE&lt;/P&gt;</description>
    <pubDate>Thu, 05 May 2022 19:57:24 GMT</pubDate>
    <dc:creator>SAMSAL</dc:creator>
    <dc:date>2022-05-05T19:57:24Z</dc:date>
    <item>
      <title>Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343176#M233871</link>
      <description>&lt;P&gt;Hi All, Good Morning!&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Please help me in removing Duplicate Records without using cache services (Apache NIFI)&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="Error Log" style="width: 844px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/34312i475EA143748A253A/image-size/large?v=v2&amp;amp;px=999" role="button" title="Error Log.PNG" alt="Error Log" /&gt;&lt;span class="lia-inline-image-caption" onclick="event.preventDefault();"&gt;Error Log&lt;/span&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 05 May 2022 05:10:45 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343176#M233871</guid>
      <dc:creator>Gtec</dc:creator>
      <dc:date>2022-05-05T05:10:45Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343243#M233881</link>
      <description>&lt;P&gt;Not sure if this is the best way but try using QueryRecord and create one dynamic property to funnel the data into where your query will look like this:&lt;/P&gt;&lt;P&gt;Select distinct * from FLOWFILE&lt;/P&gt;</description>
      <pubDate>Thu, 05 May 2022 19:57:24 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343243#M233881</guid>
      <dc:creator>SAMSAL</dc:creator>
      <dc:date>2022-05-05T19:57:24Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343346#M233905</link>
      <description>&lt;P&gt;Thanks for the valuable information and I got the results , but the Date and Error Message are not sorted/ordered properly.&lt;/P&gt;&lt;P&gt;Do We have any particular Function on Sql Query or any processor to sort in Order for the same&lt;/P&gt;</description>
      <pubDate>Fri, 06 May 2022 13:26:05 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343346#M233905</guid>
      <dc:creator>Gtec</dc:creator>
      <dc:date>2022-05-06T13:26:05Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343369#M233912</link>
      <description>&lt;P&gt;Have you tried: Select distinct * from FLOWFILE order by Date, ERROR_MSG&lt;/P&gt;</description>
      <pubDate>Fri, 06 May 2022 17:20:12 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343369#M233912</guid>
      <dc:creator>SAMSAL</dc:creator>
      <dc:date>2022-05-06T17:20:12Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343429#M233932</link>
      <description>&lt;P&gt;No, Not yet and I am waiting from the client end for confirmation since my clients are abroad and they have access for the same, Would check and let you know the results by tomorrow 10th May 2022. Thanks for the help SAMSAL.&lt;/P&gt;</description>
      <pubDate>Mon, 09 May 2022 07:00:09 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343429#M233932</guid>
      <dc:creator>Gtec</dc:creator>
      <dc:date>2022-05-09T07:00:09Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343517#M233949</link>
      <description>&lt;P&gt;Thanks for the help SAMSAL and my next task is to insert these values into the table. Please let me know which processor would help me.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 10 May 2022 10:15:12 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343517#M233949</guid>
      <dc:creator>Gtec</dc:creator>
      <dc:date>2022-05-10T10:15:12Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343551#M233957</link>
      <description>&lt;P&gt;there are a lot of processors that can help you with that for example : PUTSQL, PutDatabaseRecord, ExecuteSQL&lt;/P&gt;</description>
      <pubDate>Tue, 10 May 2022 19:28:42 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343551#M233957</guid>
      <dc:creator>SAMSAL</dc:creator>
      <dc:date>2022-05-10T19:28:42Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343559#M233965</link>
      <description>&lt;P&gt;Sure SAMSAL, Once the table is created I would test the same with above mentioned. Which is HiveDB Table.&lt;/P&gt;</description>
      <pubDate>Wed, 11 May 2022 03:48:01 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343559#M233965</guid>
      <dc:creator>Gtec</dc:creator>
      <dc:date>2022-05-11T03:48:01Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343583#M233970</link>
      <description>&lt;P&gt;The table has been created, I have to perform Insert Statement on PutHiveStreaming Processor, Insert those Extracted Error Log Data. I am viewing results on Google and If I need any Help will get back here for sure, Thanks&lt;/P&gt;</description>
      <pubDate>Wed, 11 May 2022 09:10:34 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343583#M233970</guid>
      <dc:creator>Gtec</dc:creator>
      <dc:date>2022-05-11T09:10:34Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343631#M233983</link>
      <description>&lt;P&gt;Please help me insert this data into Hive DB (process flow). Hive doesn't accept CSV, so the data has to be converted to Avro. I am stuck on how to write the Insert statement and route it to PutHiveStreaming.&lt;/P&gt;</description>
      <pubDate>Thu, 12 May 2022 04:04:35 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343631#M233983</guid>
      <dc:creator>Gtec</dc:creator>
      <dc:date>2022-05-12T04:04:35Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343678#M233990</link>
      <description>&lt;P&gt;I have never worked with Hive DB, but if it only takes Avro format and you have CSV, you can use the ConvertRecord processor to convert a record from one format to another. In this processor you create a CSV Reader service, and the writer is Avro.&lt;/P&gt;</description>
      <pubDate>Thu, 12 May 2022 20:31:50 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343678#M233990</guid>
      <dc:creator>SAMSAL</dc:creator>
      <dc:date>2022-05-12T20:31:50Z</dc:date>
    </item>
    <item>
      <title>Re: Remove Duplicate Record values without cache services</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343685#M233994</link>
      <description>&lt;P&gt;&lt;SPAN&gt;&amp;nbsp;Sure SAMSAL, In Hive DB, I am having a table and no need for any SQL INSERT STATEMENT.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;Say HIVE DB Table has XXX, in that I have to put these Data and Error Field. Does just converting to Avro work, or do I have to call an insert statement processor?&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 13 May 2022 04:28:17 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Remove-Duplicate-Record-values-without-cache-services/m-p/343685#M233994</guid>
      <dc:creator>Gtec</dc:creator>
      <dc:date>2022-05-13T04:28:17Z</dc:date>
    </item>
  </channel>
</rss>

