<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question NiFi CRON read mutliple times in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206320#M59781</link>
    <description>&lt;P&gt;I am using a GetHDFS Processor with CRON driven strategy : scheduled to run every day at 10am.&lt;/P&gt;&lt;P&gt;I have one input file to read but when the dataflow starts it gets the source file multiple times instead of 1 time (9 times in my case). Why?&lt;/P&gt;&lt;P&gt;As a result, when I write the output dataflow, I get the following warning : file with same name already exists&lt;/P&gt;&lt;P&gt;Should I modify the parameter Polling Interval ? (set to 0 sec by default)&lt;/P&gt;</description>
    <pubDate>Thu, 20 Apr 2017 21:39:37 GMT</pubDate>
    <dc:creator>raphamarymtl</dc:creator>
    <dc:date>2017-04-20T21:39:37Z</dc:date>
    <item>
      <title>NiFi CRON read mutliple times</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206320#M59781</link>
      <description>&lt;P&gt;I am using a GetHDFS Processor with CRON driven strategy : scheduled to run every day at 10am.&lt;/P&gt;&lt;P&gt;I have one input file to read but when the dataflow starts it gets the source file multiple times instead of 1 time (9 times in my case). Why?&lt;/P&gt;&lt;P&gt;As a result, when I write the output dataflow, I get the following warning : file with same name already exists&lt;/P&gt;&lt;P&gt;Should I modify the parameter Polling Interval ? (set to 0 sec by default)&lt;/P&gt;</description>
      <pubDate>Thu, 20 Apr 2017 21:39:37 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206320#M59781</guid>
      <dc:creator>raphamarymtl</dc:creator>
      <dc:date>2017-04-20T21:39:37Z</dc:date>
    </item>
    <item>
      <title>Re: NiFi CRON read mutliple times</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206321#M59782</link>
      <description>&lt;A rel="user" href="https://community.cloudera.com/users/13246/raphamarymtl.html" nodeid="13246"&gt;@Raphaël MARY&lt;/A&gt;&lt;P&gt;What does your cron run schedule look like?&lt;/P&gt;</description>
      <pubDate>Thu, 20 Apr 2017 21:44:53 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206321#M59782</guid>
      <dc:creator>Wynner</dc:creator>
      <dc:date>2017-04-20T21:44:53Z</dc:date>
    </item>
    <item>
      <title>Re: NiFi CRON read mutliple times</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206322#M59783</link>
      <description>&lt;P&gt;Run schedule : * * 10 * * ?&lt;/P&gt;</description>
      <pubDate>Thu, 20 Apr 2017 21:47:03 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206322#M59783</guid>
      <dc:creator>raphamarymtl</dc:creator>
      <dc:date>2017-04-20T21:47:03Z</dc:date>
    </item>
    <item>
      <title>Re: NiFi CRON read mutliple times</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206323#M59784</link>
      <description>&lt;P&gt;Hi &lt;A rel="user" href="https://community.cloudera.com/users/13246/raphamarymtl.html" nodeid="13246"&gt;@Raphaël MARY&lt;/A&gt;,&lt;/P&gt;&lt;P&gt;Did you set a different value for number of concurrent tasks?&lt;/P&gt;&lt;P&gt;Are you in a cluster configuration?&lt;/P&gt;</description>
      <pubDate>Thu, 20 Apr 2017 21:56:21 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206323#M59784</guid>
      <dc:creator>pvillard</dc:creator>
      <dc:date>2017-04-20T21:56:21Z</dc:date>
    </item>
    <item>
      <title>Re: NiFi CRON read mutliple times</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206324#M59785</link>
      <description>&lt;P&gt;No, only one node and 1 concurrent task.&lt;/P&gt;&lt;P&gt;I changed to 0 0 10 * * ?  in order to specify minutes and seconds.&lt;/P&gt;&lt;P&gt;It is working now!&lt;/P&gt;</description>
      <pubDate>Thu, 20 Apr 2017 22:03:02 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206324#M59785</guid>
      <dc:creator>raphamarymtl</dc:creator>
      <dc:date>2017-04-20T22:03:02Z</dc:date>
    </item>
    <item>
      <title>Re: NiFi CRON read mutliple times</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206325#M59786</link>
      <description>&lt;A rel="user" href="https://community.cloudera.com/users/13246/raphamarymtl.html" nodeid="13246"&gt;@Raphaël MARY&lt;/A&gt;&lt;P&gt;If you are running a NiFi cluster, by default every node in your cluster will be running this getHDFS processor at 10 am each day.  This means every node will be getting a copy of the same files and processing them in the same way.&lt;/P&gt;&lt;P&gt;If you are running a cluster, consider changing the configuration of your getHDFS processor so it runs on primary node only.&lt;/P&gt;</description>
      <pubDate>Thu, 20 Apr 2017 22:04:42 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206325#M59786</guid>
      <dc:creator>MattWho</dc:creator>
      <dc:date>2017-04-20T22:04:42Z</dc:date>
    </item>
    <item>
      <title>Re: NiFi CRON read mutliple times</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206326#M59787</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/13246/raphamarymtl.html" nodeid="13246"&gt;@Raphaël MARY&lt;/A&gt; &lt;/P&gt;&lt;P&gt;Try setting the cron run schedule to 0 0 10 * * ? instead.&lt;/P&gt;&lt;P&gt;The reason the other cron schedule grabbed the same file multiple times is because the * * for second and minutes meant run every second and every minute for that hour.&lt;/P&gt;</description>
      <pubDate>Thu, 20 Apr 2017 22:16:04 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206326#M59787</guid>
      <dc:creator>Wynner</dc:creator>
      <dc:date>2017-04-20T22:16:04Z</dc:date>
    </item>
    <item>
      <title>Re: NiFi CRON read mutliple times</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206327#M59788</link>
      <description>&lt;P&gt;Possibility to run every second or minute.  In reality this means run as often as possible using the allowable number of concurrent tasks during the 10th hour  of each day.  In your case it sounds like it was able to run at least 10 times in that one hour.&lt;/P&gt;</description>
      <pubDate>Thu, 20 Apr 2017 22:18:02 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/NiFi-CRON-read-mutliple-times/m-p/206327#M59788</guid>
      <dc:creator>MattWho</dc:creator>
      <dc:date>2017-04-20T22:18:02Z</dc:date>
    </item>
  </channel>
</rss>

