<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Pig- fragment-replicate join in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184182#M61658</link>
    <description>&lt;P&gt;Hi Lester Martin,&lt;/P&gt;&lt;P&gt;Thanks for your reply, but I am still not clear. &lt;/P&gt;&lt;P&gt;Is my understanding of this correct or not? &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt;  Please let me know on the same.&lt;/P&gt;</description>
    <pubDate>Wed, 24 May 2017 22:36:08 GMT</pubDate>
    <dc:creator>SatishS</dc:creator>
    <dc:date>2017-05-24T22:36:08Z</dc:date>
    <item>
      <title>Pig- fragment-replicate join</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184180#M61656</link>
      <description>&lt;P&gt;Hi Friends,&lt;/P&gt;&lt;P&gt;I have a question regarding the Pig fragment-replicate join. Could you please let me know whether my understanding (below) is correct or not?&lt;/P&gt;&lt;P&gt;I have two files, File A (400MB) and File B (50MB). When I join these two files using the keyword "replicated", the small file, i.e. File B, is loaded into memory (because it's a small file), and during the join with File A (as File A is 400MB and it's distributed in the Hadoop cluster with 4 blocks - 3*128MB and 16MB) Pig will load only parts of File A (one block at a time) into memory for the join with File B, and once it's done, it will load the next block and so on.&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;Satish.&lt;/P&gt;</description>
      <pubDate>Wed, 24 May 2017 05:52:51 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184180#M61656</guid>
      <dc:creator>SatishS</dc:creator>
      <dc:date>2017-05-24T05:52:51Z</dc:date>
    </item>
    <item>
      <title>Re: Pig- fragment-replicate join</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184181#M61657</link>
      <description>&lt;P&gt;Yep, as &lt;A href="http://pig.apache.org/docs/r0.14.0/perf.html#replicated-joins" target="_blank"&gt;http://pig.apache.org/docs/r0.14.0/perf.html#replicated-joins&lt;/A&gt; details it, you have the gist of what's happening here.  The (obvious) goal is to do a map-side join instead of doing a more classical reduce-side join.&lt;/P&gt;</description>
      <pubDate>Wed, 24 May 2017 22:18:09 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184181#M61657</guid>
      <dc:creator>LesterMartin</dc:creator>
      <dc:date>2017-05-24T22:18:09Z</dc:date>
    </item>
    <item>
      <title>Re: Pig- fragment-replicate join</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184182#M61658</link>
      <description>&lt;P&gt;Hi Lester Martin,&lt;/P&gt;&lt;P&gt;Thanks for your reply, but I am still not clear. &lt;/P&gt;&lt;P&gt;Is my understanding of this correct or not? &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt;  Please let me know on the same.&lt;/P&gt;</description>
      <pubDate>Wed, 24 May 2017 22:36:08 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184182#M61658</guid>
      <dc:creator>SatishS</dc:creator>
      <dc:date>2017-05-24T22:36:08Z</dc:date>
    </item>
    <item>
      <title>Re: Pig- fragment-replicate join</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184183#M61659</link>
      <description>&lt;P&gt;Correct, File B will be loaded into memory and used in that context for each block of File A that is processed independent of each other.&lt;/P&gt;</description>
      <pubDate>Thu, 25 May 2017 01:25:39 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184183#M61659</guid>
      <dc:creator>LesterMartin</dc:creator>
      <dc:date>2017-05-25T01:25:39Z</dc:date>
    </item>
    <item>
      <title>Re: Pig- fragment-replicate join</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184184#M61660</link>
      <description>&lt;P&gt;Thanks Lester.&lt;/P&gt;</description>
      <pubDate>Thu, 25 May 2017 06:02:20 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-fragment-replicate-join/m-p/184184#M61660</guid>
      <dc:creator>SatishS</dc:creator>
      <dc:date>2017-05-25T06:02:20Z</dc:date>
    </item>
  </channel>
</rss>

