<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Skew issue in spark sql in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Skew-issue-in-spark-sql/m-p/232523#M194361</link>
    <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I am joining two tables, and one of them is skewed. How can I handle this in Spark SQL? I am using Spark 2.2.1 on AWS EMR. &lt;/P&gt;&lt;P&gt;Please assist with this.&lt;/P&gt;</description>
    <pubDate>Tue, 28 Aug 2018 18:43:57 GMT</pubDate>
    <dc:creator>elango_rk</dc:creator>
    <dc:date>2018-08-28T18:43:57Z</dc:date>
    <item>
      <title>Skew issue in spark sql</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Skew-issue-in-spark-sql/m-p/232523#M194361</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I am joining two tables, and one of them is skewed. How can I handle this in Spark SQL? I am using Spark 2.2.1 on AWS EMR. &lt;/P&gt;&lt;P&gt;Please assist with this.&lt;/P&gt;</description>
      <pubDate>Tue, 28 Aug 2018 18:43:57 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Skew-issue-in-spark-sql/m-p/232523#M194361</guid>
      <dc:creator>elango_rk</dc:creator>
      <dc:date>2018-08-28T18:43:57Z</dc:date>
    </item>
    <item>
      <title>Re: Skew issue in spark sql</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Skew-issue-in-spark-sql/m-p/232524#M194362</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/24259/elangork.html" nodeid="24259"&gt;@elango vaithiyanathan&lt;/A&gt; &lt;/P&gt;&lt;P&gt;Perhaps you could pick another way to partition your data: by a different column where the data is (hopefully) distributed evenly.&lt;/P&gt;&lt;P&gt;Or else you could build an artificial (numeric) column by salting, and partition by this column.&lt;/P&gt;&lt;P&gt;HTH&lt;/P&gt;&lt;P&gt;*** If you found this answer addressed your question, please take a moment to log in and click the "accept" link on the answer.&lt;/P&gt;</description>
      <pubDate>Tue, 28 Aug 2018 19:10:00 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Skew-issue-in-spark-sql/m-p/232524#M194362</guid>
      <dc:creator>falbani</dc:creator>
      <dc:date>2018-08-28T19:10:00Z</dc:date>
    </item>
    <item>
      <title>Re: Skew issue in spark sql</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Skew-issue-in-spark-sql/m-p/232525#M194363</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/11048/falbani.html" nodeid="11048"&gt;@Felix Albani&lt;/A&gt; Thank you.&lt;/P&gt;</description>
      <pubDate>Tue, 28 Aug 2018 19:22:21 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Skew-issue-in-spark-sql/m-p/232525#M194363</guid>
      <dc:creator>elango_rk</dc:creator>
      <dc:date>2018-08-28T19:22:21Z</dc:date>
    </item>
  </channel>
</rss>

