<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: pyspark example? in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150726#M24114</link>
    <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/3017/erik.html" nodeid="3017"&gt;@Erik Putrycz&lt;/A&gt; To use pyspark, you need to copy the Python file to HDFS and specify the HDFS path of the Python file in the &amp;lt;jar&amp;gt; tag:&lt;/P&gt;&lt;P&gt;"&amp;lt;jar&amp;gt;${nameNode}/user/ambari-qa/examples/apps/spark/lib/pi.py&amp;lt;/jar&amp;gt;"&lt;/P&gt;&lt;P&gt;You also need to export SPARK_HOME in your hadoop-env.sh.&lt;/P&gt;</description>
    <pubDate>Fri, 01 Apr 2016 11:48:30 GMT</pubDate>
    <dc:creator>mramasami</dc:creator>
    <dc:date>2016-04-01T11:48:30Z</dc:date>
    <item>
      <title>pyspark example?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150723#M24111</link>
      <description>&lt;P&gt;Is there anywhere a full example of a pyspark workflow with oozie? I found examples for java spark workflows but I am not sure how to transpose them with HDP and pyspark.&lt;/P&gt;</description>
      <pubDate>Thu, 31 Mar 2016 11:34:22 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150723#M24111</guid>
      <dc:creator>erik1</dc:creator>
      <dc:date>2016-03-31T11:34:22Z</dc:date>
    </item>
    <item>
      <title>Re: pyspark example?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150724#M24112</link>
      <description>&lt;P&gt;The Oozie Spark action is available in the community, but Hortonworks does not provide support for the Spark action in HDP 2.4 or below. As soon as it's available, there will be examples of pyspark in Oozie.&lt;/P&gt;</description>
      <pubDate>Thu, 31 Mar 2016 11:50:10 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150724#M24112</guid>
      <dc:creator>aervits</dc:creator>
      <dc:date>2016-03-31T11:50:10Z</dc:date>
    </item>
    <item>
      <title>Re: pyspark example?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150725#M24113</link>
      <description>&lt;P&gt;I did not get any errors in a job with this &lt;A href="http://oozie.apache.org/docs/4.2.0/DG_SparkActionExtension.html" target="_blank"&gt;http://oozie.apache.org/docs/4.2.0/DG_SparkActionExtension.html&lt;/A&gt;, but it certainly is not obvious how to use it for pyspark.&lt;/P&gt;</description>
      <pubDate>Fri, 01 Apr 2016 08:13:11 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150725#M24113</guid>
      <dc:creator>erik1</dc:creator>
      <dc:date>2016-04-01T08:13:11Z</dc:date>
    </item>
    <item>
      <title>Re: pyspark example?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150726#M24114</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/3017/erik.html" nodeid="3017"&gt;@Erik Putrycz&lt;/A&gt; To use pyspark, you need to copy the Python file to HDFS and specify the HDFS path of the Python file in the &amp;lt;jar&amp;gt; tag:&lt;/P&gt;&lt;P&gt;"&amp;lt;jar&amp;gt;${nameNode}/user/ambari-qa/examples/apps/spark/lib/pi.py&amp;lt;/jar&amp;gt;"&lt;/P&gt;&lt;P&gt;You also need to export SPARK_HOME in your hadoop-env.sh.&lt;/P&gt;</description>
      <pubDate>Fri, 01 Apr 2016 11:48:30 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150726#M24114</guid>
      <dc:creator>mramasami</dc:creator>
      <dc:date>2016-04-01T11:48:30Z</dc:date>
    </item>
    <item>
      <title>Re: pyspark example?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150727#M24115</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/3017/erik.html" nodeid="3017"&gt;@Erik Putrycz&lt;/A&gt; I added a pyspark workflow example at &lt;A href="https://github.com/dbist/oozie/tree/master/apps/pyspark" target="_blank"&gt;https://github.com/dbist/oozie/tree/master/apps/pyspark&lt;/A&gt;; it works with HDFS HA, RM HA, Oozie HA, and Kerberos.&lt;/P&gt;</description>
      <pubDate>Fri, 17 Feb 2017 02:00:13 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150727#M24115</guid>
      <dc:creator>aervits</dc:creator>
      <dc:date>2017-02-17T02:00:13Z</dc:date>
    </item>
    <item>
      <title>Re: pyspark example?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150728#M24116</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/3017/erik.html" nodeid="3017"&gt;@Erik Putrycz&lt;/A&gt; additionally, I added a tutorial here &lt;A href="https://community.hortonworks.com/articles/84071/apache-ambari-workflow-manager-view-for-apache-ooz-2.html" target="_blank"&gt;https://community.hortonworks.com/articles/84071/apache-ambari-workflow-manager-view-for-apache-ooz-2.html&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 17 Feb 2017 05:07:34 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/pyspark-example/m-p/150728#M24116</guid>
      <dc:creator>aervits</dc:creator>
      <dc:date>2017-02-17T05:07:34Z</dc:date>
    </item>
  </channel>
</rss>

