<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Pig ParquetStorer is not working in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102596#M15107</link>
    <description>&lt;P&gt;i used:    &lt;/P&gt;&lt;P&gt;register parquet-pig-1.10.1.jar;&lt;BR /&gt;register parquet-encoding-1.8.2.jar;&lt;BR /&gt;register parquet-column-1.8.2.jar;&lt;BR /&gt;register parquet-common-1.8.2.jar;&lt;BR /&gt;register parquet-hadoop-1.8.2.jar;&lt;BR /&gt;register parquet-format-2.3.1.jar;&lt;/P&gt;&lt;P&gt;base =  LOAD '/XXX/yyy/archivo.parquet' USING org.apache.parquet.pig.ParquetLoader AS (&lt;/P&gt;&lt;P&gt;xxx:chararray,&lt;BR /&gt;yyyy:chararray,&lt;/P&gt;&lt;P&gt;...&lt;/P&gt;&lt;P&gt;)&lt;BR /&gt;;&lt;BR /&gt;&lt;BR /&gt;and ok&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;</description>
    <pubDate>Tue, 30 Jul 2019 07:32:04 GMT</pubDate>
    <dc:creator>rene_lobera1</dc:creator>
    <dc:date>2019-07-30T07:32:04Z</dc:date>
    <item>
      <title>Pig ParquetStorer is not working</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102591#M15102</link>
      <description>&lt;P&gt;Hi There,&lt;/P&gt;&lt;P&gt;We are getting the following error when using ParquetStorer in Pig:&lt;/P&gt;&lt;PRE&gt;ERROR org.apache.pig.PigServer - exception during parsing: Error during parsing. Cannot instantiate class org.apache.pig.builtin.ParquetStorer (parquet.pig.ParquetStorer) &lt;/PRE&gt;&lt;P&gt;We are using HDP version 2.3.4.0-3485. &lt;/P&gt;&lt;P&gt;We would appreciate it if anyone has any pointers on this.&lt;/P&gt;&lt;P&gt;Thank you,&lt;/P&gt;&lt;P&gt;Ibrahim&lt;/P&gt;</description>
      <pubDate>Fri, 15 Jan 2016 01:41:16 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102591#M15102</guid>
      <dc:creator>IbrahimJ</dc:creator>
      <dc:date>2016-01-15T01:41:16Z</dc:date>
    </item>
    <item>
      <title>Re: Pig ParquetStorer is not working</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102592#M15103</link>
      <description>&lt;P&gt;you need to download the parquet jar, upload it to the cluster and register the Parquet jar. HDP doesn't ship with Parquet out of the box. &lt;A rel="user" href="https://community.cloudera.com/users/2134/ibrahimj.html" nodeid="2134"&gt;@Ibrahim Jarrar&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="http://www.intelliwareness.org/2014/05/reading-and-writing-parquet-files-with-mortar/"&gt;here's&lt;/A&gt; an example.&lt;/P&gt;</description>
      <pubDate>Fri, 15 Jan 2016 02:13:50 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102592#M15103</guid>
      <dc:creator>aervits</dc:creator>
      <dc:date>2016-01-15T02:13:50Z</dc:date>
    </item>
    <item>
      <title>Re: Pig ParquetStorer is not working</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102593#M15104</link>
      <description>&lt;P&gt;--Register the jars &lt;/P&gt;&lt;P&gt;REGISTER lib/parquet-pig-1.3.1.jar; &lt;/P&gt;&lt;P&gt;REGISTER lib/parquet-column-1.3.1.jar; &lt;/P&gt;&lt;P&gt;REGISTER lib/parquet-common-1.3.1.jar; &lt;/P&gt;&lt;P&gt;REGISTER lib/parquet-format-2.0.0.jar; &lt;/P&gt;&lt;P&gt;REGISTER lib/parquet-hadoop-1.3.1.jar; &lt;/P&gt;&lt;P&gt;REGISTER lib/parquet-pig-1.3.1.jar; &lt;/P&gt;&lt;P&gt;REGISTER lib/parquet-encoding-1.3.1.jar;&lt;/P&gt;&lt;P&gt;
--store in parquet format &lt;/P&gt;&lt;P&gt;SET parquet.compression gzip or SNAPPY; &lt;/P&gt;&lt;P&gt;STORE table INTO '/path/to/table' USING parquet.pig.ParquetStorer; &lt;/P&gt;&lt;P&gt;-- options you might want to fiddle with &lt;/P&gt;&lt;P&gt;SET parquet.page.size 1048576 -- default. this is your min read/write unit. &lt;/P&gt;&lt;P&gt;SET parquet.block.size 134217728 -- default. your memory budget for buffering data &lt;/P&gt;&lt;P&gt;SET parquet.compression lzo -- or you can use none, gzip, snappy &lt;/P&gt;&lt;P&gt;STORE mydata into '/some/path' USING parquet.pig.ParquetStorer;
--Reading
mydata = LOAD '/some/path' USING parquet.pig.ParquetLoader  AS (x: int, y: int);&lt;/P&gt;</description>
      <pubDate>Fri, 15 Jan 2016 02:45:01 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102593#M15104</guid>
      <dc:creator>GeeKay2015</dc:creator>
      <dc:date>2016-01-15T02:45:01Z</dc:date>
    </item>
    <item>
      <title>Re: Pig ParquetStorer is not working</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102594#M15105</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/2134/ibrahimj.html" nodeid="2134"&gt;@Ibrahim Jarrar&lt;/A&gt; has this been resolved? Can you provide your solution or accept the best answer?&lt;/P&gt;</description>
      <pubDate>Wed, 03 Feb 2016 09:50:40 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102594#M15105</guid>
      <dc:creator>aervits</dc:creator>
      <dc:date>2016-02-03T09:50:40Z</dc:date>
    </item>
    <item>
      <title>Re: Pig ParquetStorer is not working</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102595#M15106</link>
      <description>&lt;P&gt;Here's a much cleaner working example tested with HDP 2.6:&lt;/P&gt;&lt;PRE&gt;wget &lt;A href="http://central.maven.org/maven2/org/apache/parquet/parquet-pig-bundle/1.8.1/parquet-pig-bundle-1.8.1.jar" target="_blank"&gt;http://central.maven.org/maven2/org/apache/parquet/parquet-pig-bundle/1.8.1/parquet-pig-bundle-1.8.1.jar&lt;/A&gt;&lt;BR /&gt;hdfs dfs -put
parquet-pig-bundle-1.8.1.jar .&lt;BR /&gt;pig -x tez&lt;BR /&gt;REGISTER
hdfs://dlm3ha/user/centos/parquet-pig-bundle-1.8.1.jar;&lt;BR /&gt;-- words is a CSV file with five fields&lt;BR /&gt;data = load 'words' using
PigStorage(',') as
(f1:chararray,f2:chararray,f3:chararray,f4:chararray,f5:chararray);&lt;BR /&gt;store data into
'hdfs://dlm3ha/user/centos/output' using &lt;STRONG&gt;org.apache.parquet&lt;/STRONG&gt;.pig.ParquetStorer;&lt;/PRE&gt;</description>
      <pubDate>Sat, 26 Aug 2017 00:07:47 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102595#M15106</guid>
      <dc:creator>aervits</dc:creator>
      <dc:date>2017-08-26T00:07:47Z</dc:date>
    </item>
    <item>
      <title>Re: Pig ParquetStorer is not working</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102596#M15107</link>
      <description>&lt;P&gt;i used:    &lt;/P&gt;&lt;P&gt;register parquet-pig-1.10.1.jar;&lt;BR /&gt;register parquet-encoding-1.8.2.jar;&lt;BR /&gt;register parquet-column-1.8.2.jar;&lt;BR /&gt;register parquet-common-1.8.2.jar;&lt;BR /&gt;register parquet-hadoop-1.8.2.jar;&lt;BR /&gt;register parquet-format-2.3.1.jar;&lt;/P&gt;&lt;P&gt;base =  LOAD '/XXX/yyy/archivo.parquet' USING org.apache.parquet.pig.ParquetLoader AS (&lt;/P&gt;&lt;P&gt;xxx:chararray,&lt;BR /&gt;yyyy:chararray,&lt;/P&gt;&lt;P&gt;...&lt;/P&gt;&lt;P&gt;)&lt;BR /&gt;;&lt;BR /&gt;&lt;BR /&gt;and ok&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 30 Jul 2019 07:32:04 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Pig-ParquetStorer-is-not-working/m-p/102596#M15107</guid>
      <dc:creator>rene_lobera1</dc:creator>
      <dc:date>2019-07-30T07:32:04Z</dc:date>
    </item>
  </channel>
</rss>

