<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Change default output filename part-r-00000.snappy.parquet in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371164#M240911</link>
    <description>&lt;P&gt;this is possible,please try parquet,instead of csv&lt;/P&gt;</description>
    <pubDate>Fri, 19 May 2023 08:17:57 GMT</pubDate>
    <dc:creator>asish</dc:creator>
    <dc:date>2023-05-19T08:17:57Z</dc:date>
    <item>
      <title>Change default output filename part-r-00000.snappy.parquet</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371145#M240901</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I am trying to run a mapreduce job and output it to a folder. Is there any way to change the default filename? My default filename is&amp;nbsp;part-r-00000.snappy.parquet and I want to add a date to this. Is this possible?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Is there a parameter to change this? Thank you.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 19 May 2023 01:21:58 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371145#M240901</guid>
      <dc:creator>Josh2023</dc:creator>
      <dc:date>2023-05-19T01:21:58Z</dc:date>
    </item>
    <item>
      <title>Re: Change default output filename part-r-00000.snappy.parquet</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371152#M240904</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/105136"&gt;@Josh2023&lt;/a&gt;,&amp;nbsp;Welcome to our community! To help you get the best possible answer, I have tagged our MapR experts&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/71090"&gt;@asish&lt;/a&gt;&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/36139"&gt;@mugdha&lt;/a&gt;&amp;nbsp; who may be able to assist you further.&lt;BR /&gt;&lt;BR /&gt;Please feel free to provide any additional information or details about your query, and we hope that you will find a satisfactory solution to your question.&lt;/P&gt;</description>
      <pubDate>Fri, 19 May 2023 06:11:09 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371152#M240904</guid>
      <dc:creator>VidyaSargur</dc:creator>
      <dc:date>2023-05-19T06:11:09Z</dc:date>
    </item>
    <item>
      <title>Re: Change default output filename part-r-00000.snappy.parquet</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371154#M240906</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/105136"&gt;@Josh2023&lt;/a&gt;&amp;nbsp; can you try below:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN class="hljs-keyword"&gt;SET&lt;/SPAN&gt;&lt;SPAN&gt; hive.exec.compress.output&lt;/SPAN&gt;&lt;SPAN class="hljs-operator"&gt;=&lt;/SPAN&gt;&lt;SPAN class="hljs-literal"&gt;false&lt;/SPAN&gt;&lt;SPAN&gt;; &lt;/SPAN&gt;&lt;SPAN class="hljs-keyword"&gt;SET&lt;/SPAN&gt;&lt;SPAN&gt; hive.exec.dynamic.partition.mode&lt;/SPAN&gt;&lt;SPAN class="hljs-operator"&gt;=&lt;/SPAN&gt;&lt;SPAN&gt;nonstrict; &lt;/SPAN&gt;&lt;SPAN class="hljs-comment"&gt;-- Create a temporary table or select data from existing tables&lt;/SPAN&gt; &lt;SPAN class="hljs-keyword"&gt;INSERT&lt;/SPAN&gt;&lt;SPAN&gt; OVERWRITE DIRECTORY &lt;/SPAN&gt;&lt;SPAN class="hljs-string"&gt;'/path/to/output_directory/filename_'&lt;/SPAN&gt; &lt;SPAN class="hljs-operator"&gt;||&lt;/SPAN&gt;&lt;SPAN&gt; from_unixtime(unix_timestamp(), &lt;/SPAN&gt;&lt;SPAN class="hljs-string"&gt;'yyyyMMdd'&lt;/SPAN&gt;&lt;SPAN&gt;) &lt;/SPAN&gt;&lt;SPAN class="hljs-operator"&gt;||&lt;/SPAN&gt; &lt;SPAN class="hljs-string"&gt;'.csv'&lt;/SPAN&gt; &lt;SPAN class="hljs-keyword"&gt;SELECT&lt;/SPAN&gt; &lt;SPAN class="hljs-operator"&gt;*&lt;/SPAN&gt; &lt;SPAN class="hljs-keyword"&gt;FROM&lt;/SPAN&gt;&lt;SPAN&gt; your_table;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 19 May 2023 06:14:52 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371154#M240906</guid>
      <dc:creator>asish</dc:creator>
      <dc:date>2023-05-19T06:14:52Z</dc:date>
    </item>
    <item>
      <title>Re: Change default output filename part-r-00000.snappy.parquet</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371160#M240909</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/105136"&gt;@Josh2023&lt;/a&gt;&amp;nbsp;could you please accept this as the solution if it has fixed your issue?&lt;/P&gt;</description>
      <pubDate>Fri, 19 May 2023 07:16:36 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371160#M240909</guid>
      <dc:creator>asish</dc:creator>
      <dc:date>2023-05-19T07:16:36Z</dc:date>
    </item>
    <item>
      <title>Re: Change default output filename part-r-00000.snappy.parquet</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371163#M240910</link>
      <description>&lt;P&gt;Hello&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/71090"&gt;@asish&lt;/a&gt;, thanks for the answer. Unfortunately, my output is already in parquet format.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;The example below is the usual output of my mapreduce job:&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;&lt;SPAN&gt;part-r-00000.snappy.parquet&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I need to use the format below, for example:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;part-r-00000.2023-05-19-04-09.snappy.parquet&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;Is this possible?&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 19 May 2023 08:09:33 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371163#M240910</guid>
      <dc:creator>Josh2023</dc:creator>
      <dc:date>2023-05-19T08:09:33Z</dc:date>
    </item>
    <item>
      <title>Re: Change default output filename part-r-00000.snappy.parquet</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371164#M240911</link>
      <description>&lt;P&gt;this is possible,please try parquet,instead of csv&lt;/P&gt;</description>
      <pubDate>Fri, 19 May 2023 08:17:57 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371164#M240911</guid>
      <dc:creator>asish</dc:creator>
      <dc:date>2023-05-19T08:17:57Z</dc:date>
    </item>
    <item>
      <title>Re: Change default output filename part-r-00000.snappy.parquet</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371647#M241041</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/105136"&gt;@Josh2023&lt;/a&gt;&amp;nbsp;Has the reply helped resolve your issue? If so, please mark the appropriate reply as the solution, as it will make it easier for others to find the answer in the future. Thanks.&lt;/P&gt;</description>
      <pubDate>Mon, 29 May 2023 12:19:39 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/371647#M241041</guid>
      <dc:creator>DianaTorres</dc:creator>
      <dc:date>2023-05-29T12:19:39Z</dc:date>
    </item>
    <item>
      <title>Re: Change default output filename part-r-00000.snappy.parquet</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/372193#M241178</link>
      <description>&lt;P&gt;Since the output file is .parquet, I assume you're using ParquetOutputFormat in the MR job config. In that case the ParquetOutputFormat.setOutputName&amp;nbsp;method will help to set the base name of the output file.&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;&amp;nbsp;Ref -&lt;BR /&gt;&lt;A href="https://www.javadoc.io/doc/org.apache.parquet/parquet-hadoop/1.12.2/org/apache/parquet/hadoop/ParquetOutputFormat.html" target="_blank"&gt;https://www.javadoc.io/doc/org.apache.parquet/parquet-hadoop/1.12.2/org/apache/parquet/hadoop/ParquetOutputFormat.html&lt;/A&gt;&lt;BR /&gt;&lt;A href="https://hadoop.apache.org/docs/r2.8.0/api/org/apache/hadoop/mapreduce/lib/output/FileOutputFormat.html#setOutputName(org.apache.hadoop.mapreduce.JobContext,%20java.lang.String)" target="_blank"&gt;https://hadoop.apache.org/docs/r2.8.0/api/org/apache/hadoop/mapreduce/lib/output/FileOutputFormat.html#setOutputName(org.apache.hadoop.mapreduce.JobContext,%20java.lang.String)&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 06 Jun 2023 12:13:16 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/372193#M241178</guid>
      <dc:creator>ggangadharan</dc:creator>
      <dc:date>2023-06-06T12:13:16Z</dc:date>
    </item>
    <item>
      <title>Re: Change default output filename part-r-00000.snappy.parquet</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/372208#M241180</link>
      <description>&lt;P&gt;mapreduce.output.basename also works, since setOutputName simply sets that same property.&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;Code snippet from&amp;nbsp;ParquetOutputFormat.&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;    protected static void setOutputName(JobContext job, String name) {
        job.getConfiguration().set("mapreduce.output.basename", name);
    }&lt;/LI-CODE&gt;&lt;P&gt;&lt;BR /&gt;JOB CONF -&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt; Configuration conf = getConf();
 conf.set("mapreduce.output.basename","parquet_output");&lt;/LI-CODE&gt;&lt;P&gt;&lt;BR /&gt;Output&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;[hive@c1757-node3 ~]$ hdfs dfs -ls /tmp/parquet-sample
Found 4 items
-rw-r--r--   2 hive supergroup          0 2023-06-06 17:08 /tmp/parquet-sample/_SUCCESS
-rw-r--r--   2 hive supergroup        271 2023-06-06 17:08 /tmp/parquet-sample/_common_metadata
-rw-r--r--   2 hive supergroup       1791 2023-06-06 17:08 /tmp/parquet-sample/_metadata
-rw-r--r--   2 hive supergroup       2508 2023-06-06 17:08 /tmp/parquet-sample/parquet_output-m-00000.parquet&lt;/LI-CODE&gt;&lt;P&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 06 Jun 2023 17:14:56 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/372208#M241180</guid>
      <dc:creator>ggangadharan</dc:creator>
      <dc:date>2023-06-06T17:14:56Z</dc:date>
    </item>
    <item>
      <title>Re: Change default output filename part-r-00000.snappy.parquet</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/372399#M241243</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/105136"&gt;@Josh2023&lt;/a&gt;&amp;nbsp;Has the reply helped resolve your issue? If so, please mark the appropriate reply as the solution, as it will make it easier for others to find the answer in the future. Thanks.&lt;/P&gt;</description>
      <pubDate>Fri, 09 Jun 2023 18:59:27 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Change-default-output-filename-part-r-00000-snappy-parquet/m-p/372399#M241243</guid>
      <dc:creator>DianaTorres</dc:creator>
      <dc:date>2023-06-09T18:59:27Z</dc:date>
    </item>
  </channel>
</rss>

