<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Problem when trying to convert parquet file in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398162#M250117</link>
    <description>&lt;P&gt;Sure. If you come up with a solution different from what I suggested, please do post about it so it can help others who might run into a similar situation. Good luck!&lt;/P&gt;</description>
    <pubDate>Wed, 27 Nov 2024 19:12:42 GMT</pubDate>
    <dc:creator>SAMSAL</dc:creator>
    <dc:date>2024-11-27T19:12:42Z</dc:date>
    <item>
      <title>Problem when trying to convert parquet file</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398033#M250039</link>
      <description>&lt;P&gt;hello,&lt;BR /&gt;I'm trying to read a parquet file using the ConvertRecord processor and I'm getting the error:&lt;BR /&gt;&lt;BR /&gt;&lt;EM&gt;ConvertRecord[id=e599cd8f-9a1d-3134-4daf-af7bc91cdd57] Failed to process FlowFile[filename=objectTable_tract_5074_DC2_2_2i_runs_DP0_2_v23_0_1_PREOPS-905_step3_31_20220314T212509Z-part0_output.parquet]; will route to failure: org.apache.avro.SchemaParseException: Illegal initial character: 0&lt;/EM&gt;&lt;BR /&gt;&lt;BR /&gt;In my file the columns are numeric and the first one starts with 0 (zero).&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 26 Nov 2024 13:20:14 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398033#M250039</guid>
      <dc:creator>alecssander</dc:creator>
      <dc:date>2024-11-26T13:20:14Z</dc:date>
    </item>
    <item>
      <title>Re: Problem when trying to convert parquet file</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398035#M250040</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/121841"&gt;@alecssander&lt;/a&gt;&amp;nbsp;Welcome to the Cloudera Community!&lt;BR /&gt;&lt;BR /&gt;To help you get the best possible solution, I have tagged our NiFi experts&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/35454"&gt;@MattWho&lt;/a&gt;&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/80381"&gt;@SAMSAL&lt;/a&gt;&amp;nbsp; who may be able to assist you further.&lt;BR /&gt;&lt;BR /&gt;Please keep us updated on your post, and we hope you find a satisfactory solution to your query.&lt;/P&gt;</description>
      <pubDate>Tue, 26 Nov 2024 15:11:20 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398035#M250040</guid>
      <dc:creator>DianaTorres</dc:creator>
      <dc:date>2024-11-26T15:11:20Z</dc:date>
    </item>
    <item>
      <title>Re: Problem when trying to convert parquet file</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398042#M250043</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;Can you provide more explanation or a screenshot of your dataflow and the configuration set on each processor/controller service? Also, if you can provide sample data that can be converted to Parquet and reproduces the error, that would be helpful as well.&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;</description>
      <pubDate>Tue, 26 Nov 2024 18:52:27 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398042#M250043</guid>
      <dc:creator>SAMSAL</dc:creator>
      <dc:date>2024-11-26T18:52:27Z</dc:date>
    </item>
    <item>
      <title>Re: Problem when trying to convert parquet file</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398049#M250047</link>
      <description>&lt;P&gt;The process is simple: I take a parquet file from a bucket and try to insert it into a PostgreSQL database:&lt;BR /&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="alecssander_0-1732653085450.png" style="width: 400px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/42810iD88235802EC1AAB3/image-size/medium?v=v2&amp;amp;px=400" role="button" title="alecssander_0-1732653085450.png" alt="alecssander_0-1732653085450.png" /&gt;&lt;/span&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="alecssander_2-1732653358222.png" style="width: 400px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/42812iF62D7ED468C7C8BD/image-size/medium?v=v2&amp;amp;px=400" role="button" title="alecssander_2-1732653358222.png" alt="alecssander_2-1732653358222.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;My file has 301 columns ranging from 0 to 300 with more than 280 lines:&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="alecssander_1-1732653296212.png" style="width: 400px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/42811i224A21EDEDA60667/image-size/medium?v=v2&amp;amp;px=400" role="button" title="alecssander_1-1732653296212.png" alt="alecssander_1-1732653296212.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 26 Nov 2024 20:37:25 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398049#M250047</guid>
      <dc:creator>alecssander</dc:creator>
      <dc:date>2024-11-26T20:37:25Z</dc:date>
    </item>
    <item>
      <title>Re: Problem when trying to convert parquet file</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398050#M250048</link>
      <description>&lt;P&gt;It seems like whenever dealing with parquet reader\writer services, those services are trying to use Avro schema, possibly to make sense of the data when passing it along to the target processors (like PutDatabaseRecord), since parquet is in binary format. The problem with this is that Avro has limitations on how fields can be named. Actually this is reported as a bug in &lt;A href="https://issues.apache.org/jira/browse/AVRO-153" target="_self"&gt;Jira&lt;/A&gt; but it doesn't seem to have been resolved. According to the ticket, Avro field names must start with one of the following characters: &lt;SPAN class="error"&gt;[A-Za-z_]&lt;/SPAN&gt;. Given this, it seems you have to think of some workaround to address this issue since NiFi doesn't provide a solution out of the box. You can check my answer to this &lt;A href="https://community.cloudera.com/t5/Support-Questions/Put-data-from-Parquet-files-into-DynamoDB-with-NiFi/m-p/379313?lightbox-message-images-379622=39009i2550927E3D25C611" target="_self"&gt;post&lt;/A&gt; as an option. Basically, you can use Python to read the parquet content and convert it to another format (CSV, for example), then pass the CSV to the PutDatabaseRecord. This should work as I have tested it. Since you seem to be using NiFi 2.0, you can develop a Python extension processor for this instead of the ExecuteStreamCommand mentioned in the post.&lt;/P&gt;&lt;P&gt;Hope that helps. If it does, please accept the solution.&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 26 Nov 2024 22:04:28 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398050#M250048</guid>
      <dc:creator>SAMSAL</dc:creator>
      <dc:date>2024-11-26T22:04:28Z</dc:date>
    </item>
    <item>
      <title>Re: Problem when trying to convert parquet file</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398157#M250116</link>
      <description>&lt;P&gt;Thanks for the support&lt;/P&gt;</description>
      <pubDate>Wed, 27 Nov 2024 17:20:46 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398157#M250116</guid>
      <dc:creator>alecssander</dc:creator>
      <dc:date>2024-11-27T17:20:46Z</dc:date>
    </item>
    <item>
      <title>Re: Problem when trying to convert parquet file</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398162#M250117</link>
      <description>&lt;P&gt;Sure. If you come up with a solution different from what I suggested, please do post about it so it can help others who might run into a similar situation. Good luck!&lt;/P&gt;</description>
      <pubDate>Wed, 27 Nov 2024 19:12:42 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398162#M250117</guid>
      <dc:creator>SAMSAL</dc:creator>
      <dc:date>2024-11-27T19:12:42Z</dc:date>
    </item>
    <item>
      <title>Re: Problem when trying to convert parquet file</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398605#M250254</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/121841"&gt;@alecssander&lt;/a&gt;&amp;nbsp;Has the reply helped resolve your issue? If so, please mark the appropriate reply as the solution, as it will make it easier for others to find the answer in the future.&amp;nbsp; Thanks.&lt;/P&gt;</description>
      <pubDate>Tue, 10 Dec 2024 01:02:48 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Problem-when-trying-to-convert-parquet-file/m-p/398605#M250254</guid>
      <dc:creator>DianaTorres</dc:creator>
      <dc:date>2024-12-10T01:02:48Z</dc:date>
    </item>
  </channel>
</rss>

