<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Morphline ReadAvroParquetFile timestamp problem in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Morphline-ReadAvroParquetFile-timestamp-problem/m-p/23665#M4610</link>
    <description>&lt;P&gt;Hi all, I'm using the following morphline to index some Parquet files:&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;morphlines : [
  {
    id : morphline1
    importCommands : ["org.kitesdk.**","org.apache.solr.**"]
    commands : [
      {
        readAvroParquetFile {
          projectionSchemaString : """
            {
              "name": "record_parquet",
              "namespace": "parquet.avro",
              "type": "record",
              "fields": [
                { "name": "id", "type":["null", "string"] },
                { "name": "date_time", "type":["null", "string" ]},
                { "name": "sessionid", "type": ["null","string" ]},
                { "name": "client_id", "type": ["null","string" ]}
              ]
            }
          """
          # supportedMimeTypes : [avro/binary]
          # projectionSchemaString : "" # optional, avro json schema blurb for getSchema()
          # projectionSchemaFile : /path/to/syslog.avsc
        }
      }
      {
        extractAvroPaths {
          flatten : true
          paths : {
            id : /id
            date_time : "/date_time"
            session_id : /sessionid
            client_id : /client_id
          }
        }
      }
      {
        addValues {
          # add values "text/log" and "text/log2" to the source_type output field
          Channel : [canal]
        }
      }
      {
        logDebug { format : "output record: {}", args : ["@{}"] }
      }
      # load the record into a Solr server or MapReduce Reducer
      {
        loadSolr {
          solrLocator : {
            collection : parquet_test # Name of solr collection
            zkHost : "$IP:2181/solr" # ZooKeeper ensemble
            batchSize : 1000 # batchSize
          }
        }
      }
    ]
  }
]&lt;/PRE&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Everything is going well except for the fact that the date_time field (already in Solr format, and of date type in schema.xml) is converted to Unix epoch format. Any idea why? Thanks in advance.&lt;/P&gt;</description>
    <pubDate>Fri, 16 Sep 2022 09:19:04 GMT</pubDate>
    <dc:creator>fkrantz</dc:creator>
    <dc:date>2022-09-16T09:19:04Z</dc:date>
    <item>
      <title>Morphline ReadAvroParquetFile timestamp problem</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Morphline-ReadAvroParquetFile-timestamp-problem/m-p/23665#M4610</link>
      <description>&lt;P&gt;Hi all, I'm using the following morphline to index some Parquet files:&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;PRE&gt;morphlines : [
  {
    id : morphline1
    importCommands : ["org.kitesdk.**","org.apache.solr.**"]
    commands : [
      {
        readAvroParquetFile {
          projectionSchemaString : """
            {
              "name": "record_parquet",
              "namespace": "parquet.avro",
              "type": "record",
              "fields": [
                { "name": "id", "type":["null", "string"] },
                { "name": "date_time", "type":["null", "string" ]},
                { "name": "sessionid", "type": ["null","string" ]},
                { "name": "client_id", "type": ["null","string" ]}
              ]
            }
          """
          # supportedMimeTypes : [avro/binary]
          # projectionSchemaString : "" # optional, avro json schema blurb for getSchema()
          # projectionSchemaFile : /path/to/syslog.avsc
        }
      }
      {
        extractAvroPaths {
          flatten : true
          paths : {
            id : /id
            date_time : "/date_time"
            session_id : /sessionid
            client_id : /client_id
          }
        }
      }
      {
        addValues {
          # add values "text/log" and "text/log2" to the source_type output field
          Channel : [canal]
        }
      }
      {
        logDebug { format : "output record: {}", args : ["@{}"] }
      }
      # load the record into a Solr server or MapReduce Reducer
      {
        loadSolr {
          solrLocator : {
            collection : parquet_test # Name of solr collection
            zkHost : "$IP:2181/solr" # ZooKeeper ensemble
            batchSize : 1000 # batchSize
          }
        }
      }
    ]
  }
]&lt;/PRE&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Everything is going well except for the fact that the date_time field (already in Solr format, and of date type in schema.xml) is converted to Unix epoch format. Any idea why? Thanks in advance.&lt;/P&gt;</description>
      <pubDate>Fri, 16 Sep 2022 09:19:04 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Morphline-ReadAvroParquetFile-timestamp-problem/m-p/23665#M4610</guid>
      <dc:creator>fkrantz</dc:creator>
      <dc:date>2022-09-16T09:19:04Z</dc:date>
    </item>
    <item>
      <title>Re: Morphline ReadAvroParquetFile timestamp problem</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Morphline-ReadAvroParquetFile-timestamp-problem/m-p/23781#M4611</link>
      <description>I resolved this issue.&lt;BR /&gt;There is no need for projectionSchemaString in readAvroParquetFile.&lt;BR /&gt;So after removing it, everything worked.&lt;BR /&gt;&lt;BR /&gt;Cheers.</description>
      <pubDate>Fri, 16 Jan 2015 14:04:28 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Morphline-ReadAvroParquetFile-timestamp-problem/m-p/23781#M4611</guid>
      <dc:creator>fkrantz</dc:creator>
      <dc:date>2015-01-16T14:04:28Z</dc:date>
    </item>
  </channel>
</rss>

