<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: How to convert pdf file into hive table? in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-convert-pdf-file-into-hive-table/m-p/173059#M37608</link>
    <description>&lt;P&gt;How would you go about the install procedure for Apache Tika? Because I have the same situation.&lt;/P&gt;</description>
    <pubDate>Thu, 16 Feb 2017 00:51:16 GMT</pubDate>
    <dc:creator>Matthew_Chang-K</dc:creator>
    <dc:date>2017-02-16T00:51:16Z</dc:date>
    <item>
      <title>How to convert pdf file into hive table?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-convert-pdf-file-into-hive-table/m-p/173057#M37606</link>
      <description>&lt;P&gt;I have pdf file. I have copied the file from local system to hdfs. But i need to convert the pdf file into a hive table. Is there anyway to do in hive? I know we can handle the same in pig. &lt;/P&gt;</description>
      <pubDate>Thu, 11 Aug 2016 20:24:45 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-convert-pdf-file-into-hive-table/m-p/173057#M37606</guid>
      <dc:creator>balavignesh_nag</dc:creator>
      <dc:date>2016-08-11T20:24:45Z</dc:date>
    </item>
    <item>
      <title>Re: How to convert pdf file into hive table?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-convert-pdf-file-into-hive-table/m-p/173058#M37607</link>
      <description>&lt;P&gt;If i understand ur question and i am making a assumption here, you want to store the pdf in hive to perform some analysis on the content inside the pdf file.  The way i have done this is with apache Tika.  The process will extract text file pdf and store in text format file.   Then apply data model to text and store in hive. &lt;/P&gt;</description>
      <pubDate>Thu, 11 Aug 2016 20:52:50 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-convert-pdf-file-into-hive-table/m-p/173058#M37607</guid>
      <dc:creator>sunile_manjee</dc:creator>
      <dc:date>2016-08-11T20:52:50Z</dc:date>
    </item>
    <item>
      <title>Re: How to convert pdf file into hive table?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-convert-pdf-file-into-hive-table/m-p/173059#M37608</link>
      <description>&lt;P&gt;How would you go about the install procedure for Apache Tika? Because I have the same situation.&lt;/P&gt;</description>
      <pubDate>Thu, 16 Feb 2017 00:51:16 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-convert-pdf-file-into-hive-table/m-p/173059#M37608</guid>
      <dc:creator>Matthew_Chang-K</dc:creator>
      <dc:date>2017-02-16T00:51:16Z</dc:date>
    </item>
  </channel>
</rss>

