<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Issue when using parquet org.kitesdk.data.DatasetNotFoundException: Descriptor location does not exist in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128234#M31178</link>
    <description>&lt;A rel="user" href="https://community.cloudera.com/users/1926/guptabandhu25.html" nodeid="1926"&gt;@bandhu gupta&lt;/A&gt;&lt;P&gt;Can you please share the complete error along with sqoop command being used?&lt;/P&gt;&lt;P&gt;The issue might be when HIVE_HOME/HCAT_HOME is not set as Sqoop will use HIVE_HOME/HCAT_HOME to find hive libs, which are needed in hive import as Parquet file.&lt;/P&gt;&lt;P&gt;Thanks and Regards,&lt;/P&gt;&lt;P&gt;Sindhu&lt;/P&gt;</description>
    <pubDate>Wed, 08 Jun 2016 20:49:00 GMT</pubDate>
    <dc:creator>ssubhas</dc:creator>
    <dc:date>2016-06-08T20:49:00Z</dc:date>
    <item>
      <title>Issue when using parquet org.kitesdk.data.DatasetNotFoundException: Descriptor location does not exist</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128233#M31177</link>
      <description>&lt;P&gt;I am getting this issue when using sqoop with parquet&lt;/P&gt;</description>
      <pubDate>Wed, 08 Jun 2016 20:11:45 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128233#M31177</guid>
      <dc:creator>ClouderaVMissue</dc:creator>
      <dc:date>2016-06-08T20:11:45Z</dc:date>
    </item>
    <item>
      <title>Re: Issue when using parquet org.kitesdk.data.DatasetNotFoundException: Descriptor location does not exist</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128234#M31178</link>
      <description>&lt;A rel="user" href="https://community.cloudera.com/users/1926/guptabandhu25.html" nodeid="1926"&gt;@bandhu gupta&lt;/A&gt;&lt;P&gt;Can you please share the complete error along with sqoop command being used?&lt;/P&gt;&lt;P&gt;The issue might be when HIVE_HOME/HCAT_HOME is not set as Sqoop will use HIVE_HOME/HCAT_HOME to find hive libs, which are needed in hive import as Parquet file.&lt;/P&gt;&lt;P&gt;Thanks and Regards,&lt;/P&gt;&lt;P&gt;Sindhu&lt;/P&gt;</description>
      <pubDate>Wed, 08 Jun 2016 20:49:00 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128234#M31178</guid>
      <dc:creator>ssubhas</dc:creator>
      <dc:date>2016-06-08T20:49:00Z</dc:date>
    </item>
    <item>
      <title>Re: Issue when using parquet org.kitesdk.data.DatasetNotFoundException: Descriptor location does not exist</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128235#M31179</link>
      <description>&lt;P&gt;sqoop import --connect jdbc:oracle:thin:@XXX:XXXX/YYYY --username YYYYY --password YYYYY --table A.BBBB --hive-import --hive-database default --hive-table test15 --as-parquetfile -m 1&lt;/P&gt;&lt;P&gt;Job job_1465371735536_0055 failed with state FAILED due to: Job commit failed: java.lang.IllegalArgumentException: Wrong FS: ____file:/tmp/default/.temp/job_1465371735536_0055/mr/job_1465371735536_0055/b402d4ba-1a16-46bc-92c6-91fe141070d2.parquet, expected: hdfs://lxapp5524.dc.corp.telstra.com:8020 at org.apache.hadoop.fs.FileSystem.checkPath(FileSystem.java:646)&lt;/P&gt;</description>
      <pubDate>Thu, 09 Jun 2016 17:34:01 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128235#M31179</guid>
      <dc:creator>ClouderaVMissue</dc:creator>
      <dc:date>2016-06-09T17:34:01Z</dc:date>
    </item>
    <item>
      <title>Re: Issue when using parquet org.kitesdk.data.DatasetNotFoundException: Descriptor location does not exist</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128236#M31180</link>
      <description>&lt;P&gt;We are only getting the above error if we are using parquet; otherwise my table gets pulled into hive easily. Please keep in mind that we have installed the HDP without internet, so it's highly possible that we missed something.&lt;/P&gt;</description>
      <pubDate>Thu, 09 Jun 2016 18:04:52 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128236#M31180</guid>
      <dc:creator>ClouderaVMissue</dc:creator>
      <dc:date>2016-06-09T18:04:52Z</dc:date>
    </item>
    <item>
      <title>Re: Issue when using parquet org.kitesdk.data.DatasetNotFoundException: Descriptor location does not exist</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128237#M31181</link>
      <description>&lt;P&gt;We are facing the above error while we were using the below query &lt;/P&gt;&lt;P&gt;sqoop import --connect jdbc:oracle:thin:@XX:1521/DATABASENAME --username USER --password PWD --table SCHEMANAME.TABLENAME --hive-import --hive-table TABLENAME --hive-overwrite --num-mappers 1 --as-parquetfile&lt;/P&gt;&lt;P&gt;It's an issue when we are using Parquet and trying to ingest data in hive only because if we do the ingestion in hdfs with parquet , it gets completed.&lt;/P&gt;</description>
      <pubDate>Fri, 10 Jun 2016 07:41:35 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128237#M31181</guid>
      <dc:creator>ClouderaVMissue</dc:creator>
      <dc:date>2016-06-10T07:41:35Z</dc:date>
    </item>
    <item>
      <title>Re: Issue when using parquet org.kitesdk.data.DatasetNotFoundException: Descriptor location does not exist</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128238#M31182</link>
      <description>&lt;P&gt;I am also getting the same error on hdp 2.4, while doing sqoop hive-import with parquet. Without parquet it is working fine.&lt;/P&gt;&lt;P&gt;16/06/09 21:12:11 INFO mapreduce.Job: Job job_1465467652802_0011 failed with state FAILED due to: Job commit failed: java.lang.IllegalArgumentException: Wrong FS: _______file:/tmp/default/.temp/job_1465467652802_0011/mr/job_1465467652802_0011/dc944213-b925-4e5b-ac2c-736e5fa8610f.parquet, expected: hdfs://lxapp5524.dc.corp.hdp.com:8020
        at org.apache.hadoop.fs.FileSystem.checkPath(FileSystem.java:646)
        at org.apache.hadoop.hdfs.DistributedFileSystem.getPathName(DistributedFileSystem.java:194)
        at org.apache.hadoop.hdfs.DistributedFileSystem.rename(DistributedFileSystem.java:636)
        at org.kitesdk.data.spi.filesystem.FileSystemDataset.merge(FileSystemDataset.java:327)
        at org.kitesdk.data.spi.filesystem.FileSystemDataset.merge(FileSystemDataset.java:56)
        at org.kitesdk.data.mapreduce.DatasetKeyOutputFormat$MergeOutputCommitter.commitJob(DatasetKeyOutputFormat.java:370)
        at org.apache.hadoop.mapreduce.v2.app.commit.CommitterEventHandler$EventProcessor.handleJobCommit(CommitterEventHandler.java:285)
        at org.apache.hadoop.mapreduce.v2.app.commit.CommitterEventHandler$EventProcessor.run(CommitterEventHandler.java:237)
        at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)
        at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)
        at java.lang.Thread.run(Thread.java:745) &lt;/P&gt;</description>
      <pubDate>Fri, 10 Jun 2016 10:57:19 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128238#M31182</guid>
      <dc:creator>Rabin</dc:creator>
      <dc:date>2016-06-10T10:57:19Z</dc:date>
    </item>
    <item>
      <title>Re: Issue when using parquet org.kitesdk.data.DatasetNotFoundException: Descriptor location does not exist</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128239#M31183</link>
      <description>&lt;P&gt;Then I tried changing the dependency version for kite-sdk from 1.0.0 to 1.1.0, and the issue was gone. It worked!!! Issue resolved.&lt;/P&gt;</description>
      <pubDate>Sun, 12 Jun 2016 00:37:41 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128239#M31183</guid>
      <dc:creator>Rabin</dc:creator>
      <dc:date>2016-06-12T00:37:41Z</dc:date>
    </item>
    <item>
      <title>Re: Issue when using parquet org.kitesdk.data.DatasetNotFoundException: Descriptor location does not exist</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128240#M31184</link>
      <description>&lt;P&gt;We were able to resolve it here:&lt;/P&gt;&lt;P&gt;&lt;A href="https://discuss.cloudxlab.com/t/sqoop-import-to-hive-as-parquet-file-is-failing/1089/6" target="_blank"&gt;https://discuss.cloudxlab.com/t/sqoop-import-to-hive-as-parquet-file-is-failing/1089/6&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 12 Apr 2018 14:07:39 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Issue-when-using-parquet-org-kitesdk-data/m-p/128240#M31184</guid>
      <dc:creator>sandeep1</dc:creator>
      <dc:date>2018-04-12T14:07:39Z</dc:date>
    </item>
  </channel>
</rss>

