<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Mapreduce doesn't successfully do INSERT / CREATE TABLE from existing table operations. in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388641#M246729</link>
    <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/110701"&gt;@adsejnf&lt;/a&gt;&amp;nbsp;Has the reply helped resolve your issue? If so, please mark the appropriate reply as the solution, as it will make it easier for others to find the answer in the future. Thanks.&lt;/P&gt;</description>
    <pubDate>Fri, 31 May 2024 21:17:46 GMT</pubDate>
    <dc:creator>DianaTorres</dc:creator>
    <dc:date>2024-05-31T21:17:46Z</dc:date>
    <item>
      <title>Mapreduce doesn't successfully do INSERT / CREATE TABLE from existing table operations.</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388117#M246532</link>
      <description>&lt;P&gt;I created the tables below in beeline (Hive), and it worked quickly.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;# Movies table
CREATE EXTERNAL TABLE movies (
  movieId INT,
  title STRING,
  genres STRING
)
ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.OpenCSVSerde'
WITH SERDEPROPERTIES (
  "separatorChar" = ",",
  "quoteChar" = "\"",
  "escapeChar" = "\\"
)
STORED AS TEXTFILE
LOCATION '/user/hive/warehouse/movielens/movies'
TBLPROPERTIES ("skip.header.line.count"="1");

# Ratings table
CREATE EXTERNAL TABLE ratings (
  userId INT,
  movieId INT,
  rating DOUBLE,
  rating_timestamp BIGINT
)
ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.OpenCSVSerde'
WITH SERDEPROPERTIES (
  "separatorChar" = ",",
  "quoteChar" = "\"",
  "escapeChar" = "\\"
)
STORED AS TEXTFILE
LOCATION '/user/hive/warehouse/movielens/ratings'
TBLPROPERTIES ("skip.header.line.count"="1");&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I am attempting:&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;CREATE TABLE avg_movie_ratings AS
SELECT movieId, AVG(rating) AS avg_rating
FROM ratings
GROUP BY movieId;&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;which starts a map-reduce job, which is stuck.&lt;BR /&gt;I have Hadoop and Hive running.&amp;nbsp;&lt;/P&gt;&lt;P&gt;However,&lt;/P&gt;&lt;P&gt;The URL to track the job:&amp;nbsp;&lt;A href="http://anushkahp14:8088/proxy/application_1716189650320_0005/" target="_blank" rel="noopener"&gt;http://anushkahp14:8088/proxy/application_1716189650320_0005/&lt;/A&gt;&amp;nbsp; returns&amp;nbsp;&lt;SPAN&gt;ERR_CONNECTION_REFUSED.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;Please help.&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 20 May 2024 12:35:55 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388117#M246532</guid>
      <dc:creator>adsejnf</dc:creator>
      <dc:date>2024-05-20T12:35:55Z</dc:date>
    </item>
    <item>
      <title>Re: Mapreduce doesn't successfully do INSERT / CREATE TABLE from existing table operations.</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388120#M246535</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/110701"&gt;@adsejnf&lt;/a&gt;, Welcome to Cloudera community!&lt;/P&gt;&lt;P&gt;Do you see any issues in the Hive logs?&lt;BR /&gt;&lt;BR /&gt;Or try checking the application logs via CLI:&lt;/P&gt;&lt;PRE&gt;» yarn logs -applicationId &amp;lt;application ID&amp;gt; -appOwner &amp;lt;AppOwner&amp;gt;&lt;/PRE&gt;</description>
      <pubDate>Mon, 20 May 2024 13:53:13 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388120#M246535</guid>
      <dc:creator>tj2007</dc:creator>
      <dc:date>2024-05-20T13:53:13Z</dc:date>
    </item>
    <item>
      <title>Re: Mapreduce doesn't successfully do INSERT / CREATE TABLE from existing table operations.</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388210#M246575</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/99744"&gt;@tj2007&lt;/a&gt;, Thanks!&lt;/P&gt;&lt;P&gt;No logs were recorded,&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;anushkakundu@AnushkaHP14:~$ /opt/hadoop/bin/yarn logs -applicationId application_1716374810626_0001 -appOwner anushkakundu
2024-05-22 16:29:07,059 INFO client.DefaultNoHARMFailoverProxyProvider: Connecting to ResourceManager at /0.0.0.0:8032
Can not find the logs for the application: application_1716374810626_0001 with the appOwner: anushkakundu&lt;/LI-CODE&gt;&lt;P&gt;Kindly check my localhost:8088,&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="adsejnf_0-1716375414545.png" style="width: 400px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/40755i8146B7DD80009654/image-size/medium?v=v2&amp;amp;px=400" role="button" title="adsejnf_0-1716375414545.png" alt="adsejnf_0-1716375414545.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;It says:&amp;nbsp;&lt;/P&gt;&lt;P&gt;Log Aggregation Status:&amp;nbsp;&lt;/P&gt;&lt;TABLE width="115px"&gt;&lt;TBODY&gt;&lt;TR&gt;&lt;TD width="114.631px"&gt;NOT_START&lt;/TD&gt;&lt;/TR&gt;&lt;/TBODY&gt;&lt;/TABLE&gt;&lt;P&gt;could it be an issue?&lt;/P&gt;</description>
      <pubDate>Wed, 22 May 2024 11:05:05 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388210#M246575</guid>
      <dc:creator>adsejnf</dc:creator>
      <dc:date>2024-05-22T11:05:05Z</dc:date>
    </item>
    <item>
      <title>Re: Mapreduce doesn't successfully do INSERT / CREATE TABLE from existing table operations.</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388431#M246664</link>
      <description>&lt;DIV class="flex flex-grow flex-col max-w-full"&gt;&lt;DIV class="min-h-[20px] text-message flex flex-col items-start whitespace-pre-wrap break-words [.text-message+&amp;amp;]:mt-5 juice:w-full juice:items-end overflow-x-auto gap-2"&gt;&lt;DIV class="flex w-full flex-col gap-1 juice:empty:hidden juice:first:pt-[3px]"&gt;&lt;DIV class="markdown prose w-full break-words dark:prose-invert light"&gt;&lt;P&gt;The diagnostics message in YARN RM UI indicates that the application has been added to the scheduler but has not yet been activated. The message provides details about the reason for skipping the ApplicationMaster (AM) assignment. Let's break down the components of the message for a better understanding:&lt;/P&gt;&lt;H3&gt;Diagnostic Message Breakdown&lt;/H3&gt;&lt;OL&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;Application is added to the scheduler and is not yet activated.&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;This indicates that the application is recognized by the scheduler but hasn't started the process of resource allocation and execution.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;Skipping AM assignment as cluster resource is empty.&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;The ApplicationMaster (AM) assignment is skipped because there are no available resources in the cluster to fulfill the request.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;Details:&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Provides additional information about the resource request and limits.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;AM Partition = &amp;lt;DEFAULT_PARTITION&amp;gt;;&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;&lt;STRONG&gt;AM Partition:&lt;/STRONG&gt; The partition in which the AM is supposed to run. 
In this case, it's the &amp;lt;DEFAULT_PARTITION&amp;gt;, which typically means the default resource pool for the cluster.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;AM Resource Request = &amp;lt;memory:2048, vCores:1&amp;gt;;&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;&lt;STRONG&gt;AM Resource Request:&lt;/STRONG&gt; The resources requested for the ApplicationMaster. Here, it requests 2048 MB of memory and 1 core.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;Queue Resource Limit for AM = &amp;lt;memory:0, vCores:0&amp;gt;;&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;&lt;STRONG&gt;Queue Resource Limit for AM:&lt;/STRONG&gt; The maximum resources allocated for ApplicationMasters in the queue. In this case, it shows &amp;lt;memory:0, vCores:0&amp;gt;, indicating that there are no resources currently allocated for AMs in the queue.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;User AM Resource Limit of the queue&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;&lt;STRONG&gt;User AM Resource Limit of the queue:&lt;/STRONG&gt; This part of the message is truncated, but it generally refers to the per-user resource limits within the queue. This would typically indicate the maximum resources a single user's applications can consume within the queue.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;/OL&gt;&lt;H3&gt;Explanation&lt;/H3&gt;&lt;P&gt;The diagnostic message suggests that:&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;&lt;STRONG&gt;Resource Scarcity:&lt;/STRONG&gt; The cluster currently has no available resources to assign to the ApplicationMaster. 
This could be due to the cluster being fully utilized or the specific queue not having sufficient resources allocated or available.&lt;/LI&gt;&lt;LI&gt;&lt;STRONG&gt;Queue Limits:&lt;/STRONG&gt; The specific queue the application belongs to has its AM resource limits set to zero (&amp;lt;memory:0, vCores:0&amp;gt;), which means no resources are allocated for ApplicationMasters in this queue at the moment.&lt;/LI&gt;&lt;LI&gt;&lt;STRONG&gt;Activation Pending:&lt;/STRONG&gt; The application is added to the scheduler, but activation (resource assignment and start) is pending due to the lack of available resources.&lt;/LI&gt;&lt;/UL&gt;&lt;H3&gt;Possible Causes and Solutions&lt;/H3&gt;&lt;OL&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;Cluster Resource Constraints:&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;The cluster might be fully utilized, leaving no available resources for new ApplicationMasters.&lt;/LI&gt;&lt;LI&gt;&lt;STRONG&gt;Solution:&lt;/STRONG&gt; Monitor and manage cluster resources. Consider scaling the cluster or optimizing the current workload.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;Queue Configuration Issues:&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;The queue configuration might have stringent limits or no resources allocated for ApplicationMasters.&lt;/LI&gt;&lt;LI&gt;&lt;STRONG&gt;Solution:&lt;/STRONG&gt; Review and adjust the queue configurations in the capacity-scheduler.xml or equivalent configuration file to ensure there are sufficient resources for AMs.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;User Resource Limits:&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;The user might have reached their resource quota in the queue.&lt;/LI&gt;&lt;LI&gt;&lt;STRONG&gt;Solution:&lt;/STRONG&gt; Check the per-user resource limits and adjust them if necessary to allow more resource allocation.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;/OL&gt;&lt;H3&gt;Steps to Diagnose 
Further&lt;/H3&gt;&lt;OL&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;Check Cluster Resource Utilization:&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Use the ResourceManager web UI or CLI to check the current resource utilization of the cluster.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;Review Queue Configurations:&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Inspect the queue configurations, particularly the settings for ApplicationMaster resource limits.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;Inspect Application Logs:&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Look at the application logs for any additional diagnostics or error messages.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;LI&gt;&lt;P&gt;&lt;STRONG&gt;Consult YARN ResourceManager Logs:&lt;/STRONG&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;The ResourceManager logs can provide more context about why resources are unavailable or why the AM assignment is being skipped.&lt;/LI&gt;&lt;/UL&gt;&lt;/LI&gt;&lt;/OL&gt;&lt;P&gt;By understanding and addressing the issues highlighted in this diagnostic message, you can ensure that your YARN applications get the necessary resources to run effectively.&lt;/P&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;DIV class="mt-1 flex gap-3 empty:hidden juice:-ml-3"&gt;&lt;DIV class="items-center justify-start rounded-xl p-1 flex"&gt;&lt;DIV class="flex items-center"&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;&lt;P&gt;&lt;STRONG&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;/STRONG&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 28 May 2024 10:39:20 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388431#M246664</guid>
      <dc:creator>ggangadharan</dc:creator>
      <dc:date>2024-05-28T10:39:20Z</dc:date>
    </item>
    <item>
      <title>Re: Mapreduce doesn't successfully do INSERT / CREATE TABLE from existing table operations.</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388641#M246729</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/110701"&gt;@adsejnf&lt;/a&gt;&amp;nbsp;Has the reply helped resolve your issue? If so, please mark the appropriate reply as the solution, as it will make it easier for others to find the answer in the future. Thanks.&lt;/P&gt;</description>
      <pubDate>Fri, 31 May 2024 21:17:46 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Mapreduce-doesn-t-successfully-do-INSERT-CREATE-TABLE-from/m-p/388641#M246729</guid>
      <dc:creator>DianaTorres</dc:creator>
      <dc:date>2024-05-31T21:17:46Z</dc:date>
    </item>
  </channel>
</rss>

