我按照这篇教程(tutorial)在 Hive 中运行了一个 wordcount 查询,并且尝试了 Stack Overflow 上能找到的所有解决方案,但我的作业始终无法完成。
-- Word count: split each row's `text` on single spaces, explode the pieces
-- into one row per word, then count the rows for each distinct word.
-- NOTE(review): the lateral-view alias reuses the table name `doc`;
-- a distinct alias may read more clearly. Confirm this is intentional.
SELECT word, COUNT(*)
FROM doc
LATERAL VIEW explode(split(text, ' ')) doc as word
GROUP BY word;
我的mapred.xml
<?xml version="1.0"?>
<?xml-stylesheet type="text/xsl" href="configuration.xsl"?>
<!--
  MapReduce settings: a job tracker address and the execution framework.
  The description text below is kept flush-left on purpose so that its
  whitespace stays exactly as originally written.
-->
<configuration>

  <!--
    Job tracker endpoint, set to localhost:54311.
    NOTE(review): this looks like an MRv1 setting; with
    mapreduce.framework.name set to yarn (below) it is presumably not
    consulted. Confirm against the Hadoop version in use.
  -->
  <property>
    <name>mapred.job.tracker</name>
    <value>localhost:54311</value>
    <description>The host and port that the MapReduce job tracker runs
at. If "local", then jobs are run in-process as a single map
and reduce task.
</description>
  </property>

  <!-- Execution framework for MapReduce jobs, set to yarn. -->
  <property>
    <name>mapreduce.framework.name</name>
    <value>yarn</value>
  </property>

</configuration>
我的yarn.xml
<?xml version="1.0"?>
<!--
  YARN settings: NodeManager container memory, the scheduler's minimum
  allocation, and two disk health checker thresholds.
-->
<configuration>

  <!--
    Physical memory (MB) that can be allocated for containers: 1100.
    NOTE(review): 1100 MB is lower than the stock MapReduce ApplicationMaster
    request (yarn.app.mapreduce.am.resource.mb, 1536 MB in
    mapred-default.xml). If that default is in effect, the job may wait
    indefinitely for a container, which would match the "job never
    completes" symptom. Confirm against the running cluster.
  -->
  <property>
    <name>yarn.nodemanager.resource.memory-mb</name>
    <value>1100</value>
    <description>Amount of physical memory, in MB, that can be allocated for containers.</description>
  </property>

  <!-- Scheduler minimum allocation (MB): 250. -->
  <property>
    <name>yarn.scheduler.minimum-allocation-mb</name>
    <value>250</value>
  </property>

  <!--
    Disk health checker thresholds: minimum healthy disks 0.0 and maximum
    per-disk utilization 100.0 percent.
    NOTE(review): these values presumably relax the disk health check as
    far as it goes. Confirm that is the intent.
  -->
  <property>
    <name>yarn.nodemanager.disk-health-checker.min-healthy-disks</name>
    <value>0.0</value>
  </property>
  <property>
    <name>yarn.nodemanager.disk-health-checker.max-disk-utilization-per-disk-percentage</name>
    <value>100.0</value>
  </property>

</configuration>