Hadoop 统计文件中单词出现的次数

版权声明:本文为博主原创文章,未经博主允许不得转载。 https://blog.csdn.net/phone13144830339/article/details/78990896

pom.xml

<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
  <modelVersion>4.0.0</modelVersion>
  <groupId>cn.et</groupId>
  <artifactId>MavenProject</artifactId>
  <version>0.0.1-SNAPSHOT</version>
  <packaging>war</packaging>
  <!-- 添加项目jdk编译插件 -->
  <build>
     <plugins>
	   <plugin>
	     <groupId>org.apache.maven.plugins</groupId>
	  	 <artifactId>maven-compiler-plugin</artifactId>
	  	 <configuration>
	  	   <source>1.7</source>
	  	   <target>1.7</target>
	  	   <encoding>UTF-8</encoding>
	  	 </configuration>
	   </plugin>
     </plugins>
  </build>
</project>
web.xml

<?xml version="1.0" encoding="UTF-8"?>
<web-app xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="http://java.sun.com/xml/ns/javaee" xsi:schemaLocation="http://java.sun.com/xml/ns/javaee http://java.sun.com/xml/ns/javaee/web-app_2_5.xsd" version="2.5">
  <display-name>MavenProject</display-name>
  <welcome-file-list>
    <welcome-file>index.html</welcome-file>
    <welcome-file>index.htm</welcome-file>
    <welcome-file>index.jsp</welcome-file>
    <welcome-file>default.html</welcome-file>
    <welcome-file>default.htm</welcome-file>
    <welcome-file>default.jsp</welcome-file>
  </welcome-file-list>
</web-app>
########## 我的演示源文件位置

[root@localhost localhost]# cd /mnt/hgfs/VMwareShare/

[root@localhost VMwareShare]# ll

总用量 218756

-rwxrwxrwx. 1 root root   7073612 9月  24 2016 apache-tomcat-6.0.45.tar.gz

-rwxrwxrwx. 1 root root 216929574 1月   6 09:43 hadoop-2.7.5.tar.gz

-rwxrwxrwx. 1 root root       757 1月   5 20:19 pom.xml

-rwxrwxrwx. 1 root root       640 1月   5 20:11 web.xml


########## 把xml文件复制到我的/home/localhost目录中(该目录随后作为wordcount的输入目录)

[root@localhost VMwareShare]# cp /mnt/hgfs/VMwareShare/*.xml /home/localhost/


########## 开始统计

[root@localhost VMwareShare]# hadoop jar /usr/local/hadoop-2.7.5/share/hadoop/mapreduce/hadoop-mapreduce-examples-2.7.5.jar wordcount /home/localhost/ /mnt/hgfs/VMwareShare/result

#注意:/mnt/hgfs/VMwareShare/result 是我指定的统计结果输出目录。该目录不能事先创建(如果输出目录已存在,作业会报错退出),Hadoop 会在运行时自动创建它


##########  查看统计结果

[root@localhost /]# cd /mnt/hgfs/VMwareShare/result

[root@localhost result]# ll

总用量 0

-rwxrwxrwx. 1 root root 1298 1月   6 18:53 part-r-00000

-rwxrwxrwx. 1 root root    0 1月   6 18:53 _SUCCESS

[root@localhost result]# more part-r-00000

--> 1

<!-- 1

</build> 1

</configuration> 1

</plugin> 1

</plugins> 1

</project> 1

</web-app> 1

</welcome-file-list> 1

<?xml 1

<artifactId>MavenProject</artifactId> 1

<artifactId>maven-compiler-plugin</artifactId> 1

<build> 1

<configuration> 1

<display-name>MavenProject</display-name> 1

<encoding>UTF-8</encoding> 1

<groupId>cn.et</groupId> 1

<groupId>org.apache.maven.plugins</groupId> 1

<modelVersion>4.0.0</modelVersion> 1

<packaging>war</packaging> 1

<plugin> 1

<plugins> 1

<project 1

<source>1.7</source> 1

<target>1.7</target> 1

<version>0.0.1-SNAPSHOT</version> 1

<web-app 1

<welcome-file-list> 1

<welcome-file>default.htm</welcome-file> 1

<welcome-file>default.html</welcome-file> 1

<welcome-file>default.jsp</welcome-file> 1

<welcome-file>index.htm</welcome-file> 1

<welcome-file>index.html</welcome-file> 1

<welcome-file>index.jsp</welcome-file> 1

encoding="UTF-8"?> 1

http://java.sun.com/xml/ns/javaee/web-app_2_5.xsd" 1

http://maven.apache.org/xsd/maven-4.0.0.xsd"> 1

version="1.0" 1

version="2.5"> 1

xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 2

xmlns="http://java.sun.com/xml/ns/javaee" 1

xmlns="http://maven.apache.org/POM/4.0.0" 1

xsi:schemaLocation="http://java.sun.com/xml/ns/javaee 1

xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 1

添加项目jdk编译插件 1



猜你喜欢

转载自blog.csdn.net/phone13144830339/article/details/78990896