标签:stdout cli pat 2.7 test oss inpu int 服务器
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
|
import java.io.IOException; import org.apache.hadoop.io.IntWritable; import org.apache.hadoop.io.LongWritable; import org.apache.hadoop.io.Text; import org.apache.hadoop.mapreduce.Mapper; public class WordMapper extends Mapper<LongWritable,Text, Text, IntWritable> { @Override protected void map(LongWritable key, Text value, Mapper<LongWritable, Text, Text, IntWritable>.Context context) throws IOException, InterruptedException { String line = value.toString(); String[] words = line.split( " " ); for (String word : words) { context.write( new Text(word), new IntWritable( 1 )); } } } |
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
|
import java.io.IOException; import org.apache.hadoop.io.IntWritable; import org.apache.hadoop.io.LongWritable; import org.apache.hadoop.io.Text; import org.apache.hadoop.mapreduce.Reducer; public class WordReducer extends Reducer<Text, IntWritable, Text, LongWritable> { @Override protected void reduce(Text key, Iterable<IntWritable> values, Reducer<Text, IntWritable, Text, LongWritable>.Context context) throws IOException, InterruptedException { long count = 0 ; for (IntWritable v : values) { count += v.get(); } context.write(key, new LongWritable(count)); } } |
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
|
import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.fs.Path; import org.apache.hadoop.io.IntWritable; import org.apache.hadoop.io.LongWritable; import org.apache.hadoop.io.Text; import org.apache.hadoop.mapreduce.Job; import org.apache.hadoop.mapreduce.lib.input.FileInputFormat; import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat; public class Test { public static void main(String[] args) throws Exception { Configuration conf = new Configuration(); Job job = Job.getInstance(conf); job.setMapperClass(WordMapper. class ); job.setReducerClass(WordReducer. class ); job.setMapOutputKeyClass(Text. class ); job.setMapOutputValueClass(IntWritable. class ); job.setOutputKeyClass(Text. class ); job.setOutputValueClass(LongWritable. class ); FileInputFormat.setInputPaths(job, "c:/bigdata/hadoop/test/test.txt" ); FileOutputFormat.setOutputPath(job, new Path( "c:/bigdata/hadoop/test/out/" )); job.waitForCompletion( true ); } } |
1
2
3
|
|
1
2
3
4
5
6
7
|
// Extra settings for submitting the job to a remote cluster instead of running locally.
// They are applied to the Configuration object named conf.

// Jar that contains the job classes, given as a path relative to the working directory.
conf.set("mapreduce.job.jar", "target/wc.jar");

// Run the job on YARN.
conf.set("mapreduce.framework.name", "yarn");

// Host name of the YARN ResourceManager.
conf.set("yarn.resourcemanager.hostname", "master");

// Turn on cross-platform submission (presumably because the client OS differs
// from the cluster OS; confirm for your setup).
conf.set("mapreduce.app-submission.cross-platform", "true");
1
2
3
|
// Directory the job reads its input from.
FileInputFormat.setInputPaths(job, "/wcinput/");

// Directory the job writes its results to.
// NOTE: FileOutputFormat normally rejects an output directory that already
// exists, so use a fresh directory for every run.
FileOutputFormat.setOutputPath(job, new Path("/wcoutput3/"));
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
|
<!--
  Maven build for the word-count example.
  Element and attribute names are case-sensitive: Maven requires modelVersion,
  groupId, artifactId, xsi:schemaLocation and project.build.sourceEncoding.
-->
<project xmlns="http://maven.apache.org/POM/4.0.0"
         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
  <modelVersion>4.0.0</modelVersion>

  <groupId>mashibing.com</groupId>
  <artifactId>maven</artifactId>
  <version>0.0.1-SNAPSHOT</version>
  <name>wc</name>
  <description>hello mp</description>

  <properties>
    <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
    <!-- Single place to change the Hadoop version used by all Hadoop artifacts below. -->
    <hadoop.version>2.7.3</hadoop.version>
  </properties>

  <dependencies>
    <dependency>
      <groupId>junit</groupId>
      <artifactId>junit</artifactId>
      <version>4.12</version>
    </dependency>
    <dependency>
      <groupId>org.apache.hadoop</groupId>
      <artifactId>hadoop-client</artifactId>
      <version>${hadoop.version}</version>
    </dependency>
    <dependency>
      <groupId>org.apache.hadoop</groupId>
      <artifactId>hadoop-common</artifactId>
      <version>${hadoop.version}</version>
    </dependency>
    <dependency>
      <groupId>org.apache.hadoop</groupId>
      <artifactId>hadoop-hdfs</artifactId>
      <version>${hadoop.version}</version>
    </dependency>
  </dependencies>
</project>
1
2
3
4
5
6
|
# Root logger: level INFO, output sent to the appender named "stdout".
log4j.rootCategory=INFO, stdout

# "stdout" appender writes to the console.
log4j.appender.stdout=org.apache.log4j.ConsoleAppender

# Format each event with a pattern layout:
# [QC] level [thread] class.method(line) | message, followed by a newline.
log4j.appender.stdout.layout=org.apache.log4j.PatternLayout
log4j.appender.stdout.layout.ConversionPattern=[QC] %p [%t] %C.%M(%L) | %m%n
标签:stdout cli pat 2.7 test oss inpu int 服务器
原文地址:http://www.cnblogs.com/Jxiaobai/p/6649827.html