Generating new Columns Using Map Reduce (Map Only)
we also offer , online and classroom trainings
we support in POC
author: Bharat (sree ram)
contact : 09640892992
___________________________________________________________________________
input file : emp.txt
_____________________
101,amar,m,20000,hyd
102,amala,f,30000,pune
103,siva,m,40000,hyd
104,sivani,f,50000,hyd
105,hari,m,40000,pune
____________________
output expected:
from the input file , 4th field is salary. I want to generate tax, and netsal fields.
tax to be applied as 10% .
netsal=sal-tax.
101,amar,m,20000,4000,16000,hyd
102,amala,f,30000,6000,24000,pune
103,siva,m,40000,8000,32000,hyd
104,sivani,f,50000,10000,40000,hyd
105,hari,m,40000,8000,32000,pune
package my.map.red;
import java.io.IOException;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
import org.apache.hadoop.util.GenericOptionsParser;
public class GenerateColumns{
public static class Map1 extends Mapper<LongWritable,Text,Text,Text> {
public void map(LongWritable k, Text v, Context con)
throws IOException, InterruptedException{
throws IOException, InterruptedException{
String line=v.toString();
String[] words=line.split(",");
int sal=Integer.parseInt(words[3]);
int tax = sal*10/100;
int netsal = sal - tax;
int sal=Integer.parseInt(words[3]);
int tax = sal*10/100;
int netsal = sal - tax;
String newline=words[0]+","+words[1]+","+words[2]+","+
words[3]+","+tax+","+netsal+","+words[4];
con.write(new Text(newline), new Text());
}
}
public static void main(String[] args) throws Exception {
Configuration c=new Configuration();
String[] files=new GenericOptionsParser(c,args).getRemainingArgs();
Path p1=new Path(files[0]);
Path p2=new Path(files[1]);
Job j = new Job(c,"GeneraterColumns");
j.setJarByClass(GenerateColumns.class);
j.setMapperClass(Map1.class);
j.setNumReduceTasks(0);
j.setOutputKeyClass(Text.class);
j.setOutputValueClass(Text.class);
FileInputFormat.addInputPath(j,p1);
FileOutputFormat.setOutputPath(j, p2);
FileOutputFormat.setOutputPath(j, p2);
System.exit(j.waitForCompletion(true) ? 0:1);
}
}
0 comments: