SalesData Map Reduce

This document contains code for a MapReduce job in Java that analyzes sales data by country. It creates an input directory in HDFS, copies a CSV file to that directory, and runs a MapReduce job on the data. The Mapper class splits each line on commas and emits the country field as the key and the value "1". The Reducer class sums the values for each key to get a total count of sales by country.
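As an illustration of that flow (the record values below are hypothetical; only the comma-separated field positions matter, with the country in the eighth field):

input record:  1/2/09 6:17,Product1,1200,Mastercard,Jane,Basildon,England,United Kingdom,...
mapper emits:  (United Kingdom, 1)
reducer emits: (United Kingdom, total number of sales records for United Kingdom)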


C:\hadoop-2.8.0\sbin>hadoop fs -mkdir /input_dir_sales

C:\hadoop-2.8.0\sbin>cd ..

C:\hadoop-2.8.0>hadoop fs -put c:/SalesJan2009.csv /input_dir_sales

C:\hadoop-2.8.0>hadoop jar C:/hadoop-2.8.0/SalesMapReduce.jar SalesData.SalesCountryDriver /input_dir_sales/SalesJan2009.csv /output_dir_sales
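Once the job completes, the output directory can be listed and the result read back from HDFS. This is a minimal sketch: it assumes the single reduce task wrote its result to the default part-00000 file inside /output_dir_sales. Each output line holds a country name and its sales count separated by a tab (the TextOutputFormat default).

C:\hadoop-2.8.0>hadoop fs -ls /output_dir_sales

C:\hadoop-2.8.0>hadoop fs -cat /output_dir_sales/part-00000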

package SalesData;

import java.io.IOException;
import java.util.Iterator;

import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapred.*;

public class SalesCountryDriver {

    public static void main(String[] args) {
        JobClient my_client = new JobClient();

        // Create a configuration object for the job
        JobConf job_conf = new JobConf(SalesCountryDriver.class);

        // Set a name for the job
        job_conf.setJobName("SalePerCountry");

        // Specify the data types of the output key and value
        job_conf.setOutputKeyClass(Text.class);
        job_conf.setOutputValueClass(IntWritable.class);

        // Specify the Mapper and Reducer classes
        job_conf.setMapperClass(SalesMapper.class);
        job_conf.setReducerClass(SalesCountryReducer.class);

        // Specify the input and output formats
        job_conf.setInputFormat(TextInputFormat.class);
        job_conf.setOutputFormat(TextOutputFormat.class);

        // Set input and output directories from the command-line arguments:
        // args[0] = name of the input directory on HDFS,
        // args[1] = name of the output directory to be created for the result file.
        FileInputFormat.setInputPaths(job_conf, new Path(args[0]));
        FileOutputFormat.setOutputPath(job_conf, new Path(args[1]));

        my_client.setConf(job_conf);
        try {
            // Run the job
            JobClient.runJob(job_conf);
        } catch (Exception e) {
            e.printStackTrace();
        }
    }
}

class SalesMapper extends MapReduceBase
        implements Mapper<LongWritable, Text, Text, IntWritable> {

    private static final IntWritable one = new IntWritable(1);

    public void map(LongWritable key, Text value,
            OutputCollector<Text, IntWritable> output, Reporter reporter)
            throws IOException {

        // Split the CSV record on commas and emit (country, 1);
        // the country is the eighth field (index 7) of each record.
        String valueString = value.toString();
        String[] singleCountryData = valueString.split(",");
        output.collect(new Text(singleCountryData[7]), one);
    }
}

class SalesCountryReducer extends MapReduceBase
        implements Reducer<Text, IntWritable, Text, IntWritable> {

    public void reduce(Text t_key, Iterator<IntWritable> values,
            OutputCollector<Text, IntWritable> output, Reporter reporter)
            throws IOException {

        Text key = t_key;
        int frequencyForCountry = 0;

        // Sum the counts emitted by the mapper for this country
        while (values.hasNext()) {
            IntWritable value = values.next();
            frequencyForCountry += value.get();
        }
        output.collect(key, new IntWritable(frequencyForCountry));
    }
}
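For reference, a minimal sketch of how the SalesMapReduce.jar used in the commands above could be compiled and packaged on Windows. The classpath and source layout are assumptions: all three classes are taken to live in SalesData\SalesCountryDriver.java, and the Hadoop jars are taken from the standard share\hadoop folders of the 2.8.0 distribution (running "hadoop classpath" prints the exact jar list for a given installation).

C:\hadoop-2.8.0>mkdir classes

C:\hadoop-2.8.0>javac -classpath "share\hadoop\common\*;share\hadoop\common\lib\*;share\hadoop\mapreduce\*" -d classes SalesData\SalesCountryDriver.java

C:\hadoop-2.8.0>jar -cvf SalesMapReduce.jar -C classes .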
