0% found this document useful (0 votes)
4 views5 pages

Bai3

The document is a Java program that implements a MapReduce job to process customer and transaction data, followed by a second job to generate a promotion list based on profession and salary criteria. It consists of multiple mappers and reducers to handle customer information, transaction counts, and filtering based on salary. The program requires specific input files and outputs the results to a specified directory.

Uploaded by

duy nguyen hoang
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as TXT or PDF, or read online on Scribd
0% found this document useful (0 votes)
4 views5 pages

Bai3

The document is a Java program that implements a MapReduce job to process customer and transaction data, followed by a second job to generate a promotion list based on profession and salary criteria. It consists of multiple mappers and reducers to handle customer information, transaction counts, and filtering based on salary. The program requires specific input files and outputs the results to a specified directory.

Uploaded by

duy nguyen hoang
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as TXT or PDF, or read online on Scribd
You are on page 1/ 5

import java.io.IOException;
import java.util.ArrayList;
import java.util.List;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.NullWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.Mapper;
import org.apache.hadoop.mapreduce.Reducer;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
import org.apache.hadoop.mapreduce.lib.input.MultipleInputs;
import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;

public class Bai3 {

// First Job: Process customer and transaction data


public static class CustomerMapper extends Mapper<LongWritable, Text, Text,
Text> {
private Text outKey = new Text();
private Text outValue = new Text();

@Override
public void map(LongWritable key, Text value, Context context) throws
IOException, InterruptedException {
String[] fields = value.toString().split(",");
if (fields.length >= 5) {
String custId = fields[0].trim();
String firstName = fields[1].trim();
String lastName = fields[2].trim();
// Combine fields[4] and beyond for professions with spaces
StringBuilder professionBuilder = new StringBuilder();
for (int i = 4; i < fields.length; i++) {
professionBuilder.append(fields[i].trim()).append(" ");
}
String profession = professionBuilder.toString().trim();
outKey.set(custId);
outValue.set("C:" + firstName + "," + lastName + "," + profession);
context.write(outKey, outValue);
}
}
}

public static class TransactionMapper extends Mapper<LongWritable, Text, Text,


Text> {
private Text outKey = new Text();
private Text outValue = new Text();

@Override
public void map(LongWritable key, Text value, Context context) throws
IOException, InterruptedException {
String[] fields = value.toString().split(",");
if (fields.length >= 3) {
String custId = fields[2].trim();
outKey.set(custId);
outValue.set("T:1");
context.write(outKey, outValue);
}
}
}

public static class CustomerTransactionReducer extends Reducer<Text, Text,


Text, Text> {
private Text outKey = new Text();
private Text outValue = new Text();

@Override
public void reduce(Text key, Iterable<Text> values, Context context) throws
IOException, InterruptedException {
String customerInfo = null;
int transactionCount = 0;

for (Text val : values) {


String[] parts = val.toString().split(":");
if (parts[0].equals("C")) {
customerInfo = parts[1];
} else if (parts[0].equals("T")) {
transactionCount++;
}
}

if (customerInfo != null && transactionCount > 0) {


String[] custParts = customerInfo.split(",");
if (custParts.length == 3) {
String profession = custParts[2];
outKey.set(profession);
outValue.set("CT:" + custParts[0] + "," + custParts[1] + "," +
transactionCount);
context.write(outKey, outValue);
}
}
}
}

// Second Job: Process profession data and join with first job's output
public static class ProfessionMapper extends Mapper<LongWritable, Text, Text,
Text> {
private Text outKey = new Text();
private Text outValue = new Text();

@Override
public void map(LongWritable key, Text value, Context context) throws
IOException, InterruptedException {
String[] fields = value.toString().split(",");
if (fields.length >= 2) {
String profession = fields[0].trim();
String salaryStr = fields[1].trim();
try {
double salary = Double.parseDouble(salaryStr);
if (salary > 70000) {
outKey.set(profession);
outValue.set("S:" + salaryStr);
context.write(outKey, outValue);
}
} catch (NumberFormatException e) {
// Ignore invalid salary entries
}
}
}
}

public static class FirstJobOutputMapper extends Mapper<LongWritable, Text,


Text, Text> {
private Text outKey = new Text();
private Text outValue = new Text();

@Override
public void map(LongWritable key, Text value, Context context) throws
IOException, InterruptedException {
String line = value.toString();
String[] parts = line.split("\t");
if (parts.length == 2) {
outKey.set(parts[0]);
outValue.set(parts[1]);
context.write(outKey, outValue);
}
}
}

public static class FinalReducer extends Reducer<Text, Text, NullWritable,


Text> {
private Text result = new Text();

@Override
public void reduce(Text key, Iterable<Text> values, Context context) throws
IOException, InterruptedException {
String salary = null;
List<String> customers = new ArrayList<>();

for (Text val : values) {


String[] parts = val.toString().split(":");
if (parts[0].equals("S")) {
salary = parts[1];
} else if (parts[0].equals("CT")) {
customers.add(parts[1]);
}
}

if (salary != null) {
try {
double sal = Double.parseDouble(salary);
if (sal > 70000) {
for (String cust : customers) {
String[] custParts = cust.split(",");
if (custParts.length == 3) {
String firstName = custParts[0];
String lastName = custParts[1];
int transCount = Integer.parseInt(custParts[2]);
if (transCount < 12) {
String name = firstName + " " + lastName;
String output = String.format("%-20s%-20d%-20s
%-20s", name, transCount, key.toString(), salary);
result.set(output);
context.write(NullWritable.get(), result);
}
}
}
}
} catch (NumberFormatException e) {
// Ignore invalid entries
}
}
}
}

public static void main(String[] args) throws Exception {


if (args.length != 7) {
System.err.println("Usage: Bai3 <cust1> <cust2> <prof1> <prof2>
<trans1> <trans2> <output>");
System.exit(1);
}

Configuration conf = new Configuration();


Job job1 = Job.getInstance(conf, "Customer Transaction Join");
job1.setJarByClass(Bai3.class);

MultipleInputs.addInputPath(job1, new Path(args[0]), TextInputFormat.class,


CustomerMapper.class);
MultipleInputs.addInputPath(job1, new Path(args[1]), TextInputFormat.class,
CustomerMapper.class);
MultipleInputs.addInputPath(job1, new Path(args[4]), TextInputFormat.class,
TransactionMapper.class);
MultipleInputs.addInputPath(job1, new Path(args[5]), TextInputFormat.class,
TransactionMapper.class);

Path tempOutputPath = new Path(args[6] + "_temp");


FileOutputFormat.setOutputPath(job1, tempOutputPath);

job1.setReducerClass(CustomerTransactionReducer.class);
job1.setOutputKeyClass(Text.class);
job1.setOutputValueClass(Text.class);

boolean success = job1.waitForCompletion(true);


if (!success) {
System.exit(1);
}

Configuration conf2 = new Configuration();


Job job2 = Job.getInstance(conf2, "Generate Promotion List");
job2.setJarByClass(Bai3.class);

MultipleInputs.addInputPath(job2, tempOutputPath, TextInputFormat.class,


FirstJobOutputMapper.class);
MultipleInputs.addInputPath(job2, new Path(args[2]), TextInputFormat.class,
ProfessionMapper.class);
MultipleInputs.addInputPath(job2, new Path(args[3]), TextInputFormat.class,
ProfessionMapper.class);

FileOutputFormat.setOutputPath(job2, new Path(args[6]));

job2.setReducerClass(FinalReducer.class);
job2.setOutputKeyClass(Text.class);
job2.setOutputValueClass(Text.class);

System.exit(job2.waitForCompletion(true) ? 0 : 1);
}
}

You might also like