package mapred;
import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapred.FileInputFormat;
import org.apache.hadoop.mapred.FileOutputFormat;
import org.apache.hadoop.mapred.JobClient;
import org.apache.hadoop.mapred.JobConf;
import org.apache.hadoop.mapred.MapReduceBase;
import org.apache.hadoop.mapred.Mapper;
import org.apache.hadoop.mapred.OutputCollector;
import org.apache.hadoop.mapred.Reducer;
import org.apache.hadoop.mapred.Reporter;
import org.apache.hadoop.mapred.RunningJob;
import org.apache.hadoop.mapred.TextInputFormat;
import org.apache.hadoop.mapred.TextOutputFormat;
//import org.conan.myhadoop.hdfs.HdfsDAO;
public class Step4 {
public static class Step4_PartialMultiplyMapper extends MapReduceBase implements Mapper<LongWritable, Text, IntWritable, Text> {
private final static IntWritable k = new IntWritable();
private final static Text v = new Text();
private final static Map<Integer, List<Cooccurrence>> cooccurrenceMatrix = new HashMap<Integer, List<Cooccurrence>>();
public void map(LongWritable key, Text values, OutputCollector<IntWritable, Text> output, Reporter reporter) throws IOException {
String[] tokens = Recommend.DELIMITER.split(values.toString());
String[] v1 = tokens[0].split(":");
String[] v2 = tokens[1].split(":");
if (v1.length > 1) {// cooccurrence
int itemID1 = Integer.parseInt(v1[0]);
int itemID2 = Integer.parseInt(v1[1]);
int num = Integer.parseInt(tokens[1]);
List<Cooccurrence> list = null;
if (!cooccurrenceMatrix.containsKey(itemID1)) {
list = new ArrayList<Cooccurrence>();
} else {
list = cooccurrenceMatrix.get(itemID1);
}
list.add(new Cooccurrence(itemID1, itemID2, num));
cooccurrenceMatrix.put(itemID1, list);
}
if (v2.length > 1) {// userVector
int itemID = Integer.parseInt(tokens[0]);
int userID = Integer.parseInt(v2[0]);
double pref = Double.parseDouble(v2[1]);
k.set(userID);
for (Cooccurrence co : cooccurrenceMatrix.get(itemID)) {
v.set(co.getItemID2() + "," + pref * co.getNum());
output.collect(k, v);
}
}
}
}
public static class Step4_AggregateAndRecommendReducer extends MapReduceBase implements Reducer<IntWritable, Text, IntWritable, Text> {
private final static Text v = new Text();
public void reduce(IntWritable key, Iterator<Text> values, OutputCollector<IntWritable, Text> output, Reporter reporter) throws IOException {
Map<String, Double> result = new HashMap<String, Double>();
while (values.hasNext()) {
String[] str = values.next().toString().split(",");
if (result.containsKey(str[0])) {
result.put(str[0], result.get(str[0]) + Double.parseDouble(str[1]));
} else {
result.put(str[0], Double.parseDouble(str[1]));
}
}
Iterator<String> iter = result.keySet().iterator();
while (iter.hasNext()) {
String itemID = iter.next();
double score = result.get(itemID);
//String Item=","+;
v.set(itemID + "," + score);
output.collect(key,v);
}
}
}
public static void run(Map<String, String> path) throws IOException {
JobConf conf = Recommend.config();
String input1 = path.get("Step4Input1");
String input2 = path.get("Step4Input2");
String output = path.get("Step4Output");
HdfsDAO hdfs = new HdfsDAO(Recommend.HDFS, conf);
hdfs.rmr(output);
conf.setOutputKeyClass(IntWritable.class);
conf.setOutputValueClass(Text.class);
conf.setMapperClass(Step4_PartialMultiplyMapper.class);
conf.setCombinerClass(Step4_AggregateAndRecommendReducer.class);
conf.setReducerClass(Step4_AggregateAndRecommendReducer.class);
conf.setInputFormat(TextInputFormat.class);
conf.setOutputFormat(TextOutputFormat.class);
FileInputFormat.setInputPaths(conf, new Path(input1), new Path(input2));
FileOutputFormat.setOutputPath(conf, new Path(output));
RunningJob job = JobClient.runJob(conf);
while (!job.isComplete()) {
job.waitForCompletion();
}
}
}
class Cooccurrence {
private int itemID1;
private int itemID2;
private int num;
public Cooccurrence(int itemID1, int itemID2, int num) {
super();
this.itemID1 = itemID1;
this.itemID2 = itemID2;
this.num = num;
}
public int getItemID1() {
return itemID1;
}
public void setItemID1(int itemID1) {
this.itemID1 = itemID1;
}
public int getItemID2() {
return itemID2;
}
public void setItemID2(int itemID2) {
this.itemID2 = itemID2;
}
public int getNum() {
return num;
}
public void setNum(int num) {
this.num = num;
}
}
没有合适的资源?快使用搜索试试~ 我知道了~
资源推荐
资源详情
资源评论
收起资源包目录
基于mapreduce的小型电影推荐系统 (375个子文件)
HdfsDAO.class 5KB
Step4$Step4_PartialMultiplyMapper.class 4KB
InputdataDaoImpl.class 4KB
Step4$Step4_AggregateAndRecommendReducer.class 4KB
UserDaoImpl.class 3KB
Step3$Step31_UserVectorSplitterMapper.class 3KB
Step2$Step2_UserVectorToCooccurrenceMapper.class 3KB
Step3.class 3KB
Step1.class 3KB
Step1$Step1_ToItemPreMapper.class 3KB
Step1$Step1_ToUserVectorReducer.class 3KB
Recommend.class 3KB
Step4.class 3KB
Step2.class 3KB
Step3$Step32_CooccurrenceColumnWrapperMapper.class 3KB
MetadataDaoImpl.class 2KB
Step2$Step2_UserVectorToConoccurrenceReducer.class 2KB
MovieDaoImpl.class 2KB
DBconn.class 2KB
Searchall.class 2KB
UpdateServlet.class 2KB
DengluServlet.class 2KB
DeleteServlet.class 2KB
ZhuceServlet.class 2KB
SelectServlet.class 2KB
EncodingFilter.class 1KB
InputdataServlet.class 1KB
User.class 1KB
Cooccurrence.class 916B
Metadata.class 909B
movie.class 903B
UserDao.class 429B
InputdataDao.class 395B
MapredDaoImpl.class 370B
MetadataDao.class 348B
MovieDao.class 319B
MapredDao.class 129B
.classpath 18KB
org.eclipse.wst.common.component 464B
org.eclipse.wst.jsdt.ui.superType.container 49B
bootstrap.css 138KB
flat-ui.min.css 128KB
bootstrap.min.css 115KB
layui.css 59KB
bootstrap-theme.min.css 19KB
jquery-ui.css 19KB
layer.css 14KB
layui.mobile.css 10KB
laydate.css 7KB
common.css 5KB
commonCopy.css 4KB
login.css 4KB
jquery.nouislider.css 3KB
slide.css 2KB
jquery.nouislider.min.css 1KB
code.css 1KB
Thumbs.db 2.31MB
iconfont.eot 39KB
lato-bold.eot 31KB
lato-regular.eot 30KB
lato-black.eot 30KB
lato-bolditalic.eot 30KB
lato-light.eot 29KB
lato-italic.eot 29KB
glyphicons-halflings-regular.eot 20KB
adminthemes-webfont.eot 6KB
59.gif 10KB
22.gif 10KB
24.gif 8KB
13.gif 7KB
16.gif 7KB
39.gif 6KB
64.gif 6KB
63.gif 6KB
50.gif 6KB
loading-0.gif 6KB
4.gif 6KB
1.gif 5KB
42.gif 5KB
71.gif 5KB
21.gif 5KB
20.gif 5KB
29.gif 5KB
70.gif 4KB
5.gif 4KB
17.gif 4KB
27.gif 4KB
9.gif 4KB
44.gif 4KB
11.gif 4KB
8.gif 4KB
3.gif 4KB
23.gif 4KB
34.gif 4KB
41.gif 4KB
38.gif 4KB
65.gif 3KB
32.gif 3KB
45.gif 3KB
7.gif 3KB
共 375 条
- 1
- 2
- 3
- 4
资源评论
- 轻松鼠2020-05-28请问应该怎么运行呢?我用的eclipse的java,谢谢
- Stephen__Curry302019-06-14感觉很有用,请问是否可以提供一下使用的数据集Souane2019-07-01这是相对应的数据集:https://download.csdn.net/download/qq_41945793/11266871
Souane
- 粉丝: 12
- 资源: 21
上传资源 快速赚钱
- 我的内容管理 展开
- 我的资源 快来上传第一个资源
- 我的收益 登录查看自己的收益
- 我的积分 登录查看自己的积分
- 我的C币 登录后查看C币余额
- 我的收藏
- 我的下载
- 下载帮助
安全验证
文档复制为VIP权益,开通VIP直接复制
信息提交成功