-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathreviewByBusiness.js
127 lines (117 loc) · 4.23 KB
/
reviewByBusiness.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
// this map reduce mongo shell script combines data from the business, reviews, and tips
// collections to generate a collection by business, each document containing
// location info and a list of pertinent user_id and date for each review and tip.
// Start from a clean slate: drop the output collection if it already exists.
// The mapReduce calls further down all write to reviewByBusiness with the
// "reduce" output action, so documents left over from a previous run would
// otherwise be merged into the new results.
db.reviewByBusiness.drop();
// Map step for the business collection.
// Runs with `this` bound to one business document and emits a single
// (business_id, values) pair, so business_id becomes the _id of the output
// document. `values` carries the location and descriptive fields only.
var mapBusiness = function() {
    var values = {
        // Reshape the location into a GeoJSON Point so geospatial queries can
        // be run against it. GeoJSON requires the member to be named
        // "coordinates" and the position to be ordered [longitude, latitude].
        loc: {
            type: "Point",
            coordinates: [this.longitude, this.latitude]
        },
        street: this.full_address,
        city: this.city,
        state: this.state,
        name: this.name,
        categories: this.categories,
        stars: this.stars
    };
    emit(this.business_id, values);
};
// Map step for the review collection.
// Runs with `this` bound to one review document and emits it under its
// business_id, trimmed down to the reviewer, the review id, the star rating,
// the three vote counters and the review date (converted with ISODate).
var mapReview = function() {
    var doc = this,
        votes = doc.votes;
    emit(doc.business_id, {
        user_id: doc.user_id,
        review_id: doc.review_id,
        rating: doc.stars,
        funny: votes.funny,
        useful: votes.useful,
        cool: votes.cool,
        date: new ISODate(doc.date)
    });
};
// Map step for the tip collection.
// Runs with `this` bound to one tip document and emits it under its
// business_id. Only the author, the tip's own _id (stored as tip_id) and the
// date (converted with ISODate) are kept.
var mapTip = function() {
    var tip = {};
    tip.user_id = this.user_id;
    tip.tip_id = this._id;
    tip.date = new ISODate(this.date);
    emit(this.business_id, tip);
};
// The reduce function shared by all three map-reduce passes.
// Combines, for one business_id, the values emitted by mapBusiness, mapReview
// and mapTip, plus any partial results produced by an earlier reduce call.
//
// k      - the business_id the values were emitted under (not used here).
// values - array whose elements are each one of:
//            * a review (has "review_id")        -> appended to result.reviews
//            * a tip (has "tip_id")              -> appended to result.tips
//            * a business record                 -> its fields are copied to
//                                                   the top level of the result
//            * a partial result of this function -> its "reviews"/"tips" lists
//              are merged and its business fields copied
// Returns one object holding the business fields plus "reviews" and/or "tips"
// arrays (each array is present only if at least one input contributed to it).
var reduce = function(k, values) {
    var result = {},
        hasOwn = Object.prototype.hasOwnProperty,
        // Keys that must NOT be copied to the top level of the result: the
        // per-review / per-tip fields, and the two list fields themselves.
        // The lists are merged explicitly below; copying them as well would
        // replace everything accumulated so far with a single input's list.
        listOnlyFields = {
            "user_id": '',
            "review_id": '',
            "tip_id": '',
            "funny": '',
            "cool": '',
            "useful": '',
            "rating": '',
            "date": '',
            "reviews": '',
            "tips": ''
        };

    // Append every element of `items` to result[listName], creating the list
    // on first use (so an empty incoming list still yields an empty list).
    var appendTo = function(listName, items) {
        if (!hasOwn.call(result, listName)) {
            result[listName] = [];
        }
        items.forEach(function(item) {
            result[listName].push(item);
        });
    };

    values.forEach(function(value) {
        var field;

        // only reviews have "review_id"
        if ("review_id" in value) {
            appendTo("reviews", [value]);
        }
        // only tips have "tip_id"
        if ("tip_id" in value) {
            appendTo("tips", [value]);
        }
        // a "reviews"/"tips" array in the input means this value is the output
        // of a previous reduce; merge its lists into ours element by element
        if ("reviews" in value) {
            appendTo("reviews", value.reviews);
        }
        if ("tips" in value) {
            appendTo("tips", value.tips);
        }

        // carry the business fields (location, name, ...) over to the result
        for (field in value) {
            if (hasOwn.call(value, field) && !hasOwn.call(listOnlyFields, field)) {
                result[field] = value[field];
            }
        }
    });

    return result;
};
// Run the three map-reduce passes, one per source collection, all with the
// same reduce function and all writing to reviewByBusiness. The "reduce"
// output action re-applies the reduce function when a key already exists in
// the output collection, which is how reviews and tips get folded into the
// business document produced by the first pass.
// Input is sorted by business_id (the emit key); the review and tip passes
// additionally sort by date.
db.business.mapReduce(mapBusiness, reduce, {"sort":{"business_id":1}, "out": {"reduce": "reviewByBusiness"}});
db.review.mapReduce(mapReview, reduce, {"sort":{"business_id":1,"date":1}, "out": {"reduce":"reviewByBusiness"}});
db.tip.mapReduce(mapTip, reduce, {"sort":{"business_id":1,"date":1}, "out": {"reduce":"reviewByBusiness"}});
// Reshape the collection to remove the map-reduce wrapper: each output
// document is stored as {_id: <key>, value: <reduced object>}. Replace every
// document with the contents of its `value` so the business fields and the
// reviews/tips lists sit at the top level (matched by, and keeping, the _id).
// NOTE(review): assumes every document still has a `value` field when visited;
// re-running this loop on an already reshaped collection would pass undefined
// as the replacement - confirm this is only ever run once per build.
db.reviewByBusiness.find().forEach(function(item) {
db.reviewByBusiness.update({_id: item._id}, item.value);
});
// Create indexes on the reshaped collection.
// NOTE(review): the business id is used as the emit key (and therefore lives
// in _id); mapBusiness does not copy a business_id field into the value, so
// this first index looks like it covers a field the documents do not have -
// confirm whether it is needed.
db.reviewByBusiness.createIndex({business_id:1})
// Compound index: ascending on state, text index on categories.
db.reviewByBusiness.createIndex({state:1,categories:"text"})