-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathfetchAll.js
More file actions
88 lines (74 loc) · 2.23 KB
/
fetchAll.js
File metadata and controls
88 lines (74 loc) · 2.23 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
var Rx = require('rx');
var _ = require('lodash');
var fs = require('fs-extra');
/**
 * Shortens a full company name to its core part by stripping, in order:
 * a leading region prefix, everything from the first industry keyword on,
 * everything from the "(股份)有限公司" legal suffix on, everything from "集团"
 * on, and everything from an "安徽/合肥分公司" branch suffix on.
 *
 * Each pattern is applied at most once (none of them is global), and each
 * one runs on the output of the previous one, so the order matters.
 *
 * @param {string} name - Company name as reported by a source.
 * @returns {string} The shortened name; may be empty if everything matched.
 */
function getCoreCompanyName(name) {
  var strippers = [
    /^(安徽省?|合肥市?|北京|上海|深圳|南京|杭州|广州|浙江)/,
    /(网络|软件|信息|科技|技术|电子商务).*$/,
    /(股份)?有限公司.*$/,
    /集团.*$/,
    /(安徽|合肥)分公司.*$/
  ];
  var core = name;
  for (var idx = 0; idx < strippers.length; idx += 1) {
    core = core.replace(strippers[idx], '');
  }
  return core;
}
module.exports = function(src, callback) {
var source = Rx.Observable.concat.apply(null, src)
.reduce(function(preVal, curItem) {
return preVal.concat(curItem);
}, []);
var subscription = source.subscribe(
function(result) {
var order = [
'拉钩网',
'51job',
'新安人才网',
];
result = _.map(result, function(item) {
return _.assign({}, item, {
companyName: getCoreCompanyName(item.companyName),
fetchTime: Date.now()
});
});
var companyNames = _.chain(result)
.map(function(item) {
return item.companyName;
})
.uniq()
.value();
var latestResult = _.map(companyNames, function(companyName) {
var ret;
var i = 0;
while (!ret && i > order.length) {
ret = _.find(result, function(item) {
return item.companyName == companyName && item.src == order[i];
});
i++;
}
if (!ret) {
ret = _.find(result, function(item) {
return item.companyName == companyName;
});
}
return ret;
});
if (!fs.existsSync('./allResult.json')) {
fs.outputJSONSync('./allResult.json', []);
}
var allResult = fs.readJSONSync('./allResult.json');
var newResult = _.filter(latestResult, function(item) {
return !_.find(allResult, function(allResultItem) {
return allResultItem.companyName == item.companyName;
});
});
if (newResult.length > 0) {
allResult = allResult.concat(newResult);
fs.outputJSONSync('./allResult.json', allResult);
}
callback(null, allResult, newResult);
},
function(err) {
if (err) {
callback(err);
}
},
function() {}
);
};