-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathexample.js
More file actions
executable file
·88 lines (77 loc) · 2.86 KB
/
example.js
File metadata and controls
executable file
·88 lines (77 loc) · 2.86 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
var es = require('event-stream');
var request = require('request');
var url = require('url');
var varType = require('var-type');
var serialize = require('serialize');
var Logparser = require('logagent-js');
var logParser = new Logparser();
var parseLine = serialize(logParser.parseLine.bind(logParser));
var filterDistinctFactory = require('./filter-distinct');
var filterDistinctOptions = {
preserve: false,
//select properties that are used for determining distinct records
propertyExtractor: function (data) {
return {
query: data.query
};
},
//define sets of dependent properties where it is important to track combinations of value classes
features: {x:['query.osc', 'query.author']},
//similar property sets are treated distinct, if in different groups
groupExtractor: function (data) {
return data.method + data.file;
}
};
var filterDistinct = filterDistinctFactory.create(filterDistinctOptions);
var ins=0;
var outs=0;
function extractData (input) {
if (varType(input, 'Object')) {
return {
method: input.method,
status_code: input.status_code,
path: input.path,
file: input.path && input.path.replace(url.parse(input.path).search,''),
query: input.path && url.parse(input.path, true).query
}
}
}
function filterSkipEmptyLines(line) {
if (line) {
return line
}
}
var dataStream = request("http://redlug.com/logs/access.log")
//request("http://www.hoonlir.com/logs/access.log")
//split stream to break on newlines
.pipe(es.split())
.on('data', function () {ins++;})
.pipe(es.mapSync(filterSkipEmptyLines))
.pipe(es.map(function(line, callback) {
parseLine(line, '', callback)})
)
.pipe(es.mapSync(extractData))
//alternative test dataStream - duplicate data rows
// var dataStream = es.readArray([{"method":"GET","status_code":200,"path":"/logs/access.log","file":"/logs/access.log","query":{}},
// {"method":"GET","status_code":200,"path":"/logs/access.log","file":"/logs/access.log","query":{}}]);
dataStream.pipe(es.map(
function (data, callback) {
filterDistinct(data)
.then(function (distinct) {
if (distinct) {
// data is distinct, keep
callback(null, data);
return;
}
//not distinct, skip
callback();
})
.catch(callback);
}))
.pipe(es.stringify())
.on('data', function () {outs++;})
.on('end', function (err) {
console.log('DONE!');
console.log('in:' + ins+' out:' + outs);
})
.pipe(process.stdout)