Canal.js函数式数据处理框架
Canal.js是一款函数式数据处理框架，提供了大量类似Spark的API。
For more APIs, see the API guide (API 指引).
Common Transform
Canal.of([ 4, 0, 3, 5, 2, 4 ]) .filter(function(d) { return d > 2; }) .distinct() .sortWith() .map(function(d) { return [ d % 2, d ]; }) .collect();
[1, 3] [0, 4] [1, 5]
Attach to Array
Canal.on(Array);
[ 4, 0, 3, 5, 2, 4 ] .canal() .filter(function(d) { return d > 2; }) .distinct() .sortWith() .map(function(d) { return [ d % 2, d ]; }) .collect();
[1, 3] [0, 4] [1, 5]
Group Operation
Canal.of([ 4, 0, 3, 5, 2, 4 ]) .filter(function(d) { return d > 2; }) .distinct() .sortWith() .groupBy(function(d) { return d % 2; }) .collect();
[0, [4 ]] [1, [3,5]]
Join Operation
Canal.of([ 4, 0, 3, 5, 2, 4 ]) .filter(function(d) { return d > 2; }) .distinct() .sortWith() .groupBy(function(d) { return d % 2; }) .join(Canal.of([ 0, 1, 2 ]) .map(function(d) { return [ d, d ]; })) .collect();
[0, [[4 ], 0]] [1, [[3,5], 1]]
Window Operation
Canal.of([ {"id":"1","grp":"1","rnk":1,"sal":1000.00}, {"id":"2","grp":"1","rnk":1,"sal":1100.00}, {"id":"3","grp":"1","rnk":2,"sal":1200.00}, {"id":"4","grp":"1","rnk":2,"sal":1300.00}, {"id":"5","grp":"1","rnk":3,"sal":1400.00}, {"id":"6","grp":"2","rnk":1,"sal":1500.00}, {"id":"7","grp":"2","rnk":1,"sal":1600.00}, {"id":"8","grp":"2","rnk":2,"sal":1700.00} ]).window( Canal.wf.sum(d=>d.sal) .partBy(d=>d.grp) .orderBy(d=>d.rnk) .rows().between(-1, 1) /* from the previous row through the next row */ .as("sum_sal") ).collect();
[ {"id":"1","grp":"1","rnk":1,"sal":1000.00,"sum_sal":2100.00}, {"id":"2","grp":"1","rnk":1,"sal":1100.00,"sum_sal":3300.00}, {"id":"3","grp":"1","rnk":2,"sal":1200.00,"sum_sal":3600.00}, {"id":"4","grp":"1","rnk":2,"sal":1300.00,"sum_sal":3900.00}, {"id":"5","grp":"1","rnk":3,"sal":1400.00,"sum_sal":2700.00}, {"id":"6","grp":"2","rnk":1,"sal":1500.00,"sum_sal":3100.00}, {"id":"7","grp":"2","rnk":1,"sal":1600.00,"sum_sal":4800.00}, {"id":"8","grp":"2","rnk":2,"sal":1700.00,"sum_sal":3300.00} ]
评论