Canal.js函数式数据处理框架
Canal.js 是一款函数式数据处理框架，提供了大量类似 Spark 的 API。
For more details, see the API 指引 (API guide).
Common Transform
Canal.of([ 4, 0, 3, 5, 2, 4 ])
.filter(function(d)
{
return d > 2;
})
.distinct()
.sortWith()
.map(function(d)
{
return [ d % 2, d ];
})
.collect();
[1, 3] [0, 4] [1, 5]
Attach to Array
Canal.on(Array);
[ 4, 0, 3, 5, 2, 4 ]
.canal()
.filter(function(d)
{
return d > 2;
})
.distinct()
.sortWith()
.map(function(d)
{
return [ d % 2, d ];
})
.collect();
[1, 3] [0, 4] [1, 5]
Group Operation
Canal.of([ 4, 0, 3, 5, 2, 4 ])
.filter(function(d)
{
return d > 2;
})
.distinct()
.sortWith()
.groupBy(function(d)
{
return d % 2;
})
.collect();
[0, [4 ]] [1, [3,5]]
Join Operation
Canal.of([ 4, 0, 3, 5, 2, 4 ])
.filter(function(d)
{
return d > 2;
})
.distinct()
.sortWith()
.groupBy(function(d)
{
return d % 2;
})
.join(Canal.of([ 0, 1, 2 ])
.map(function(d)
{
return [ d, d ];
}))
.collect();
[0, [[4 ], 0]] [1, [[3,5], 1]]
Window Operation
Canal.of([
{"id":"1","grp":"1","rnk":1,"sal":1000.00},
{"id":"2","grp":"1","rnk":1,"sal":1100.00},
{"id":"3","grp":"1","rnk":2,"sal":1200.00},
{"id":"4","grp":"1","rnk":2,"sal":1300.00},
{"id":"5","grp":"1","rnk":3,"sal":1400.00},
{"id":"6","grp":"2","rnk":1,"sal":1500.00},
{"id":"7","grp":"2","rnk":1,"sal":1600.00},
{"id":"8","grp":"2","rnk":2,"sal":1700.00}
]).window(
Canal.wf.sum(d=>d.sal)
.partBy(d=>d.grp)
.orderBy(d=>d.rnk)
.rows().between(-1, 1) // From the previous row to the next row
.as("sum_sal")
).collect();
[
{"id":"1","grp":"1","rnk":1,"sal":1000.00,"sum_sal":2100.00},
{"id":"2","grp":"1","rnk":1,"sal":1100.00,"sum_sal":3300.00},
{"id":"3","grp":"1","rnk":2,"sal":1200.00,"sum_sal":3600.00},
{"id":"4","grp":"1","rnk":2,"sal":1300.00,"sum_sal":3900.00},
{"id":"5","grp":"1","rnk":3,"sal":1400.00,"sum_sal":2700.00},
{"id":"6","grp":"2","rnk":1,"sal":1500.00,"sum_sal":3100.00},
{"id":"7","grp":"2","rnk":1,"sal":1600.00,"sum_sal":4800.00},
{"id":"8","grp":"2","rnk":2,"sal":1700.00,"sum_sal":3300.00}
]
