Apache Pig 嵌套示例
我写了下面这个 Pig 脚本。怎样才能把它改写成嵌套(nested)的形式?(标签:apache-pig)
-- Count the rows of each category and keep the five categories with the
-- highest counts.
-- The loaded relation is named `data` because `input` is a reserved keyword
-- in Pig Latin and cannot be used as a relation alias.
data = LOAD '/path/to/input/data' USING PigStorage('\t') AS (id:chararray, category:chararray);
grp = GROUP data BY category;
-- One row per category: the group key plus COUNT over that group's bag.
grp_count = FOREACH grp GENERATE group AS category, COUNT(data) AS cnt;
-- Sort on the named count field instead of the positional reference $1.
grp_ordered = ORDER grp_count BY cnt DESC;
top_grp = LIMIT grp_ordered 5;
这很简单——看看 grp_count 这个关系:
-- Same pipeline with the GROUP nested directly inside the FOREACH, so no
-- intermediate `grp` relation is needed.
-- The loaded relation is named `data` because `input` is a reserved keyword
-- in Pig Latin and cannot be used as a relation alias.
data = LOAD '/path/to/input/data' USING PigStorage('\t') AS (id:chararray, category:chararray);
grp_count = FOREACH (GROUP data BY category)
            GENERATE FLATTEN(group) AS category,
                     COUNT(data)    AS cnt;
-- Sort on the named count field instead of the positional reference $1.
grp_ordered = ORDER grp_count BY cnt DESC;
top_grp = LIMIT grp_ordered 5;
如果我正确理解了你的问题,下面是代码:
-- Nested FOREACH variant: inside each category group, sort the rows, keep at
-- most five of them, and count the rows that were kept.
-- NOTE(review): the count emitted per category can therefore never exceed 5;
-- this does not select the five largest categories. Confirm that this is the
-- intended result.
data = LOAD 'data' USING PigStorage() AS (id, category);
grp = GROUP data BY category;
grp_count = FOREACH grp {
    -- `category` is field $1 of `data`, which is also the grouping key.
    sorted_rows = ORDER data BY category DESC;
    first_rows  = LIMIT sorted_rows 5;
    GENERATE FLATTEN(group), COUNT(first_rows.category);
};
DUMP grp_count;