reducer 按key聚合

#coding=utf8

import sys
import itertools
import json


reload(sys)
sys.setdefaultencoding("utf8")
 

def get_line():
"""
return key, value
"""
  for line in sys.stdin:
      yield line.strip().split('\t', 1)


for key, lines in itertools.groupby(get_line(), key=lambda x: x[0]):
    #print key, list(lines)
    res = []
    for it in list(lines):
        res.append(it[1])

    print '%s\t%s' % (key, ' '.join(res))

 

posted on 2018-12-04 19:37  TMatrix52  阅读(127)  评论(0)    收藏  举报

导航