shell:
cat xxx | sort | uniq -c | awk '{print $2,$1}'
spark:
scala> sc.textFile("/home/lzq/test").map((_,1)).reduceByKey(_+_).sortBy(_._1,false).collect
res0: Array[(String, Int)] = Array((zeppelin,2), (world,1), (spark,1), (hello,2), (flink,2))
flink:
senv.socketTextStream("localhost",888).map((_,1)).keyBy(0).sum(1)