Spark: top 10 most frequent words using reduceByKey
// Print the ten most frequent entries of `cleanedMobyDick`, highest count first.
// NOTE(review): presumably `cleanedMobyDick` is an RDD[String] holding one word
// per element -- it is defined outside this snippet, so confirm against its definition.
cleanedMobyDick
  .filter(word => word.nonEmpty)                // discard empty strings
  .map(word => (word.toLowerCase(), 1))         // case-fold and pair each word with a count of 1
  .reduceByKey((left, right) => left + right)   // add up the counts per distinct word
  // Order the (word, count) pairs by count, descending, and keep the first 10.
  .takeOrdered(10)(Ordering.by[(String, Int), Int](pair => pair._2).reverse)
  .foreach(entry => println(entry))             // one (word, count) tuple per line