dgadiraju
6/3/2017 - 2:37 PM

spark-scala-cardcountbysuit.scala

// Make sure the output directory does not already exist before running this script.
// If it does, remove it first:
// hadoop fs -rm -R /user/dgadiraju/cardcountbysuit
val inputPath = "/public/cards/largedeck.txt"
val outputPath = "/user/dgadiraju/cardcountbysuit"

// Pair the second pipe-delimited field of every input line (the suit, going
// by the script name) with an initial count of 1.
val suitOnes = sc.textFile(inputPath).map { line =>
  val fields = line.split("\\|")
  (fields(1), 1)
}

// Sum the 1s per key and write the resulting (key, total) pairs out as text.
suitOnes.reduceByKey(_ + _).saveAsTextFile(outputPath)