in src/main/scala/com/spotify/bdrc/pipeline/CountDistinctItems.scala [70:75]
/**
 * Counts how many distinct `item` values occur across the given ratings.
 *
 * @param input the ratings to scan; only the `item` field of each element is read
 * @return the number of unique `item` values found in `input`
 */
def spark(input: RDD[Rating]): Long = {
  // Project each rating down to its item so de-duplication works on items alone.
  val items = input.map(rating => rating.item)
  // Drop repeated items, then count what remains.
  val uniqueItems = items.distinct()
  uniqueItems.count()
}