in src/main/scala/com/spotify/bdrc/pipeline/CountDistinctItems.scala [78:82]
/**
 * Approximate the number of distinct items found in a collection of ratings.
 *
 * Each rating is projected to its `item` field, and the resulting RDD is handed to
 * Spark's `countApproxDistinct` with its default arguments, so the result is an
 * estimate rather than an exact count.
 *
 * @param input ratings whose `item` values are to be counted
 * @return the estimated number of distinct `item` values in `input`
 */
def sparkApprox(input: RDD[Rating]): Long = {
  // Keep only the item of each rating; the other fields are irrelevant here.
  val items = input.map(rating => rating.item)
  items.countApproxDistinct()
}