in src/main/scala/com/spotify/bdrc/pipeline/CountUsers.scala [63:68]
/**
 * Count the ratings whose `user` field equals "Smith".
 *
 * @param input ratings to scan
 * @return number of ratings that match
 */
def spark(input: RDD[Rating]): Long = {
  val smithRatings = input.filter(rating => rating.user == "Smith")
  // `count` is an action: it triggers the computation and returns only the
  // resulting number of elements to the driver
  smithRatings.count()
}