#Check out our lab for practice: https://labs.itversity.com
#Get Daily Revenue per product using join - Execution Life Cycle
# Load the products file from the local file system of the driver.
# The context manager guarantees the file handle is closed once the lines
# have been read (the original bare open().read() left it open).
with open("/data/retail_db/products/part-00000") as productsFile:
    products = productsFile.read().splitlines()

# Distribute the locally-read lines as an RDD so they can be joined below.
productsRDD = sc.parallelize(products)

# Build (int(field 0), field 2) pairs from each comma-separated line.
# Each line is split only once, then the two needed fields are projected.
# NOTE(review): field 0 is presumably product_id and field 2 product_name -
# confirm against the products schema.
productsMap = productsRDD. \
    map(lambda product: product.split(",")). \
    map(lambda fields: (int(fields[0]), fields[2]))

# Re-key the revenue records by rec[0][1] so they can be joined with
# productsMap; the value keeps (rec[0][0], rec[1]).
# NOTE(review): dailyRevenuePerProductId is defined outside this snippet; its
# records look like ((order_date, product_id), revenue) - confirm upstream.
dailyRevenuePerProductIdMap = dailyRevenuePerProductId. \
    map(lambda rec: (rec[0][1], (rec[0][0], rec[1])))

# Inner join on the shared key: each result is
# (key, ((rec[0][0], rec[1]), products field 2)).
dailyRevenuePerProductJoinProductsMap = dailyRevenuePerProductIdMap. \
    join(productsMap)

# Drop the join key, keeping only the joined value pair.
dailyRevenuePerProductName = dailyRevenuePerProductJoinProductsMap. \
    map(lambda rec: rec[1])

# Preview the first 10 joined records on the driver.
for i in dailyRevenuePerProductName.take(10):
    print(i)
#Raise any issues on https://discuss.itversity.com - make sure to categorize properly