dgadiraju
8/1/2017 - 11:08 AM

pyspark-create-data-frame.py

# Build the orders DataFrame from the comma-delimited text file at
# inputPath + "/orders". Each line is expected to carry at least four fields:
# order id, order date, customer id and status, in that order.
# NOTE(review): relies on `sc`, `inputPath` and `Row` being in scope (e.g. the
# pyspark shell plus `from pyspark.sql import Row`) — confirm against the
# surrounding script.
ordersDF = (
    sc.textFile(inputPath + "/orders")
    # Split each record once; the original re-split the line for every field.
    .map(lambda rec: rec.split(","))
    .map(
        lambda fields: Row(
            order_id=int(fields[0]),           # ValueError if not an integer
            order_date=fields[1],              # kept as the raw string
            order_customer_id=int(fields[2]),  # ValueError if not an integer
            order_status=fields[3],
        )
    )
    .toDF()
)