scala> val dfJson = sqlContext.read.format("json").load("/home/hadoop/Desktop/olympic.json")
dfJson: org.apache.spark.sql.DataFrame = [age: bigint, athelete: string ... 8 more fields]
scala> val dfXML = sqlContext.read.format("xml").option("rowTag","book").load("/home/hadoop/Desktop/sample.xml")
dfXML: org.apache.spark.sql.DataFrame = [_id: string, author: string ... 5 more fields]
No comments:
Post a Comment