第46课 Spark 2.0实战之Dataset:sort、join、joinWith、randomSplit、sample、select、groupBy、agg、col等
people.json
{"name":"Michael", "age":16}
{"name":"Andy", "age":30}
{"name":"Justin", "age":19}
package com.dt.spark200
import org.apache.spark.sql.SparkSession import scala.collection.mutable.ArrayBuffer
object DataSetsops {
case class Person(name:String,age:Long) case class Score(n:String,score:Long) def main(args: Array[String]): Unit = { val spark = SparkSession .builder() .appName("DatasetOps") .master("local") .config("spark.sql.warehouse.dir", "file:///G:/IMFBigDataSpark2016/IMFScalaWorkspace_spark200/Spark200/spark-warehouse") .getOrCreate