import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.functions._
// Build the SparkSession used by the rest of this script, or reuse one that
// is already active (getOrCreate).
val spark = SparkSession
  .builder()
  .appName("hello-sparklabx")
  // Requests the Delta Lake artifact by Maven coordinate; nothing in the
  // visible part of this script uses Delta itself.
  .config("spark.jars.packages", "io.delta:delta-spark_2.12:3.0.0")
  .getOrCreate()
// Print the version of the Spark runtime backing this session.
println(s"Spark ${spark.version}")

// Load the students CSV into a DataFrame.
//   header      = "true": take column names from the file's first line.
//   inferSchema = "true": let Spark infer column types instead of reading
//                         every column as a string (this makes the numeric
//                         comparison on `gpa` further down meaningful).
val df = spark.read
  .option("header", "true")
  .option("inferSchema", "true")
  .csv("s3a://workspace/public/students.csv")
// Average GPA per department, highest average first.
// Columns are referenced with `col(...)` from org.apache.spark.sql.functions
// (already imported at the top of the file) rather than the `$"..."`
// interpolator, which would additionally require `import spark.implicits._`.
df.groupBy("department")
  .agg(avg(col("gpa")).as("avg_gpa"))
  .orderBy(col("avg_gpa").desc)
  .show()

// Preview at most five rows whose gpa is above 3.5.
df.filter(col("gpa") > 3.5).show(5)