示例代码:
from pyspark.sql import SparkSession
# Wildcard import kept as in the original; other parts of the file may rely
# on names it brings in (e.g. DeltaTable).
from delta.tables import *

# Build the Spark session for this job via getOrCreate().
# The builder chain is wrapped in parentheses so it can span several lines;
# a line that starts with "." is a syntax error in Python otherwise.
# NOTE(review): Spark's docs say spark.driver.memory may have no effect when
# set from application code in client mode, because the driver JVM is already
# running — confirm how this job is launched.
spark = (
    SparkSession.builder
    .appName("Delta Lake on AWS Glue")
    .config("spark.executor.memory", "6g")
    .config("spark.driver.memory", "6g")
    .getOrCreate()
)
df = spark.read.format("delta").load("s3://
# Group the rows by "name" and aggregate each group's "age" with "max".
rows_by_name = df.groupBy("name")
df = rows_by_name.agg({"age": "max"})
try:
df.write.format("delta").mode("overwrite").save("s3://