First page Back Continue Last page Image

Spark examples in Python

https://spark.apache.org/examples.html

# Creates a DataFrame based on a table named "people"
# stored in a MySQL database.
#
# NOTE: MySQL Connector/J separates URL properties with "&" (not ";"),
# so the user and password are passed as two distinct properties.
# NOTE(review): `sqlContext` is not defined in this snippet; presumably it
# is supplied by the Spark shell / driver program -- confirm before running.
url = (
    "jdbc:mysql://yourIP:yourPort/test?user=yourUsername&password=yourPassword"
)

# Parentheses (implicit line joining) are used instead of trailing
# backslashes so the chained call survives blank lines or reformatting.
df = (
    sqlContext.read
    .format("jdbc")
    .option("url", url)
    .option("dbtable", "people")
    .load()
)

# Looks at the schema of this DataFrame.
df.printSchema()

# Counts people by age.
countsByAge = df.groupBy("age").count()
countsByAge.show()

# Saves countsByAge to S3 in the JSON format.
countsByAge.write.format("json").save("s3a://...")