SparkによるMySQLの読み書き

3352 ワード

1. SparkでMySQLのデータを読み込む
         1. spark.read.jdbc()
  /**
    * Reads the MySQL table `test01` with `spark.read.jdbc`, keeps the `id`
    * column of the rows where `id >= 3`, and prints the result to stdout.
    *
    * @param args command-line arguments (unused)
    */
  def main(args: Array[String]): Unit = {
    val spark = SparkSession.builder().appName("sparksql").master("local").getOrCreate()

    try {
      // JDBC credentials. NOTE(review): hard-coded for the demo; load them from
      // configuration or the environment in real code.
      val prop = new Properties()
      prop.setProperty("user", "root")
      prop.setProperty("password", "863863")

      val url = "jdbc:mysql://localhost:3306/test?useUnicode=true&characterEncoding=UTF-8&serverTimezone=UTC"

      // show() returns Unit, so the result is deliberately not bound to a name.
      spark.read
        .jdbc(url, "test01", prop)
        .select("id")
        .where("id >= 3")
        .show()
    } finally {
      // Stop the session even when the JDBC read fails.
      spark.stop()
    }
  }

         2. spark.read.format().option().load()
/**
  * Reads the MySQL table `test01` through the generic
  * `spark.read.format("jdbc").option(...).load()` API, registers it as the
  * temporary view `tmptable`, and prints the rows with `id >= 3` using Spark SQL.
  */
object SparkReadMysql {

  /**
    * Program entry point.
    *
    * @param args command-line arguments (unused)
    */
  def main(args: Array[String]): Unit = {
    val spark = SparkSession.builder()
      .appName("sparksql")
      .master("local")
      .getOrCreate()

    try {
      // URL parameters (MySQL Connector/J):
      //   useUnicode=true&characterEncoding=UTF-8 -> use UTF-8 for the connection
      //   serverTimezone=UTC                      -> treat the server time zone as UTC
      // NOTE(review): credentials are hard-coded for the demo.
      val dataDF = spark.read.format("jdbc")
        .option("url", "jdbc:mysql://localhost:3306/test?useUnicode=true&characterEncoding=UTF-8&serverTimezone=UTC")
        .option("dbtable", "test01")
        .option("user", "root")
        .option("password", "863863")
        .load()

      // Expose the DataFrame to Spark SQL under a session-scoped view name.
      dataDF.createOrReplaceTempView("tmptable")

      spark.sql("select * from tmptable where id >= 3").show()
    } finally {
      // Stop the session even when loading or querying fails.
      spark.stop()
    }
  }
}

 
2. SparkでMySQLにデータを書き込む
         dataFrame.write.mode().jdbc()
         1. クエリ結果の書き込み
  /**
    * Reads the rows of MySQL table `test01` where `id >= 3` and appends them
    * to table `test02` over JDBC.
    *
    * @param args command-line arguments (unused)
    */
  def main(args: Array[String]): Unit = {
    val spark = SparkSession.builder().appName("sparksql").master("local").getOrCreate()

    try {
      // JDBC credentials. NOTE(review): hard-coded for the demo; load them from
      // configuration or the environment in real code.
      val prop = new Properties()
      prop.setProperty("user", "root")
      prop.setProperty("password", "863863")

      val url = "jdbc:mysql://localhost:3306/test?useUnicode=true&characterEncoding=UTF-8&serverTimezone=UTC"

      val filtered = spark.read.jdbc(url, "test01", prop).where("id >= 3")

      // Append adds the rows to test02 and keeps whatever the table already holds.
      filtered.write.mode(SaveMode.Append).jdbc(url, "test02", prop)
    } finally {
      // Stop the session even when the read or the write fails.
      spark.stop()
    }
  }

         2. DataFrameを構築してから書き込み
  /**
    * Builds a DataFrame from a text file and writes it to MySQL table `test02`.
    *
    * Each line of `d://data/word.txt` is split on commas, the distinct tokens
    * are paired with an index, and the resulting `(id, user)` rows are written
    * with `SaveMode.Overwrite`.
    *
    * @param args command-line arguments (unused)
    */
  def main(args: Array[String]): Unit = {
    val spark = SparkSession.builder()
      .appName("test")
      .master("local")
      .getOrCreate()

    try {
      // JDBC credentials. NOTE(review): hard-coded for the demo; load them from
      // configuration or the environment in real code.
      val prop = new Properties()
      prop.setProperty("user", "root")
      prop.setProperty("password", "863863")

      val url = "jdbc:mysql://localhost:3306/test?useUnicode=true&characterEncoding=UTF-8&serverTimezone=UTC"

      val lines = spark.sparkContext.textFile("d://data/word.txt")

      // zipWithIndex yields (token, index); the Row puts the index first so it
      // lines up with the (id, user) schema below.
      // NOTE(review): distinct() shuffles, so the index given to a token is
      // presumably not stable across runs - confirm if ids must be reproducible.
      val rows = lines
        .flatMap(_.split(","))
        .distinct()
        .zipWithIndex()
        .map { case (token, index) => Row(index, token) }

      val schema = StructType(
        List(
          StructField("id", LongType, nullable = true),
          StructField("user", StringType, nullable = true)
        )
      )

      val dataFrame = spark.createDataFrame(rows, schema)

      // Overwrite replaces the existing contents of test02.
      dataFrame.write.mode(SaveMode.Overwrite).jdbc(url, "test02", prop)
    } finally {
      // Stop the session even when reading the file or writing to MySQL fails.
      spark.stop()
    }
  }

3. デモ
         1. spark.read.jdbc() 
         2. spark.read.format().option().load()
         3. Sparkのクエリ結果をMySQLへ書き込み
         4. DataFrameを構築してMySQLへ書き込み