CreateDFFromMysql

A Spark SQL example that loads two MySQL tables as DataFrames in two different ways, joins them with SQL, and writes the join result back to MySQL.

package com.bjsxt.sparksql.dataframe;

import java.util.HashMap;
import java.util.Map;
import java.util.Properties;

import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.sql.DataFrame;
import org.apache.spark.sql.DataFrameReader;
import org.apache.spark.sql.SQLContext;
import org.apache.spark.sql.SaveMode;


public class CreateDFFromMysql {
	public static void main(String[] args) {
		SparkConf conf = new SparkConf();
		conf.setMaster("local").setAppName("mysql");
		/**
		 * Number of partitions used when shuffling data for joins or
		 * aggregations (the default is 200; 1 keeps this local demo small)
		 */
		conf.set("spark.sql.shuffle.partitions", "1");
		
		JavaSparkContext sc = new JavaSparkContext(conf);
		SQLContext sqlContext = new SQLContext(sc);
		/**
		 * First way to read a MySQL table as a DataFrame:
		 * pass all connection settings at once as an options map
		 */
		Map<String, String> options = new HashMap<String,String>();
		options.put("url", "jdbc:mysql://192.168.179.4:3306/spark");
		options.put("driver", "com.mysql.jdbc.Driver");
		options.put("user", "root");
		options.put("password", "123456");
		options.put("dbtable", "person");
		
		DataFrame person = sqlContext.read().format("jdbc").options(options).load();
		person.show();
		person.registerTempTable("person1");
		/**
		 * Second way to read a MySQL table as a DataFrame:
		 * set each option individually on a DataFrameReader
		 */
		DataFrameReader reader = sqlContext.read().format("jdbc");
		reader.option("url", "jdbc:mysql://192.168.179.4:3306/spark");
		reader.option("driver", "com.mysql.jdbc.Driver");
		reader.option("user", "root");
		reader.option("password", "123456");
		reader.option("dbtable", "score");
		DataFrame score = reader.load();
		score.show();
		score.registerTempTable("score1");
		
		DataFrame result = 
				sqlContext.sql("select person1.id,person1.name,person1.age,score1.score "
						+ "from person1,score1 "
						+ "where person1.name = score1.name");
		result.show();
		/**
		 * Save the DataFrame result back to MySQL
		 */
		Properties properties = new Properties();
		properties.setProperty("user", "root");
		properties.setProperty("password", "123456");
		/**
		 * SaveMode:
		 * Overwrite: overwrite the table if it already exists
		 * Append: append to the existing table
		 * ErrorIfExists: throw an error if the table already exists
		 * Ignore: skip the write if the table already exists
		 */
		result.write().mode(SaveMode.Overwrite).jdbc("jdbc:mysql://192.168.179.4:3306/spark", "result", properties);
		System.out.println("----Finish----");
		sc.stop();
	}
}
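
This listing targets the Spark 1.x API (SQLContext, DataFrame, registerTempTable). On Spark 2.x and later the same flow goes through SparkSession and Dataset&lt;Row&gt;; the sketch below is a minimal port, assuming Spark 2.x and the same MySQL instance and credentials as above.

package com.bjsxt.sparksql.dataframe;

import java.util.Properties;

import org.apache.spark.sql.Dataset;
import org.apache.spark.sql.Row;
import org.apache.spark.sql.SaveMode;
import org.apache.spark.sql.SparkSession;

public class CreateDFFromMysqlV2 {
	public static void main(String[] args) {
		SparkSession spark = SparkSession.builder()
				.master("local")
				.appName("mysql")
				.config("spark.sql.shuffle.partitions", "1")
				.getOrCreate();

		String url = "jdbc:mysql://192.168.179.4:3306/spark";
		Properties props = new Properties();
		props.setProperty("user", "root");
		props.setProperty("password", "123456");
		// mysql-connector-java 5.x; the 8.x driver class is "com.mysql.cj.jdbc.Driver"
		props.setProperty("driver", "com.mysql.jdbc.Driver");

		// read().jdbc(url, table, props) is shorthand for format("jdbc") plus options
		Dataset<Row> person = spark.read().jdbc(url, "person", props);
		Dataset<Row> score = spark.read().jdbc(url, "score", props);
		person.createOrReplaceTempView("person1");
		score.createOrReplaceTempView("score1");

		Dataset<Row> result = spark.sql(
				"select person1.id, person1.name, person1.age, score1.score "
				+ "from person1 join score1 on person1.name = score1.name");
		result.show();

		result.write().mode(SaveMode.Overwrite).jdbc(url, "result", props);
		spark.stop();
	}
}

In either version the MySQL JDBC driver (the mysql-connector-java jar) must be on the classpath, otherwise load() fails with a "No suitable driver" or ClassNotFoundException error.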
