Spark SQL saveMode 方式

package com.bjsxt.java.spark.sql.loadsave;

import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.sql.DataFrame;
import org.apache.spark.sql.SQLContext;
import org.apache.spark.sql.SaveMode;

/**
 * 读取json或者parquet文件创建一个DataFrame
 * DataFrame存储到某一个路径下,默认存储格式是parquet
 * SaveMode.Overwrite:重写
 * Append:
 * @author root
 *
 */

public class SaveModeTest {

	@SuppressWarnings("deprecation")
	public static void main(String[] args) {
		SparkConf conf = new SparkConf()   
				.setAppName("SaveModeTest")
				.setMaster("local");
		JavaSparkContext sc = new JavaSparkContext(conf);
		SQLContext sqlContext = new SQLContext(sc);
	
		
		DataFrame peopleDF = sqlContext.read().json("hdfs://hadoop1:9000/input/people.json"); 
		
		
		peopleDF.write().mode(SaveMode.Append).save("hdfs://hadoop1:9000/output/namesAndFavColors_scala"); 

		sqlContext.read().parquet("hdfs://hadoop1:9000/output/namesAndFavColors_scala").show();
	}
}

posted @ 2017-01-17 22:37  yuerspring  阅读(1767)  评论(0编辑  收藏  举报