zoukankan      html  css  js  c++  java
  • Spark SQL SaveMode 方式

    package com.bjsxt.java.spark.sql.loadsave;
    
    import org.apache.spark.SparkConf;
    import org.apache.spark.api.java.JavaSparkContext;
    import org.apache.spark.sql.DataFrame;
    import org.apache.spark.sql.SQLContext;
    import org.apache.spark.sql.SaveMode;
    
    /**
     * Demonstrates Spark SQL save modes.
     *
     * <p>Reads a JSON file into a DataFrame, writes that DataFrame to an output
     * path with {@link SaveMode#Append}, then reads the output back as parquet
     * and prints it. No format is set on the writer, so the default data source
     * format is used; the read-back assumes that default is parquet.
     *
     * <ul>
     *   <li>{@code SaveMode.Overwrite}: replace whatever already exists at the target path.</li>
     *   <li>{@code SaveMode.Append}: add the new rows to the data already at the target path.</li>
     * </ul>
     *
     * @author root
     */
    public class SaveModeTest {
    
    	/** JSON input that is loaded into the DataFrame. */
    	private static final String INPUT_PATH = "hdfs://hadoop1:9000/input/people.json";
    
    	/** Directory the DataFrame is appended to and then read back from. */
    	private static final String OUTPUT_PATH = "hdfs://hadoop1:9000/output/namesAndFavColors_scala";
    
    	/**
    	 * Runs the load / append / read-back round trip on a local Spark master.
    	 *
    	 * @param args unused
    	 */
    	@SuppressWarnings("deprecation")
    	public static void main(String[] args) {
    		SparkConf conf = new SparkConf()
    				.setAppName("SaveModeTest")
    				.setMaster("local");
    		JavaSparkContext sc = new JavaSparkContext(conf);
    		try {
    			SQLContext sqlContext = new SQLContext(sc);
    
    			DataFrame peopleDF = sqlContext.read().json(INPUT_PATH);
    
    			// Append keeps existing output, so every run adds the input rows again.
    			peopleDF.write().mode(SaveMode.Append).save(OUTPUT_PATH);
    
    			sqlContext.read().parquet(OUTPUT_PATH).show();
    		} finally {
    			// Always release the Spark context, even when a read or write fails.
    			sc.stop();
    		}
    	}
    }
    

  • 相关阅读:
    XML约束之DTD
    XML基础
    向方法传递多个参数
    从方法里返回值
    给方法传值
    对象状态和行为
    对象类型数组
    数组
    避开关键字
    primitive数据类型
  • 原文地址:https://www.cnblogs.com/TendToBigData/p/10501294.html
Copyright © 2011-2022 走看看