zoukankan      html  css  js  c++  java
  • Spark SQL saveMode 方式

    package com.bjsxt.java.spark.sql.loadsave;
    
    import org.apache.spark.SparkConf;
    import org.apache.spark.api.java.JavaSparkContext;
    import org.apache.spark.sql.DataFrame;
    import org.apache.spark.sql.SQLContext;
    import org.apache.spark.sql.SaveMode;
    
    /**
     * Demonstrates Spark SQL save modes.
     *
     * <p>The job loads a JSON file into a {@link DataFrame}, writes it to an
     * output directory using {@link SaveMode#Append}, and then reads that
     * directory back as Parquet and prints it.
     *
     * <p>No explicit format is passed to {@code save(...)}, so the default data
     * source format is used; the result is read back with {@code parquet(...)}.
     * Save modes mentioned by this example:
     * <ul>
     *   <li>{@code SaveMode.Overwrite}: replace whatever already exists at the target path.</li>
     *   <li>{@code SaveMode.Append}: add the new rows to whatever already exists
     *       (the mode used below, so repeated runs accumulate rows).</li>
     * </ul>
     *
     * @author root
     */
    public class SaveModeTest {

    	/** HDFS location of the JSON input file. */
    	private static final String INPUT_PATH = "hdfs://hadoop1:9000/input/people.json";

    	/** HDFS directory the DataFrame is appended to and then read back from. */
    	private static final String OUTPUT_PATH = "hdfs://hadoop1:9000/output/namesAndFavColors_scala";

    	/**
    	 * Runs the load / append / read-back example against a local Spark master.
    	 *
    	 * @param args command-line arguments (unused)
    	 */
    	@SuppressWarnings("deprecation")
    	public static void main(String[] args) {
    		SparkConf conf = new SparkConf()
    				.setAppName("SaveModeTest")
    				.setMaster("local");
    		JavaSparkContext sc = new JavaSparkContext(conf);
    		try {
    			SQLContext sqlContext = new SQLContext(sc);

    			// Load the JSON input into a DataFrame.
    			DataFrame peopleDF = sqlContext.read().json(INPUT_PATH);

    			// Append to the output directory instead of failing or overwriting.
    			peopleDF.write().mode(SaveMode.Append).save(OUTPUT_PATH);

    			// Read the written data back to show what is now stored there.
    			sqlContext.read().parquet(OUTPUT_PATH).show();
    		} finally {
    			// Always release the Spark context, even when a step above throws.
    			sc.stop();
    		}
    	}
    }
    

  • 相关阅读:
    jmeter之正则表达式
    python_appium搭建APP自动化测试环境
    网络编程
    四种单例模式
    Pycharm快捷键
    面向对象
    阶段性总结
    模块之numpy,pandas,matplotlib
    模块之json,pickle,os,sys,logging
    模块之Time,datetime,hashlib,hmac
  • 原文地址:https://www.cnblogs.com/TendToBigData/p/10501294.html
Copyright © 2011-2022 走看看