spark2.2读写操作hive和mysql数据库

2019独角兽企业重金招聘Python工程师标准>>>

sparksession操作hive数据库

1.需要将core-site.xml,hdfs-site.xml,hive-site.xml放入resources中。

2.创建sparksession的时候加入属性

.enableHiveSupport()

3.操作hive数据库

// Query a Hive database through a Hive-enabled SparkSession (`spark`) and
// persist a derived result back into Hive as an ORC table.

// Switch to the target Hive database and preview its tables.
spark.sql("use hisms_sl")
spark.sql("show tables").show(10)

// Load the whole source table into a DataFrame.
val data: DataFrame = spark.sql("select * from sl_data")

// Register the DataFrame as a temp view so later SQL can refer to it by name.
// NOTE(review): the view name equals the Hive table name; presumably the view
// takes precedence in subsequent queries -- confirm this is intended.
data.createOrReplaceTempView("sl_data")

// Column-API query: show `id` and `zfy` for rows whose id is at most 100.
data.select(data("id"), data("zfy")).filter(data("id") <= 100).show()

// Rename columns and concatenate XM and CSRQ into a single field.
val table1: DataFrame = spark.sql("select\n`id` as id,\n`BAH` as akc190,\nconcat(`XM`,`CSRQ`) as aac001 \nfrom sl_data")

// Save the result into Hive as an ORC table.
// The original snippet wrote from an undefined `table2`; `table1` is the only
// derived DataFrame defined here, so it is used instead.
table1.write.format("orc").saveAsTable("sn_20180108")

sparksession读取text文件，存储到mysql数据库

// Read a delimited text file with the CSV data source, reshape it with SQL,
// and append the result to a MySQL table over JDBC.
val text: DataFrame = spark.read
  .format("org.apache.spark.sql.execution.datasources.csv.CSVFileFormat")
  .option("header", true) // treat the first line as the column names
  .option("delimiter", ",") // field delimiter (separator)
  .load("file:///C:\\Users\\91BGJK2\\Desktop\\sl_hive.txt")

// Expose the file contents to SQL under the name `hisms`.
text.createOrReplaceTempView("hisms")

// Rename columns and concatenate XM and CSRQ into a single field.
val table1: DataFrame = spark.sql("select\n`id` as id,\n`BAH` as akc190,\nconcat(`XM`,`CSRQ`) as aac001\nfrom hisms")

// Save to MySQL via JDBC, appending to the existing table.
// Remember to specify the character encoding in the URL; otherwise the data
// written to the database may be garbled.
table1.write
  .mode(SaveMode.Append)
  .format("jdbc")
  .option("url", "jdbc:mysql://10.111.121.111:3306/hisms_sn?useUnicode=true&characterEncoding=UTF-8")
  .option("dbtable", "sn_test2")
  .option("user", "root")
  .option("password", "root")
  .save()

/** Read a MySQL table through the JDBC data source, using a map of connection options. */
val properties = Map(
  "url" -> "jdbc:mysql://10.111.121.111:3306/hisms_sn",
  "driver" -> "com.mysql.jdbc.Driver",
  "user" -> "root",
  "dbtable" -> "t_drg_fz",
  "password" -> "root"
)

// Load the table named by the "dbtable" option into a DataFrame.
val t_drg_fz = spark.read.format("jdbc").options(properties).load()