Spark SQL 读取 Oracle 一张表的数据
<!-- Oracle JDBC driver artifact; supplies the driver class passed to the Spark JDBC reader's "driver" option. -->
<dependency>
<groupId>com.oracle</groupId>
<artifactId>ojdbc14</artifactId>
<version>10.2.0.4.0</version>
</dependency>
记得在项目中添加 Oracle 的 JDBC 驱动依赖（见上面的 Maven 配置）。
import org.apache.spark.SparkConf
import org.apache.spark.sql.{DataFrame, SparkSession}
/**
 * Example entry point that reads one Oracle table through Spark SQL's JDBC
 * data source and prints its leading rows to standard output.
 */
object Conn_Oracle {

  /**
   * Builds a local SparkSession, loads the configured Oracle table as a
   * DataFrame, shows it, and always stops the session afterwards.
   *
   * @param args command-line arguments (not used)
   */
  def main(args: Array[String]): Unit = {
    // Spark configuration: local master, Kryo serializer, app name taken from this object's class.
    val conf = new SparkConf()
      .setMaster("local[*]")
      .set("spark.serializer", "org.apache.spark.serializer.KryoSerializer")
      .setAppName(this.getClass.getName)

    // Obtain (or reuse) the SparkSession for this configuration.
    val session = SparkSession
      .builder()
      .config(conf)
      .getOrCreate()

    try {
      // -------------------------------- Connect to the Oracle database --------------------------------
      // NOTE(review): "user" / "username" / "table" look like placeholder values;
      // replace them with real credentials and the actual table name before running.
      val reader = session.read.format("jdbc")
        .option("url", "jdbc:oracle:thin:@10.10.1.253:1521:bidwdev")
        .option("driver", "oracle.jdbc.driver.OracleDriver")
        .option("user", "user")
        .option("password", "username")
        .option("dbtable", "table")

      val jdbcDf: DataFrame = reader.load()
      jdbcDf.show()
    } finally {
      // Release the session (and its underlying SparkContext) even if the JDBC read fails.
      session.stop()
    }
  }
}
