Maven pom.xml 依赖配置(artifactId 中的 13_2.10 表示该连接器面向 Spark 1.3+、Scala 2.10 构建):

<dependency>
  <groupId>org.elasticsearch</groupId>
  <artifactId>elasticsearch-spark-13_2.10</artifactId>
  <version>6.1.2</version>
</dependency>


code:

import org.apache.spark.{SparkConf, SparkContext}
import org.elasticsearch.spark._

/**
 * Minimal Spark job that reads the Elasticsearch resource `tracy/fulltext`
 * through the elasticsearch-spark connector and prints every returned
 * (document id, document fields) pair to standard output.
 */
object ReadEs {

  /**
   * Builds a local SparkContext pointed at the Elasticsearch node, reads the
   * whole `tracy/fulltext` resource, prints each entry, and always stops the
   * context afterwards.
   *
   * @param args command-line arguments (not used)
   */
  def main(args: Array[String]): Unit = {

    // NOTE(review): presumably required so Hadoop can locate its native
    // helpers when running on Windows — confirm the path on your machine.
    System.setProperty("hadoop.home.dir", "C:\\hadoop-2.6.0-cdh5.11.0")

    // All Spark/ES settings live on the SparkConf itself rather than in
    // JVM-wide system properties, so they apply to this job only.
    val conf = new SparkConf()
      .setAppName("READES")
      .setMaster("local")
      .set("spark.serializer", "org.apache.spark.serializer.KryoSerializer")
      .set("es.nodes", "172.18.10.34")

    val sc = new SparkContext(conf)

    try {
      // Alternative: restrict the read by passing a query as second argument.
      //    val query = """{"query" : { "match" : { "content" : "上海" }}}"""
      //    val query = """{"query" : { "match" : { "_id" : 1 }}}"""
      //    val docs = sc.esRDD("tracy/fulltext", query)
      val docs = sc.esRDD("tracy/fulltext")

      // collect() brings every entry to the driver before printing; each
      // entry is printed as a tuple, exactly as the pair (id, fields).
      docs.collect().foreach { case (id, fields) => println((id, fields)) }
    } finally {
      // Release the context even when the read or the collect fails.
      sc.stop()
    }
  }

}


执行测试:

Spark 读取 ES 数据



相关文章:

  • 2021-11-27
  • 2021-11-27
  • 2022-01-07
  • 2021-11-18
  • 2021-11-27
  • 2021-11-18
  • 2021-08-29
  • 2021-11-18
猜你喜欢
  • 2021-08-14
  • 2021-07-09
  • 2021-11-27
  • 2021-11-27
  • 2022-02-24
  • 2021-12-10
相关资源
相似解决方案