- Represents a one-to-one dependency between ranges of partitions in the parent and child RDDs.
- SPARK 源码分析技术分享(bilibili视频汇总套装视频): https://www.bilibili.com/video/av37442139/
- github: https://github.com/opensourceteams/spark-scala-maven
- csdn(汇总视频在线看): https://blog.csdn.net/thinktothings/article/details/84726769
- https://youtu.be/_4DeWWPQubc (youtube视频)
- https://www.bilibili.com/video/av37442139/?p=2 (bilibili视频)
- github: https://github.com/opensourceteams/spark-scala-maven
c.txt
a bc
a
a.txt
a b
c a
package com.opensource.bigdata.spark.local.rdd.operation.dependency.narrow.n_02_RangeDependency
import com.opensource.bigdata.spark.local.rdd.operation.base.BaseScalaSparkContext
/**
 * Demo entry point that unions two text-file RDDs and prints the combined
 * lines on the driver.
 *
 * NOTE(review): the enclosing package name (`n_02_RangeDependency`) suggests
 * this example is meant to illustrate the range dependency created by
 * `union`; the dependency type itself is not visible in this file — confirm
 * against Spark's `UnionRDD`.
 */
object Run3 extends BaseScalaSparkContext {

  /**
   * Reads `/opt/data/2/c.txt` and `/opt/data/2/a.txt`, unions them, collects
   * the result and prints one element per line.
   *
   * The context is stopped in a `finally` block so it is released even when
   * reading or collecting fails (e.g. an input file is missing).
   *
   * @param args command-line arguments (unused)
   */
  def main(args: Array[String]): Unit = {
    // `pre()` is inherited from BaseScalaSparkContext; presumably it builds
    // the SparkContext used below — confirm against the base trait.
    val sc = pre()
    try {
      // The second argument (2) is the requested partition count for each
      // input — assumes `sc` is a SparkContext, where it means minPartitions.
      val rdd1 = sc.textFile("/opt/data/2/c.txt", 2)
      val rdd2 = sc.textFile("/opt/data/2/a.txt", 2)

      val rdd3 = rdd1.union(rdd2)

      // collect() pulls every element to the driver; fine for tiny demo files.
      println(rdd3.collect().mkString("\n"))
    } finally {
      // Always stop the context, including on failure, to avoid leaking it.
      sc.stop()
    }
  }
}