文章目录
- 1.From Memory
- 2.From File
- 3.From File
1.From Memory
/**
 * Demonstrates creating RDDs from an in-memory collection.
 *
 * Starts a SparkContext with master "local", turns the same four-element
 * sequence into an RDD once via `parallelize` and once via `makeRDD`, and
 * prints the collected elements of both.
 */
object RDDTest01 {
  def main(args: Array[String]): Unit = {
    val sparkConf = new SparkConf().setAppName("rdd").setMaster("local")
    val sc = new SparkContext(sparkConf)
    try {
      val rdd1 = sc.parallelize(Seq(1, 2, 3, 4))
      val rdd2 = sc.makeRDD(Seq(1, 2, 3, 4))
      rdd2.collect().foreach(println)
      // println rather than print, so each element is on its own line like rdd2 above.
      rdd1.collect().foreach(println)
    } finally {
      // Stop the context even when one of the jobs above throws.
      sc.stop()
    }
  }
}
这里的 makeRDD 和 parallelize 没有区别:makeRDD 底层调用的就是 parallelize 函数。
2.From File
/**
 * Demonstrates creating an RDD from a text file.
 *
 * Reads the file with `textFile` and prints every collected element.
 *
 * Usage: the first command-line argument, when present, is used as the input
 * path; otherwise the original sample path is used.
 */
object RDDTest02 {
  def main(args: Array[String]): Unit = {
    // Fall back to the original sample file when no path is supplied.
    val inputPath = args.headOption
      .getOrElse("E:\\atguigu05\\spark\\spark-core\\src\\main\\resources\\1.txt")

    val sparkConf = new SparkConf().setAppName("rdd").setMaster("local")
    val sc = new SparkContext(sparkConf)
    try {
      val value1 = sc.textFile(inputPath)
      value1.collect().foreach(println)
    } finally {
      // Stop the context even when reading or collecting fails (e.g. missing file).
      sc.stop()
    }
  }
}
3.From File
/**
 * Demonstrates reading a directory with `textFile` and with `wholeTextFiles`.
 *
 * Both results are collected and printed so their element shapes can be
 * compared side by side.
 *
 * Usage: the first command-line argument, when present, is used as the input
 * directory; otherwise "data" is used.
 */
object RDDTest03 {
  def main(args: Array[String]): Unit = {
    val inputDir = args.headOption.getOrElse("data")

    val sparkConf = new SparkConf().setAppName("rdd").setMaster("local")
    val sc = new SparkContext(sparkConf)
    try {
      // The path may be a directory, not just a single file.
      sc.textFile(inputDir).collect().foreach(println)
      // NOTE(review): per the Spark API docs, wholeTextFiles yields (path, content) pairs — confirm.
      sc.wholeTextFiles(inputDir).collect().foreach(println)
    } finally {
      // Stop the context even when one of the reads above throws.
      sc.stop()
    }
  }
}
第二个方法 wholeTextFiles 返回的是 (文件完整路径, 文件内容) 形式的键值对,而 textFile 只按行返回文件内容。