Slide 12
Slide 12 text
12
val rawData = sc.textFile("/user/srowen/kddcup.data", 120)
rawData: org.apache.spark.rdd.RDD[String] =
MappedRDD[13] at textFile at :15

rawData.count
...
res1: Long = 4898431

rawData.take(1)
...
res3: Array[String] = Array(0,tcp,http,SF,215,45076,
0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,1,0.00,0.00,0.00,0.00,
1.00,0.00,0.00,0,0,0.00,0.00,0.00,0.00,0.00,0.00,0.00,
0.00,normal.)