Create an RDD
!
// from a text file
JavaRDD lines = sc.textFile("ensemble-des-equipements-sportifs-de-lile-de-france.csv");
// from HDFS
JavaRDD lines = sc.textFile("hdfs://dataset/ensemble-des-equipements-sportifs-de-lile-de-france.csv");
// from S3
JavaRDD lines = sc.textFile("s3n://dataset/ensemble-des-equipements-sportifs-de-lile-de-france.csv");
!
!
// file from Hadoop
sc.hadoopFile(path, inputFormatClass, keyClass, valueClass);
!
// create a distributed dataset
sc.parallelize(data);