Example: Reading a CSV File

sparkexamples > c20 > a60
cat z15_csv_file.input
subject,mark
english,80
science,75
math,82
  1. [raj@Rajkumars-MacBook-Pro ~/gitws/.../a60_infer_textfile]$spark-shell --master local[*] --packages com.databricks:spark-csv_2.11:1.2.0
  2. ...
  3. scala> val df = sqlContext.read.
  4. | format("com.databricks.spark.csv").
  5. | option("header", "true").
  6. | option("inferSchema", "true").
  7. | load("file:///Users/.../a60_infer_textfile/z15_csv_file.input");
  8. df: org.apache.spark.sql.DataFrame = [subject: string, mark: int]
  9.  
  10. scala> df.printSchema()
  11. root
  12. |-- subject: string (nullable = true)
  13. |-- mark: integer (nullable = true)
  14.  
  15.  
  16. scala> df.collect()
  17. res1: Array[org.apache.spark.sql.Row] = Array([english,80], [science,75], [math,82])