apache · wojtek-szymanski · Feb 25, 2017 · Feb 25, 2017 · Feb 28, 2017 · Feb 28, 2017
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/csv/CSVInferSchema.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/csv/CSVInferSchema.scala
@@ -20,6 +20,7 @@ package org.apache.spark.sql.execution.datasources.csv
 import java.math.BigDecimal
 
 import scala.util.control.Exception._
+import scala.util.{Failure, Success, Try}
 
 import com.univocity.parsers.csv.CsvParser
 
@@ -40,7 +41,19 @@ private[csv] object CSVInferSchema {
       csv: Dataset[String],
       caseSensitive: Boolean,
       options: CSVOptions): StructType = {
-    val firstLine: String = CSVUtils.filterCommentAndEmpty(csv, options).first()
+    // Read at most one data line. take(1) gives an empty array when no lines remain, so
+    // the empty-input case needs no NoSuchElementException catch; it maps to an empty schema.
+    CSVUtils.filterCommentAndEmpty(csv, options).take(1).headOption match {
+      case Some(firstLine) => infer(csv, caseSensitive, options, firstLine)
+      case None => StructType(Seq())
+    }
+  }
+
+  private def infer(
+      csv: Dataset[String],
+      caseSensitive: Boolean,
+      options: CSVOptions,
+      firstLine: String): StructType = {
     val firstRow = new CsvParser(options.asParserSettings).parseLine(firstLine)
     val header = makeSafeHeader(firstRow, caseSensitive, options)
 

diff --git a/sql/core/src/test/scala/org/apache/spark/sql/execution/datasources/csv/CSVSuite.scala b/sql/core/src/test/scala/org/apache/spark/sql/execution/datasources/csv/CSVSuite.scala
@@ -298,13 +298,21 @@ class CSVSuite extends QueryTest with SharedSQLContext with SQLTestUtils {
   test("test with empty file and known schema") {
     val result = spark.read
       .format("csv")
-      .schema(StructType(List(StructField("column", StringType, false))))
+      .schema(StructType(List(StructField("column", StringType, nullable = false))))
       .load(testFile(emptyFile))
 
-    assert(result.collect.size === 0)
+    assert(result.collect().isEmpty)  // schema is user-supplied; no rows are expected
     assert(result.schema.fieldNames.size === 1)
   }
 
+  test("test with empty file without schema") {
+    // No schema is supplied here; expect zero rows and zero columns in the result.
+    val inferred = spark.read.csv(testFile(emptyFile))
+    val rows = inferred.collect()
+    assert(rows.isEmpty)
+    assert(inferred.schema.fieldNames.isEmpty)
+  }
+
   test("DDL test with empty file") {
     withView("carsTable") {
       spark.sql(