@@ -508,12 +508,20 @@ class MicroBatchExecution(
cd.dataType, cd.timeZoneId)
}
Member:
The root cause is that CurrentBatchTimestamp is a TimeZoneAwareExpression, which is unresolved without a timeZoneId.
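To illustrate: a minimal, self-contained sketch (toy traits, not Catalyst's actual source) of how a time-zone-aware expression only reports itself resolved once a time zone is attached:

    // Toy model of the resolution contract.
    trait Expression {
      def childrenResolved: Boolean = true
      def resolved: Boolean = childrenResolved
    }

    // A time-zone-aware expression additionally needs a concrete time zone.
    trait TimeZoneAware extends Expression {
      def timeZoneId: Option[String]
      override def resolved: Boolean = childrenResolved && timeZoneId.isDefined
    }

    // Stand-in for CurrentBatchTimestamp: unresolved until a zone is supplied.
    case class DemoBatchTimestamp(timeZoneId: Option[String] = None) extends TimeZoneAware

    object ResolutionDemo extends App {
      println(DemoBatchTimestamp().resolved)            // false -> schema access fails
      println(DemoBatchTimestamp(Some("UTC")).resolved) // true once a zone is attached
    }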


// Pre-resolve new attributes to ensure all attributes are resolved before
// accessing the schema of the logical plan. Note that this only leverages the
// information of attributes, so we don't need to be concerned about the values
// of literals.

val newAttrPlanPreResolvedForSchema = newAttributePlan transformAllExpressions {
Contributor Author:
We could even leverage newBatchesPlan and remove this: the point of this effort is to ensure that schema extraction goes through the same transformation path as the actual plan.

Contributor:
I'm fine with this.

Member:
@HeartSaVioR, I prefer to leverage the existing lines (501~509), as you said, like the following. I assume the following is what you mean. Eventually, it's a two-line change (excluding comments). WDYT?

    // Rewire the plan to use the new attributes that were returned by the source.
    val newAttributePlan = newBatchesPlan transformAllExpressions {
      case ct: CurrentTimestamp =>
        CurrentBatchTimestamp(offsetSeqMetadata.batchTimestampMs,
-          ct.dataType)
+          ct.dataType).toLiteral
      case cd: CurrentDate =>
        CurrentBatchTimestamp(offsetSeqMetadata.batchTimestampMs,
-          cd.dataType, cd.timeZoneId)
+          cd.dataType, cd.timeZoneId).toLiteral
    }

Contributor Author:
@dongjoon-hyun
Actually, I meant that we pass newBatchesPlan instead of newAttributePlan only for extracting the schema, since we expect the names and data types will not be changed by IncrementalExecution. But IMHO I feel safer pre-transforming it.

Transforming CurrentBatchTimestamp to a Literal outside of IncrementalExecution breaks the intention that the CurrentBatchTimestamp javadoc describes. Please note that I used the transformed plan only for extracting the schema; the actual plan is not changed.
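As a toy illustration of that split (simplified types, not Spark's actual classes): derive the schema from a pre-resolved copy, while the original plan, still containing CurrentBatchTimestamp, is the one that actually executes.

    // Toy expression tree and plan; only the copy used for schema extraction is
    // transformed, mirroring newAttrPlanPreResolvedForSchema vs. newAttributePlan.
    sealed trait Expr { def dataType: String }
    case class Literal(value: Any, dataType: String) extends Expr
    case class BatchTimestamp(ms: Long) extends Expr {
      val dataType = "timestamp"
      def toLiteral: Literal = Literal(ms, dataType) // mirrors cbt.toLiteral
    }

    case class Plan(exprs: Seq[Expr]) {
      def transformAllExpressions(f: PartialFunction[Expr, Expr]): Plan =
        Plan(exprs.map(e => f.applyOrElse(e, identity[Expr])))
      def schema: Seq[String] = exprs.map(_.dataType)
    }

    object SchemaOnlyDemo extends App {
      val actualPlan = Plan(Seq(BatchTimestamp(1545000000000L)))
      // Pre-resolve a copy only to read the schema; actualPlan stays untouched.
      val forSchemaOnly = actualPlan.transformAllExpressions {
        case bt: BatchTimestamp => bt.toLiteral
      }
      println(forSchemaOnly.schema) // List(timestamp)
    }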

Member:
+1

case cbt: CurrentBatchTimestamp => cbt.toLiteral
}

val triggerLogicalPlan = sink match {
case _: Sink => newAttributePlan
case s: StreamingWriteSupportProvider =>
val writer = s.createStreamingWriteSupport(
s"$runId",
-          newAttributePlan.schema,
+          newAttrPlanPreResolvedForSchema.schema,
outputMode,
new DataSourceOptions(extraOptions.asJava))
WriteToDataSourceV2(new MicroBatchWrite(currentBatchId, writer), newAttributePlan)
@@ -1079,6 +1079,42 @@ class StreamSuite extends StreamTest {
assert(query.exception.isEmpty)
}
}

Seq(true, false).foreach { useV2Sink =>
Contributor:
This structure makes it impossible to execute a test independently (at least, I don't know how). The whole suite has to be executed, which makes even small modifications time-consuming.

Contributor Author:
Right. That was to minimize the code, but I guess only a few lines will be added and it will become easier to test, so it's better to apply your suggestion. Thanks!
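One possible restructuring along those lines (a sketch only, assuming the FunSuite style StreamSuite already uses; the helper name is hypothetical): hoist the body into a helper and declare each variant as its own named test, so a single variant can be run by name (e.g. sbt testOnly with -z):

    private def runAddColumnExceptionTest(useV2Sink: Boolean): Unit = {
      // ... the original test body, parameterized by useV2Sink ...
    }

    test("SPARK-26379 Structured Streaming - Exception on adding column to Dataset" +
      " - use v2 sink - true") {
      runAddColumnExceptionTest(useV2Sink = true)
    }

    test("SPARK-26379 Structured Streaming - Exception on adding column to Dataset" +
      " - use v2 sink - false") {
      runAddColumnExceptionTest(useV2Sink = false)
    }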

import org.apache.spark.sql.functions._
Contributor:
Already imported.


val newTestName = "SPARK-26379 Structured Streaming - Exception on adding column to Dataset" +
s" - use v2 sink - $useV2Sink"

test(newTestName) {
val input = MemoryStream[Int]
val df = input.toDS().withColumn("cur_timestamp", lit(current_timestamp()))
Contributor:
As I see it, this covers CurrentTimestamp; it might be worth adding a test for CurrentDate as well.
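A hedged sketch of that CurrentDate variant (column name hypothetical), using Spark's current_date function the same way the test uses current_timestamp:

    val dfDate = input.toDS().withColumn("cur_date", lit(current_date()))
    // The check helper would then read a java.sql.Date instead of a Timestamp,
    // e.g. asserting the batch's date is not before the day the test started.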


def assertBatchOutputAndUpdateLastTimestamp(
rows: Seq[Row],
curTimestamp: Long,
expectedValue: Int): Long = {
assert(rows.size === 1)
val row = rows.head
assert(row.getInt(0) === expectedValue)
assert(row.getTimestamp(1).getTime > curTimestamp)
row.getTimestamp(1).getTime
}

var lastTimestamp = -1L
Contributor:
Not much functional difference, but maybe this could be initialized to now instead of -1L.
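i.e., presumably something like the following (a sketch of that suggestion):

    var lastTimestamp = System.currentTimeMillis() // start from "now" rather than -1L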

testStream(df, useV2Sink = useV2Sink) (
AddData(input, 1),
CheckLastBatch { rows: Seq[Row] =>
lastTimestamp = assertBatchOutputAndUpdateLastTimestamp(rows, lastTimestamp, 1)
},
Execute { _ => Thread.sleep(3 * 1000) },
AddData(input, 2),
CheckLastBatch { rows: Seq[Row] =>
lastTimestamp = assertBatchOutputAndUpdateLastTimestamp(rows, lastTimestamp, 2)
}
)
}
}
}

abstract class FakeSource extends StreamSourceProvider {