[FLINK-18726][table-planner-blink] Support INSERT INTO specific colum… #14977

Merged 2 commits on Mar 1, 2021
@@ -259,4 +259,8 @@ private DynamicTableSource createDynamicTableSource(
Thread.currentThread().getContextClassLoader(),
schemaTable.isTemporary());
}

public CatalogTable getCatalogTable() {
return catalogTable;
}
}
@@ -39,6 +39,7 @@ import org.apache.flink.table.planner.plan.schema.{GenericRelDataType, _}
import org.apache.flink.table.runtime.types.{LogicalTypeDataTypeConverter, PlannerTypeUtils}
import org.apache.flink.table.types.logical._
import org.apache.flink.table.typeutils.TimeIndicatorTypeInfo
import org.apache.flink.table.utils.TableSchemaUtils
import org.apache.flink.types.Nothing
import org.apache.flink.util.Preconditions.checkArgument

@@ -234,6 +235,16 @@ class FlinkTypeFactory(typeSystem: RelDataTypeSystem)
buildStructType(fields.map(_.getName), fields.map(_.getType), StructKind.FULLY_QUALIFIED)
}

/**
* Creates a struct type with the physical columns using FlinkTypeFactory
*
* @param tableSchema schema to convert to Calcite's specific one
* @return a struct type with the input fieldNames, input fieldTypes.
*/
def buildPhysicalRelNodeRowType(tableSchema: TableSchema): RelDataType = {
buildRelNodeRowType(TableSchemaUtils.getPhysicalSchema(tableSchema))
}
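For context on what the new helper returns, here is a minimal sketch (the schema, column names, and computed-column expression are illustrative and assume the TableSchema builder API of this Flink version): TableSchemaUtils.getPhysicalSchema drops non-physical columns such as computed columns, so the row type produced by buildPhysicalRelNodeRowType only contains fields that physically exist in the table.

import org.apache.flink.table.api.{DataTypes, TableSchema}
import org.apache.flink.table.utils.TableSchemaUtils

// Illustrative schema: `c` is a computed column and therefore not physical.
val schema = TableSchema.builder()
  .field("a", DataTypes.INT())
  .field("b", DataTypes.STRING())
  .field("c", DataTypes.INT(), "a + 1")
  .build()

// Only `a` and `b` survive; buildPhysicalRelNodeRowType converts this
// physical schema into a Calcite struct type via buildRelNodeRowType.
val physicalSchema = TableSchemaUtils.getPhysicalSchema(schema)
// physicalSchema.getFieldNames => Array("a", "b")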

/**
* Creates a struct type with the input fieldNames and input fieldTypes using FlinkTypeFactory.
*
@@ -21,7 +21,8 @@ package org.apache.flink.table.planner.calcite
import org.apache.flink.sql.parser.SqlProperty
import org.apache.flink.sql.parser.dml.RichSqlInsert
import org.apache.flink.table.api.ValidationException
import org.apache.flink.table.planner.calcite.PreValidateReWriter.appendPartitionProjects
import org.apache.flink.table.planner.calcite.PreValidateReWriter.appendPartitionAndNullsProjects
import org.apache.flink.table.planner.plan.schema.{CatalogSourceTable, FlinkPreparingTableBase, LegacyCatalogSourceTable}

import org.apache.calcite.plan.RelOptTable
import org.apache.calcite.prepare.CalciteCatalogReader
@@ -47,16 +48,17 @@ class PreValidateReWriter(
val typeFactory: RelDataTypeFactory) extends SqlBasicVisitor[Unit] {
override def visit(call: SqlCall): Unit = {
call match {
case r: RichSqlInsert if r.getStaticPartitions.nonEmpty => r.getSource match {
case r: RichSqlInsert
if r.getStaticPartitions.nonEmpty || r.getTargetColumnList != null => r.getSource match {
case select: SqlSelect =>
appendPartitionProjects(r, validator, typeFactory, select, r.getStaticPartitions)
appendPartitionAndNullsProjects(r, validator, typeFactory, select, r.getStaticPartitions)
case values: SqlCall if values.getKind == SqlKind.VALUES =>
val newSource = appendPartitionProjects(r, validator, typeFactory, values,
val newSource = appendPartitionAndNullsProjects(r, validator, typeFactory, values,
r.getStaticPartitions)
r.setOperand(2, newSource)
case source =>
throw new ValidationException(
s"INSERT INTO <table> PARTITION statement only support "
s"INSERT INTO <table> PARTITION [(COLUMN LIST)] statement only support "
+ s"SELECT and VALUES clause for now, '$source' is not supported yet.")
}
case _ =>
@@ -67,8 +69,8 @@ object PreValidateReWriter {
object PreValidateReWriter {
//~ Tools ------------------------------------------------------------------
/**
* Append the static partitions to the data source projection list. The columns are appended to
* the corresponding positions.
* Append the static partitions and unspecified columns to the data source projection list.
* The columns are appended to the corresponding positions.
*
* <p>If we have a table A with schema (&lt;a&gt;, &lt;b&gt;, &lt;c&gt) whose
* partition columns are (&lt;a&gt;, &lt;c&gt;), and got a query
@@ -83,13 +85,25 @@ object PreValidateReWriter {
* </pre></blockquote>
* Where the "tpe1" and "tpe2" are data types of column a and c of target table A.
*
* <p>If we have a table A with schema (&lt;a&gt;, &lt;b&gt;, &lt;c&gt), and got a query
* <blockquote><pre>
* insert into A (a, b)
* select a, b from B
* </pre></blockquote>
* The query would be rewritten to:
* <blockquote><pre>
* insert into A
* select a, b, cast(null as tpeC) from B
* </pre></blockquote>
* Where the "tpeC" is data type of column c for target table A.
*
* @param sqlInsert RichSqlInsert instance
* @param validator Validator
* @param typeFactory type factory
* @param source Source to rewrite
* @param partitions Static partition statements
*/
def appendPartitionProjects(sqlInsert: RichSqlInsert,
def appendPartitionAndNullsProjects(sqlInsert: RichSqlInsert,
validator: FlinkCalciteSqlValidator,
typeFactory: RelDataTypeFactory,
source: SqlCall,
@@ -103,8 +117,7 @@ object PreValidateReWriter {
// just skip to let other validation error throw.
return source
}
val targetRowType = createTargetRowType(typeFactory,
calciteCatalogReader, table, sqlInsert.getTargetColumnList)
val targetRowType = createTargetRowType(typeFactory, table)
// validate partition fields first.
val assignedFields = new util.LinkedHashMap[Integer, SqlNode]
val relOptTable = table match {
@@ -121,26 +134,83 @@ object PreValidateReWriter {
assignedFields.put(targetField.getIndex,
maybeCast(value, value.createSqlType(typeFactory), targetField.getType, typeFactory))
}

// validate partial insert columns.

// the columnList may reorder fields (compare with fields of sink)
val targetPosition = new util.ArrayList[Int]()

if (sqlInsert.getTargetColumnList != null) {
val targetFields = new util.HashSet[Integer]
val targetColumns =
sqlInsert
.getTargetColumnList
.getList
.map(id => {
val targetField = SqlValidatorUtil.getTargetField(
targetRowType, typeFactory, id.asInstanceOf[SqlIdentifier],
calciteCatalogReader, relOptTable)
validateField(targetFields.add, id.asInstanceOf[SqlIdentifier], targetField)
targetField
})

val partitionColumns =
partitions
.getList
.map(property =>
SqlValidatorUtil.getTargetField(
targetRowType, typeFactory, property.asInstanceOf[SqlProperty].getKey,
calciteCatalogReader, relOptTable))

for (targetField <- targetRowType.getFieldList) {
if (!partitionColumns.contains(targetField)) {
if (!targetColumns.contains(targetField)) {
// padding null
val id = new SqlIdentifier(targetField.getName, SqlParserPos.ZERO)
if (!targetField.getType.isNullable) {
throw newValidationError(id, RESOURCE.columnNotNullable(targetField.getName))
}
validateField(idx => !assignedFields.contains(idx), id, targetField)
assignedFields.put(targetField.getIndex,
maybeCast(
SqlLiteral.createNull(SqlParserPos.ZERO),
typeFactory.createUnknownType(),
targetField.getType,
typeFactory))
} else {
// handle reorder
targetPosition.add(targetColumns.indexOf(targetField))
}
}
}
}

source match {
case select: SqlSelect =>
rewriteSelect(validator, select, targetRowType, assignedFields)
rewriteSelect(validator, select, targetRowType, assignedFields, targetPosition)
case values: SqlCall if values.getKind == SqlKind.VALUES =>
rewriteValues(values, targetRowType, assignedFields)
rewriteValues(values, targetRowType, assignedFields, targetPosition)
}
}
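To make the overall rewrite concrete, here is a hedged end-to-end sketch in the style of the values-connector ITCase quoted in the review thread below (table name, schema, and data are illustrative, not part of this change): when the column list omits a nullable column, the rewriter pads it with a CAST(NULL AS ...) projection.

// Target table with a nullable column `c` that the INSERT below omits.
tEnv.executeSql(
  s"""
     |CREATE TABLE sinkA (
     |  `a` INT,
     |  `b` STRING,
     |  `c` BIGINT
     |)
     |WITH (
     |  'connector' = 'values',
     |  'sink-insert-only' = 'false'
     |)
     |""".stripMargin)

// After PreValidateReWriter, this statement behaves like
//   INSERT INTO sinkA SELECT 1, 'x', CAST(NULL AS BIGINT)
tEnv.executeSql("INSERT INTO sinkA (a, b) VALUES (1, 'x')").await()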

private def rewriteSelect(
validator: FlinkCalciteSqlValidator,
select: SqlSelect,
targetRowType: RelDataType,
assignedFields: util.LinkedHashMap[Integer, SqlNode]): SqlCall = {
assignedFields: util.LinkedHashMap[Integer, SqlNode],
targetPosition: util.List[Int]): SqlCall = {
// Expands the select list first in case there is a star(*).
// Validates the select first to register the where scope.
validator.validate(select)
val sourceList = validator.expandStar(select.getSelectList, select, false).getList

val fixedNodes = new util.ArrayList[SqlNode]
val currentNodes = new util.ArrayList[SqlNode](sourceList)
val currentNodes =
if (targetPosition.isEmpty) {
new util.ArrayList[SqlNode](sourceList)
} else {
reorder(new util.ArrayList[SqlNode](sourceList), targetPosition)
}
0 until targetRowType.getFieldList.length foreach {
idx =>
if (assignedFields.containsKey(idx)) {
@@ -161,7 +231,8 @@ object PreValidateReWriter {
private def rewriteValues(
values: SqlCall,
targetRowType: RelDataType,
assignedFields: util.LinkedHashMap[Integer, SqlNode]): SqlCall = {
assignedFields: util.LinkedHashMap[Integer, SqlNode],
targetPosition: util.List[Int]): SqlCall = {
val fixedNodes = new util.ArrayList[SqlNode]
0 until values.getOperandList.size() foreach {
valueIdx =>
@@ -171,7 +242,12 @@ object PreValidateReWriter {
} else {
Collections.singletonList(value)
}
val currentNodes = new util.ArrayList[SqlNode](valueAsList)
val currentNodes =
if (targetPosition.isEmpty) {
new util.ArrayList[SqlNode](valueAsList)
} else {
reorder(new util.ArrayList[SqlNode](valueAsList), targetPosition)
}
val fieldNodes = new util.ArrayList[SqlNode]
0 until targetRowType.getFieldList.length foreach {
fieldIdx =>
@@ -191,41 +267,40 @@ object PreValidateReWriter {
SqlStdOperatorTable.VALUES.createCall(values.getParserPosition, fixedNodes)
}

private def reorder(
sourceList: util.ArrayList[SqlNode],
targetPosition: util.List[Int]): util.ArrayList[SqlNode] = {
val targetList = new Array[SqlNode](sourceList.size())
0 until sourceList.size() foreach {
idx => targetList(targetPosition.get(idx)) = sourceList.get(idx)
Contributor commented: Here it should be idx => targetList(idx) = sourceList.get(targetPosition.get(idx)) instead. What do you think? @leonardBang @wuchong

@wuchong (Member, Mar 10, 2021) replied: Is there any test to prove this?

Contributor replied with the following ITCase:
@Test
  def testPartialInsertWithComplexReorder(): Unit = {
    tEnv.executeSql(
      s"""
         |CREATE TABLE testSink (
         |  `a` INT,
         |  `c` STRING,
         |  `c1` STRING,
         |  `c2` STRING,
         |  `c3` BIGINT,
         |  `d` INT,
         |  `e` DOUBLE
         |)
         |WITH (
         |  'connector' = 'values',
         |  'sink-insert-only' = 'false'
         |)
         |""".stripMargin)

    val t = env.fromCollection(tupleData2).toTable(tEnv, 'x, 'y)
    tEnv.createTemporaryView("MyTable", t)

    tEnv.executeSql(
      s"""
         |INSERT INTO testSink (a,c2,e,c,c1,c3,d)
         |SELECT 1,'c2',sum(y),'c','c1',33333,12 FROM MyTable GROUP BY x
         |""".stripMargin).await()
    val expected = List(
      "1,c,c1,c2,33333,12,0.1",
      "1,c,c1,c2,33333,12,0.4",
      "1,c,c1,c2,33333,12,1.0",
      "1,c,c1,c2,33333,12,2.2",
      "1,c,c1,c2,33333,12,3.9")
    val result = TestValuesTableFactory.getResults("testSink")
    assertEquals(expected.sorted, result.sorted)
  }

Contributor added: BTW, I think we should use plan testing instead of an ITCase.

}
new util.ArrayList[SqlNode](targetList.toList)
}
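A self-contained sketch of the index question raised in the review thread above (values are illustrative): with targetPosition(k) holding the source position of the k-th target field, the assignment in the diff and the one suggested in the review apply inverse permutations, so they only agree when the permutation is its own inverse.

import java.util

// targetPosition(k) = position of the k-th target field in the source list.
val source = util.Arrays.asList("s0", "s1", "s2")
val targetPosition = util.Arrays.asList(2, 0, 1)

// Variant in the diff: place source(k) at slot targetPosition(k).
val asMerged = new Array[String](source.size())
(0 until source.size()).foreach(k => asMerged(targetPosition.get(k)) = source.get(k))
// asMerged => Array("s1", "s2", "s0")

// Variant suggested in the review: read the source at targetPosition(k).
val asSuggested = new Array[String](source.size())
(0 until source.size()).foreach(k => asSuggested(k) = source.get(targetPosition.get(k)))
// asSuggested => Array("s2", "s0", "s1")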
/**
* Derives a row-type for INSERT and UPDATE operations.
* Derives a physical row-type for INSERT and UPDATE operations.
*
* <p>This code snippet is almost inspired by
* [[org.apache.calcite.sql.validate.SqlValidatorImpl#createTargetRowType]].
* It is the best that the logic can be merged into Apache Calcite,
* but this needs time.
*
* @param typeFactory TypeFactory
* @param catalogReader CalciteCatalogReader
* @param table Target table for INSERT/UPDATE
* @param targetColumnList List of target columns, or null if not specified
* @return Rowtype
*/
private def createTargetRowType(
typeFactory: RelDataTypeFactory,
catalogReader: CalciteCatalogReader,
table: SqlValidatorTable,
targetColumnList: SqlNodeList): RelDataType = {
val rowType = table.getRowType
if (targetColumnList == null) return rowType
val fields = new util.ArrayList[util.Map.Entry[String, RelDataType]]
val assignedFields = new util.HashSet[Integer]
val relOptTable = table match {
case t: RelOptTable => t
case _ => null
}
for (node <- targetColumnList) {
val id = node.asInstanceOf[SqlIdentifier]
val targetField = SqlValidatorUtil.getTargetField(rowType,
typeFactory, id, catalogReader, relOptTable)
validateField(assignedFields.add, id, targetField)
fields.add(targetField)
table: SqlValidatorTable): RelDataType = {
table.unwrap(classOf[FlinkPreparingTableBase]) match {
case t: CatalogSourceTable =>
val schema = t.getCatalogTable.getSchema
typeFactory.asInstanceOf[FlinkTypeFactory].buildPhysicalRelNodeRowType(schema)
case t: LegacyCatalogSourceTable[_] =>
val schema = t.catalogTable.getSchema
typeFactory.asInstanceOf[FlinkTypeFactory].buildPhysicalRelNodeRowType(schema)
case _ =>
table.getRowType
}
typeFactory.createStructType(fields)
}

/** Check whether the field is valid. **/