Skip to content

Commit 8995571

Browse files
longvu-db and claude committed
[SPARK-XXXXX][SQL] Add INSERT INTO ... REPLACE ON/USING syntax
This PR introduces two new SQL syntaxes for the `INSERT` command: - `INSERT INTO ... REPLACE ON <condition>` — replaces rows matching a condition - `INSERT INTO ... REPLACE USING (<columns>)` — replaces rows based on matching column values Similar to the [INSERT WITH SCHEMA EVOLUTION PR](apache#53732), Spark is only responsible for recognizing these syntaxes. Since no table format in open-source Spark implements these operations yet, users will receive an unsupported error if they try to use them. Data sources (e.g., Delta Lake) can implement support for these syntaxes by handling the `replaceCriteriaOpt` field in `InsertIntoStatement`. `INSERT INTO ... REPLACE ON/USING` provides SQL syntax for atomically replacing a subset of rows in a table — a common pattern for incremental data loading. This builds on the existing `INSERT INTO ... REPLACE WHERE` syntax (SPARK-40956) and extends it with more flexible matching semantics: - `REPLACE ON` allows matching via arbitrary boolean expressions (e.g., `t.id = s.id`) - `REPLACE USING` allows matching via a list of column names Yes. Two new SQL syntaxes are recognized by the parser: - `INSERT [WITH SCHEMA EVOLUTION] INTO table AS alias [BY NAME] REPLACE ON condition query` - `INSERT [WITH SCHEMA EVOLUTION] INTO table AS alias [BY NAME] REPLACE USING (col1, col2) query` Both currently throw `UNSUPPORTED_INSERT_REPLACE_ON` / `UNSUPPORTED_INSERT_REPLACE_USING`. - DDLParserSuite: Parser tests for REPLACE USING, REPLACE ON, and combined WITH SCHEMA EVOLUTION - PlanResolutionSuite: V2 table unsupported error tests - InsertSuite (core): V1 table unsupported error tests - InsertSuite (hive): Hive table unsupported error tests Yes. Co-Authored-By: Claude Opus 4.6 (1M context) <[email protected]>
1 parent 75757e1 commit 8995571

File tree

15 files changed

+299
-19
lines changed

15 files changed

+299
-19
lines changed

common/utils/src/main/resources/error/error-conditions.json

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7847,6 +7847,18 @@
78477847
},
78487848
"sqlState" : "42809"
78497849
},
7850+
"UNSUPPORTED_INSERT_REPLACE_ON" : {
7851+
"message" : [
7852+
"INSERT INTO ... REPLACE ON is not supported for this table format."
7853+
],
7854+
"sqlState" : "0A000"
7855+
},
7856+
"UNSUPPORTED_INSERT_REPLACE_USING" : {
7857+
"message" : [
7858+
"INSERT INTO ... REPLACE USING is not supported for this table format."
7859+
],
7860+
"sqlState" : "0A000"
7861+
},
78507862
"UNSUPPORTED_INSERT_WITH_SCHEMA_EVOLUTION" : {
78517863
"message" : [
78527864
"INSERT WITH SCHEMA EVOLUTION ... is unsupported for this table format."

sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/SqlBaseParser.g4

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -575,6 +575,8 @@ insertInto
575575
: INSERT (WITH SCHEMA EVOLUTION)? OVERWRITE TABLE? identifierReference optionsClause? (partitionSpec (IF errorCapturingNot EXISTS)?)? ((BY NAME) | identifierList)? #insertOverwriteTable
576576
| INSERT (WITH SCHEMA EVOLUTION)? INTO TABLE? identifierReference optionsClause? partitionSpec? (IF errorCapturingNot EXISTS)? ((BY NAME) | identifierList)? #insertIntoTable
577577
| INSERT (WITH SCHEMA EVOLUTION)? INTO TABLE? identifierReference optionsClause? (BY NAME)? REPLACE whereClause #insertIntoReplaceWhere
578+
| INSERT (WITH SCHEMA EVOLUTION)? INTO TABLE? identifierReference tableAlias optionsClause? (BY NAME)? REPLACE USING identifierList #insertIntoReplaceUsing
579+
| INSERT (WITH SCHEMA EVOLUTION)? INTO TABLE? identifierReference tableAlias optionsClause? (BY NAME)? REPLACE ON replaceOnCondition=booleanExpression #insertIntoReplaceOn
578580
| INSERT OVERWRITE LOCAL? DIRECTORY path=stringLit rowFormat? createFileFormat? #insertOverwriteHiveDir
579581
| INSERT OVERWRITE LOCAL? DIRECTORY (path=stringLit)? tableProvider (OPTIONS options=propertyList)? #insertOverwriteDir
580582
;

sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/Analyzer.scala

Lines changed: 9 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1016,7 +1016,7 @@ class Analyzer(
10161016

10171017
def apply(plan: LogicalPlan)
10181018
: LogicalPlan = plan.resolveOperatorsUpWithPruning(AlwaysProcess.fn, ruleId) {
1019-
case i @ InsertIntoStatement(table, _, _, _, _, _, _, _) =>
1019+
case i @ InsertIntoStatement(table, _, _, _, _, _, _, _, _) =>
10201020
val relation = table match {
10211021
case u: UnresolvedRelation if !u.isStreaming =>
10221022
resolveRelation(u).getOrElse(u)
@@ -1152,13 +1152,20 @@ class Analyzer(
11521152
object ResolveInsertInto extends ResolveInsertionBase {
11531153
override def apply(plan: LogicalPlan): LogicalPlan = plan.resolveOperatorsWithPruning(
11541154
AlwaysProcess.fn, ruleId) {
1155-
case i @ InsertIntoStatement(r: DataSourceV2Relation, _, _, _, _, _, _, _)
1155+
case i @ InsertIntoStatement(r: DataSourceV2Relation, _, _, _, _, _, _, _, _)
11561156
if i.query.resolved =>
11571157
// ifPartitionNotExists is append with validation, but validation is not supported
11581158
if (i.ifPartitionNotExists) {
11591159
throw QueryCompilationErrors.unsupportedIfNotExistsError(r.table.name)
11601160
}
11611161

1162+
i.replaceCriteriaOpt.foreach {
1163+
case _: InsertReplaceOn =>
1164+
throw QueryCompilationErrors.unsupportedInsertReplaceOn()
1165+
case _: InsertReplaceUsing =>
1166+
throw QueryCompilationErrors.unsupportedInsertReplaceUsing()
1167+
}
1168+
11621169
// Create a project if this is an INSERT INTO BY NAME query.
11631170
val projectByName = if (i.userSpecifiedCols.nonEmpty) {
11641171
Some(createProjectForByNameQuery(r.table.name, i))

sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/CheckAnalysis.scala

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -254,7 +254,7 @@ trait CheckAnalysis extends LookupCatalog with QueryErrorsBase with PlanToString
254254
// not found first, instead of errors in the input query of the insert command, by doing a
255255
// top-down traversal.
256256
plan.foreach {
257-
case InsertIntoStatement(u: UnresolvedRelation, _, _, _, _, _, _, _) =>
257+
case InsertIntoStatement(u: UnresolvedRelation, _, _, _, _, _, _, _, _) =>
258258
u.tableNotFound(u.multipartIdentifier)
259259

260260
// TODO (SPARK-27484): handle streaming write commands when we have them.

sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/parser/AstBuilder.scala

Lines changed: 42 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -891,6 +891,10 @@ class AstBuilder extends DataTypeAstBuilder
891891
* [TABLE] tableIdentifier [partitionSpec] ([BY NAME] | [identifierList])
892892
* INSERT [WITH SCHEMA EVOLUTION] INTO
893893
* [TABLE] tableIdentifier REPLACE whereClause
894+
* INSERT [WITH SCHEMA EVOLUTION] INTO
895+
* [TABLE] tableIdentifier tableAlias [BY NAME] REPLACE USING identifierList
896+
* INSERT [WITH SCHEMA EVOLUTION] INTO
897+
* [TABLE] tableIdentifier tableAlias [BY NAME] REPLACE ON booleanExpression
894898
* INSERT OVERWRITE [LOCAL] DIRECTORY STRING [rowFormat] [createFileFormat]
895899
* INSERT OVERWRITE [LOCAL] DIRECTORY [STRING] tableProvider [OPTIONS tablePropertyList]
896900
* }}}
@@ -961,6 +965,44 @@ class AstBuilder extends DataTypeAstBuilder
961965
withSchemaEvolution = ctx.EVOLUTION() != null)
962966
}
963967
})
968+
case ctx: InsertIntoReplaceUsingContext =>
969+
val options = Option(ctx.optionsClause())
970+
val byName = ctx.NAME() != null
971+
val replaceUsingCols =
972+
Option(ctx.identifierList()).map(visitIdentifierList).getOrElse(Nil)
973+
withIdentClause(ctx.identifierReference, Seq(query), (ident, otherPlans) => {
974+
InsertIntoStatement(
975+
table = createUnresolvedRelation(ctx.identifierReference, ident, options,
976+
Seq(TableWritePrivilege.INSERT, TableWritePrivilege.DELETE), isStreaming = false),
977+
partitionSpec = Map.empty,
978+
userSpecifiedCols = Seq.empty,
979+
query = otherPlans.head,
980+
overwrite = true,
981+
ifPartitionNotExists = false,
982+
byName = byName,
983+
withSchemaEvolution = ctx.EVOLUTION() != null,
984+
replaceCriteriaOpt = Some(InsertReplaceUsing(replaceUsingCols)))
985+
})
986+
case ctx: InsertIntoReplaceOnContext =>
987+
val options = Option(ctx.optionsClause())
988+
val byName = ctx.NAME() != null
989+
val replaceOnCond = expression(ctx.replaceOnCondition)
990+
val tableAliasOpt =
991+
getTableAliasWithoutColumnAlias(ctx.tableAlias(), "INSERT REPLACE ON")
992+
withIdentClause(ctx.identifierReference, Seq(query), (ident, otherPlans) => {
993+
val queryWithAlias = otherPlans.head
994+
InsertIntoStatement(
995+
table = createUnresolvedRelation(ctx.identifierReference, ident, options,
996+
Seq(TableWritePrivilege.INSERT, TableWritePrivilege.DELETE), isStreaming = false),
997+
partitionSpec = Map.empty,
998+
userSpecifiedCols = Seq.empty,
999+
query = queryWithAlias,
1000+
overwrite = true,
1001+
ifPartitionNotExists = false,
1002+
byName = byName,
1003+
withSchemaEvolution = ctx.EVOLUTION() != null,
1004+
replaceCriteriaOpt = Some(InsertReplaceOn(replaceOnCond, tableAliasOpt)))
1005+
})
9641006
case dir: InsertOverwriteDirContext =>
9651007
val (isLocal, storage, provider) = visitInsertOverwriteDir(dir)
9661008
InsertIntoDir(isLocal, storage, provider, query, overwrite = true)

sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/plans/logical/statements.scala

Lines changed: 27 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -174,6 +174,7 @@ case class QualifiedColType(
174174
* @param byName If true, reorder the data columns to match the column names of the
175175
* target table.
176176
* @param withSchemaEvolution If true, enables automatic schema evolution for the operation.
177+
* @param replaceCriteriaOpt Optional replace criteria for INSERT REPLACE ON/USING operations.
177178
*/
178179
case class InsertIntoStatement(
179180
table: LogicalPlan,
@@ -183,7 +184,8 @@ case class InsertIntoStatement(
183184
overwrite: Boolean,
184185
ifPartitionNotExists: Boolean,
185186
byName: Boolean = false,
186-
withSchemaEvolution: Boolean = false) extends UnaryParsedStatement {
187+
withSchemaEvolution: Boolean = false,
188+
replaceCriteriaOpt: Option[InsertReplaceCriteria] = None) extends UnaryParsedStatement {
187189

188190
require(overwrite || !ifPartitionNotExists,
189191
"IF NOT EXISTS is only valid in INSERT OVERWRITE")
@@ -196,3 +198,27 @@ case class InsertIntoStatement(
196198
override protected def withNewChildInternal(newChild: LogicalPlan): InsertIntoStatement =
197199
copy(query = newChild)
198200
}
201+
202+
/**
203+
* Sealed trait representing the replace criteria for INSERT REPLACE ON/USING operations.
204+
*/
205+
sealed trait InsertReplaceCriteria
206+
207+
/**
208+
* Replace criteria for INSERT INTO ... REPLACE ON <condition>.
209+
* Rows matching the condition in the target table are replaced by rows from the source query.
210+
*
211+
* @param condition The boolean expression used to match rows for replacement.
212+
* @param tableAliasOpt Optional alias for the target table used in the condition.
213+
*/
214+
case class InsertReplaceOn(
215+
condition: Expression,
216+
tableAliasOpt: Option[String]) extends InsertReplaceCriteria
217+
218+
/**
219+
* Replace criteria for INSERT INTO ... REPLACE USING (<columns>).
220+
* Rows are replaced based on matching values in the specified columns.
221+
*
222+
* @param columns The list of column names used for matching.
223+
*/
224+
case class InsertReplaceUsing(columns: Seq[String]) extends InsertReplaceCriteria

sql/catalyst/src/main/scala/org/apache/spark/sql/errors/QueryCompilationErrors.scala

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -591,6 +591,18 @@ private[sql] object QueryCompilationErrors extends QueryErrorsBase with Compilat
591591
messageParameters = Map.empty)
592592
}
593593

594+
def unsupportedInsertReplaceOn(): Throwable = {
595+
new AnalysisException(
596+
errorClass = "UNSUPPORTED_INSERT_REPLACE_ON",
597+
messageParameters = Map.empty)
598+
}
599+
600+
def unsupportedInsertReplaceUsing(): Throwable = {
601+
new AnalysisException(
602+
errorClass = "UNSUPPORTED_INSERT_REPLACE_USING",
603+
messageParameters = Map.empty)
604+
}
605+
594606
def writeIntoViewNotAllowedError(identifier: TableIdentifier, t: TreeNode[_]): Throwable = {
595607
new AnalysisException(
596608
errorClass = "VIEW_WRITE_NOT_ALLOWED",

sql/catalyst/src/test/scala/org/apache/spark/sql/catalyst/parser/DDLParserSuite.scala

Lines changed: 68 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1874,6 +1874,74 @@ class DDLParserSuite extends AnalysisTest {
18741874
}
18751875
}
18761876

1877+
for (isByName <- Seq(true, false)) {
1878+
val byNameClause = if (isByName) "BY NAME " else ""
1879+
val sourceQuery = "SELECT * FROM source"
1880+
val testMsg = s"isByName=$isByName"
1881+
1882+
test(s"INSERT INTO REPLACE USING - $testMsg") {
1883+
val table = "testcat.ns1.ns2.tbl"
1884+
val insertSQLStmt = s"INSERT INTO $table AS t " +
1885+
s"${byNameClause}REPLACE USING (col1, col2) ${sourceQuery}"
1886+
1887+
parseCompare(
1888+
sql = insertSQLStmt,
1889+
expected = InsertIntoStatement(
1890+
table = UnresolvedRelation(Seq("testcat", "ns1", "ns2", "tbl")),
1891+
partitionSpec = Map.empty,
1892+
userSpecifiedCols = Seq.empty,
1893+
query = Project(Seq(UnresolvedStar(None)), UnresolvedRelation(Seq("source"))),
1894+
overwrite = true,
1895+
ifPartitionNotExists = false,
1896+
byName = isByName,
1897+
withSchemaEvolution = false,
1898+
replaceCriteriaOpt = Some(InsertReplaceUsing(Seq("col1", "col2"))))
1899+
)
1900+
}
1901+
1902+
test(s"INSERT INTO REPLACE ON - $testMsg") {
1903+
val table = "testcat.ns1.ns2.tbl"
1904+
val insertSQLStmt = s"INSERT INTO $table AS t " +
1905+
s"${byNameClause}REPLACE ON t.col1 = col2 ${sourceQuery}"
1906+
1907+
parseCompare(
1908+
sql = insertSQLStmt,
1909+
expected = InsertIntoStatement(
1910+
table = UnresolvedRelation(Seq("testcat", "ns1", "ns2", "tbl")),
1911+
partitionSpec = Map.empty,
1912+
userSpecifiedCols = Seq.empty,
1913+
query = Project(Seq(UnresolvedStar(None)), UnresolvedRelation(Seq("source"))),
1914+
overwrite = true,
1915+
ifPartitionNotExists = false,
1916+
byName = isByName,
1917+
withSchemaEvolution = false,
1918+
replaceCriteriaOpt = Some(InsertReplaceOn(
1919+
EqualTo(UnresolvedAttribute(Seq("t", "col1")), UnresolvedAttribute("col2")),
1920+
Some("t"))))
1921+
)
1922+
}
1923+
1924+
test(s"INSERT WITH SCHEMA EVOLUTION INTO REPLACE USING - $testMsg") {
1925+
val table = "testcat.ns1.ns2.tbl"
1926+
val insertSQLStmt = s"INSERT WITH SCHEMA EVOLUTION INTO $table AS t " +
1927+
s"${byNameClause}REPLACE USING (col1) ${sourceQuery}"
1928+
1929+
parseCompare(
1930+
sql = insertSQLStmt,
1931+
expected = InsertIntoStatement(
1932+
table = UnresolvedRelation(Seq("testcat", "ns1", "ns2", "tbl")),
1933+
partitionSpec = Map.empty,
1934+
userSpecifiedCols = Seq.empty,
1935+
query = Project(Seq(UnresolvedStar(None)), UnresolvedRelation(Seq("source"))),
1936+
overwrite = true,
1937+
ifPartitionNotExists = false,
1938+
byName = isByName,
1939+
withSchemaEvolution = true,
1940+
replaceCriteriaOpt = Some(InsertReplaceUsing(Seq("col1"))))
1941+
)
1942+
}
1943+
}
1944+
18771945
test("delete from table: delete all") {
18781946
parseCompare("DELETE FROM testcat.ns1.ns2.tbl",
18791947
DeleteFromTable(

sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceStrategy.scala

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -163,7 +163,7 @@ object DataSourceAnalysis extends Rule[LogicalPlan] {
163163
CreateDataSourceTableAsSelectCommand(tableDesc, mode, query, query.output.map(_.name))
164164

165165
case InsertIntoStatement(l @ LogicalRelationWithTable(_: InsertableRelation, _),
166-
parts, _, query, overwrite, false, _, _)
166+
parts, _, query, overwrite, false, _, _, _)
167167
if parts.isEmpty =>
168168
InsertIntoDataSourceCommand(l, query, overwrite)
169169

@@ -176,7 +176,7 @@ object DataSourceAnalysis extends Rule[LogicalPlan] {
176176
InsertIntoDataSourceDirCommand(storage, provider.get, query, overwrite)
177177

178178
case i @ InsertIntoStatement(l @ LogicalRelationWithTable(t: HadoopFsRelation, table),
179-
parts, _, query, overwrite, _, _, _)
179+
parts, _, query, overwrite, _, _, _, _)
180180
if query.resolved =>
181181
// If the InsertIntoTable command is for a partitioned HadoopFsRelation and
182182
// the user has specified static partitions, we add a Project operator on top of the query
@@ -312,11 +312,11 @@ class FindDataSourceTable(sparkSession: SparkSession) extends Rule[LogicalPlan]
312312

313313
override def apply(plan: LogicalPlan): LogicalPlan = plan resolveOperators {
314314
case i @ InsertIntoStatement(UnresolvedCatalogRelation(tableMeta, options, false),
315-
_, _, _, _, _, _, _) if DDLUtils.isDatasourceTable(tableMeta) =>
315+
_, _, _, _, _, _, _, _) if DDLUtils.isDatasourceTable(tableMeta) =>
316316
i.copy(table = readDataSourceTable(tableMeta, options))
317317

318318
case i @ InsertIntoStatement(UnresolvedCatalogRelation(tableMeta, _, false),
319-
_, _, _, _, _, _, _) =>
319+
_, _, _, _, _, _, _, _) =>
320320
i.copy(table = DDLUtils.readHiveTable(tableMeta))
321321

322322
case append @ AppendData(

sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FallBackFileSourceV2.scala

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,7 @@ import org.apache.spark.sql.execution.datasources.v2.{ExtractV2Table, FileTable}
3535
class FallBackFileSourceV2(sparkSession: SparkSession) extends Rule[LogicalPlan] {
3636
override def apply(plan: LogicalPlan): LogicalPlan = plan resolveOperators {
3737
case i @ InsertIntoStatement(
38-
d @ ExtractV2Table(table: FileTable), _, _, _, _, _, _, _) =>
38+
d @ ExtractV2Table(table: FileTable), _, _, _, _, _, _, _, _) =>
3939
val v1FileFormat = table.fallbackFileFormat.getDeclaredConstructor().newInstance()
4040
val relation = HadoopFsRelation(
4141
table.fileIndex,

0 commit comments

Comments
 (0)