Skip to content

Commit

Permalink
[spark] Merge Into: When Not Matched By Source (#2517)
Browse files Browse the repository at this point in the history
  • Loading branch information
YannByron authored Dec 22, 2023
1 parent a33dc68 commit 554ae64
Show file tree
Hide file tree
Showing 12 changed files with 682 additions and 156 deletions.
Original file line number Diff line number Diff line change
@@ -0,0 +1,56 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.paimon.spark.catalyst.analysis

import org.apache.paimon.spark.SparkTable
import org.apache.paimon.spark.commands.MergeIntoPaimonTable

import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.expressions.AttributeReference
import org.apache.spark.sql.catalyst.plans.logical.{MergeAction, MergeIntoTable}

/**
 * A post-hoc resolution rule for MergeInto.
 *
 * This implementation has no support for the WHEN NOT MATCHED BY SOURCE clause: it never
 * resolves any such actions and refuses to build a command when some are handed to it.
 */
case class PaimonMergeInto(spark: SparkSession) extends PaimonMergeIntoBase {

  /** Always yields an empty sequence; `merge` and `targetOutput` are not inspected. */
  override def resolveNotMatchedBySourceActions(
      merge: MergeIntoTable,
      targetOutput: Seq[AttributeReference]): Seq[MergeAction] =
    Seq.empty[MergeAction]

  /**
   * Assembles the [[MergeIntoPaimonTable]] command from the table, the target/source/condition
   * of `merge`, and the aligned action lists.
   *
   * @throws RuntimeException if `alignedNotMatchedBySourceActions` is non-empty
   */
  override def buildMergeIntoPaimonTable(
      v2Table: SparkTable,
      merge: MergeIntoTable,
      alignedMatchedActions: Seq[MergeAction],
      alignedNotMatchedActions: Seq[MergeAction],
      alignedNotMatchedBySourceActions: Seq[MergeAction]): MergeIntoPaimonTable =
    if (alignedNotMatchedBySourceActions.isEmpty) {
      MergeIntoPaimonTable(
        v2Table,
        merge.targetTable,
        merge.sourceTable,
        merge.mergeCondition,
        alignedMatchedActions,
        alignedNotMatchedActions,
        alignedNotMatchedBySourceActions)
    } else {
      // The clause is rejected outright rather than silently dropped.
      throw new RuntimeException("WHEN NOT MATCHED BY SOURCE is not supported here.")
    }
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,49 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.paimon.spark.catalyst.analysis

import org.apache.spark.sql.catalyst.expressions.Expression
import org.apache.spark.sql.catalyst.plans.logical.{LogicalPlan, MergeAction, MergeIntoTable}

/** Resolver for MergeInto plans that does not handle the WHEN NOT MATCHED BY SOURCE clause. */
object PaimonMergeIntoResolver extends PaimonMergeIntoResolverBase {

  /** Always returns an empty sequence; none of the arguments is consulted. */
  def resolveNotMatchedBySourceActions(
      merge: MergeIntoTable,
      target: LogicalPlan,
      source: LogicalPlan,
      resolve: (Expression, LogicalPlan) => Expression): Seq[MergeAction] =
    Seq.empty[MergeAction]

  /**
   * Returns a copy of `merge` carrying the resolved condition, matched actions and not-matched
   * actions.
   *
   * @throws RuntimeException if `resolvedNotMatchedBySource` is non-empty
   */
  def build(
      merge: MergeIntoTable,
      resolvedCond: Expression,
      resolvedMatched: Seq[MergeAction],
      resolvedNotMatched: Seq[MergeAction],
      resolvedNotMatchedBySource: Seq[MergeAction]): MergeIntoTable =
    if (resolvedNotMatchedBySource.isEmpty) {
      merge.copy(
        mergeCondition = resolvedCond,
        matchedActions = resolvedMatched,
        notMatchedActions = resolvedNotMatched)
    } else {
      // The clause is rejected outright rather than silently dropped.
      throw new RuntimeException("WHEN NOT MATCHED BY SOURCE is not supported here.")
    }

}
Original file line number Diff line number Diff line change
@@ -0,0 +1,56 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.paimon.spark.catalyst.analysis

import org.apache.paimon.spark.SparkTable
import org.apache.paimon.spark.commands.MergeIntoPaimonTable

import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.expressions.AttributeReference
import org.apache.spark.sql.catalyst.plans.logical.{MergeAction, MergeIntoTable}

/**
 * A post-hoc resolution rule for MergeInto.
 *
 * This implementation has no support for the WHEN NOT MATCHED BY SOURCE clause: it never
 * resolves any such actions and refuses to build a command when some are handed to it.
 */
case class PaimonMergeInto(spark: SparkSession) extends PaimonMergeIntoBase {

  /** Always yields an empty sequence; `merge` and `targetOutput` are not inspected. */
  override def resolveNotMatchedBySourceActions(
      merge: MergeIntoTable,
      targetOutput: Seq[AttributeReference]): Seq[MergeAction] =
    Seq.empty[MergeAction]

  /**
   * Assembles the [[MergeIntoPaimonTable]] command from the table, the target/source/condition
   * of `merge`, and the aligned action lists.
   *
   * @throws RuntimeException if `alignedNotMatchedBySourceActions` is non-empty
   */
  override def buildMergeIntoPaimonTable(
      v2Table: SparkTable,
      merge: MergeIntoTable,
      alignedMatchedActions: Seq[MergeAction],
      alignedNotMatchedActions: Seq[MergeAction],
      alignedNotMatchedBySourceActions: Seq[MergeAction]): MergeIntoPaimonTable =
    if (alignedNotMatchedBySourceActions.isEmpty) {
      MergeIntoPaimonTable(
        v2Table,
        merge.targetTable,
        merge.sourceTable,
        merge.mergeCondition,
        alignedMatchedActions,
        alignedNotMatchedActions,
        alignedNotMatchedBySourceActions)
    } else {
      // The clause is rejected outright rather than silently dropped.
      throw new RuntimeException("WHEN NOT MATCHED BY SOURCE is not supported here.")
    }
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,49 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.paimon.spark.catalyst.analysis

import org.apache.spark.sql.catalyst.expressions.Expression
import org.apache.spark.sql.catalyst.plans.logical.{LogicalPlan, MergeAction, MergeIntoTable}

/** Resolver for MergeInto plans that does not handle the WHEN NOT MATCHED BY SOURCE clause. */
object PaimonMergeIntoResolver extends PaimonMergeIntoResolverBase {

  /** Always returns an empty sequence; none of the arguments is consulted. */
  def resolveNotMatchedBySourceActions(
      merge: MergeIntoTable,
      target: LogicalPlan,
      source: LogicalPlan,
      resolve: (Expression, LogicalPlan) => Expression): Seq[MergeAction] =
    Seq.empty[MergeAction]

  /**
   * Returns a copy of `merge` carrying the resolved condition, matched actions and not-matched
   * actions.
   *
   * @throws RuntimeException if `resolvedNotMatchedBySource` is non-empty
   */
  def build(
      merge: MergeIntoTable,
      resolvedCond: Expression,
      resolvedMatched: Seq[MergeAction],
      resolvedNotMatched: Seq[MergeAction],
      resolvedNotMatchedBySource: Seq[MergeAction]): MergeIntoTable =
    if (resolvedNotMatchedBySource.isEmpty) {
      merge.copy(
        mergeCondition = resolvedCond,
        matchedActions = resolvedMatched,
        notMatchedActions = resolvedNotMatched)
    } else {
      // The clause is rejected outright rather than silently dropped.
      throw new RuntimeException("WHEN NOT MATCHED BY SOURCE is not supported here.")
    }

}
Original file line number Diff line number Diff line change
@@ -0,0 +1,56 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.paimon.spark.catalyst.analysis

import org.apache.paimon.spark.SparkTable
import org.apache.paimon.spark.commands.MergeIntoPaimonTable

import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.expressions.AttributeReference
import org.apache.spark.sql.catalyst.plans.logical.{MergeAction, MergeIntoTable}

/**
 * A post-hoc resolution rule for MergeInto.
 *
 * This implementation has no support for the WHEN NOT MATCHED BY SOURCE clause: it never
 * resolves any such actions and refuses to build a command when some are handed to it.
 */
case class PaimonMergeInto(spark: SparkSession) extends PaimonMergeIntoBase {

  /** Always yields an empty sequence; `merge` and `targetOutput` are not inspected. */
  override def resolveNotMatchedBySourceActions(
      merge: MergeIntoTable,
      targetOutput: Seq[AttributeReference]): Seq[MergeAction] =
    Seq.empty[MergeAction]

  /**
   * Assembles the [[MergeIntoPaimonTable]] command from the table, the target/source/condition
   * of `merge`, and the aligned action lists.
   *
   * @throws RuntimeException if `alignedNotMatchedBySourceActions` is non-empty
   */
  override def buildMergeIntoPaimonTable(
      v2Table: SparkTable,
      merge: MergeIntoTable,
      alignedMatchedActions: Seq[MergeAction],
      alignedNotMatchedActions: Seq[MergeAction],
      alignedNotMatchedBySourceActions: Seq[MergeAction]): MergeIntoPaimonTable =
    if (alignedNotMatchedBySourceActions.isEmpty) {
      MergeIntoPaimonTable(
        v2Table,
        merge.targetTable,
        merge.sourceTable,
        merge.mergeCondition,
        alignedMatchedActions,
        alignedNotMatchedActions,
        alignedNotMatchedBySourceActions)
    } else {
      // The clause is rejected outright rather than silently dropped.
      throw new RuntimeException("WHEN NOT MATCHED BY SOURCE is not supported here.")
    }
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,49 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.paimon.spark.catalyst.analysis

import org.apache.spark.sql.catalyst.expressions.Expression
import org.apache.spark.sql.catalyst.plans.logical.{LogicalPlan, MergeAction, MergeIntoTable}

/** Resolver for MergeInto plans that does not handle the WHEN NOT MATCHED BY SOURCE clause. */
object PaimonMergeIntoResolver extends PaimonMergeIntoResolverBase {

  /** Always returns an empty sequence; none of the arguments is consulted. */
  def resolveNotMatchedBySourceActions(
      merge: MergeIntoTable,
      target: LogicalPlan,
      source: LogicalPlan,
      resolve: (Expression, LogicalPlan) => Expression): Seq[MergeAction] =
    Seq.empty[MergeAction]

  /**
   * Returns a copy of `merge` carrying the resolved condition, matched actions and not-matched
   * actions.
   *
   * @throws RuntimeException if `resolvedNotMatchedBySource` is non-empty
   */
  def build(
      merge: MergeIntoTable,
      resolvedCond: Expression,
      resolvedMatched: Seq[MergeAction],
      resolvedNotMatched: Seq[MergeAction],
      resolvedNotMatchedBySource: Seq[MergeAction]): MergeIntoTable =
    if (resolvedNotMatchedBySource.isEmpty) {
      merge.copy(
        mergeCondition = resolvedCond,
        matchedActions = resolvedMatched,
        notMatchedActions = resolvedNotMatched)
    } else {
      // The clause is rejected outright rather than silently dropped.
      throw new RuntimeException("WHEN NOT MATCHED BY SOURCE is not supported here.")
    }

}
Loading

0 comments on commit 554ae64

Please sign in to comment.