Skip to content

Commit

Permalink
[paypal#247] [spark] Bump Spark Version to 2.4.7 | Bump Spark Version…
Browse files Browse the repository at this point in the history
… to 2.4.7 along with other stack to align with gcp_dataproc_1.5.x
  • Loading branch information
Dee-Pac committed Nov 8, 2020
1 parent a83d31f commit c4b6716
Show file tree
Hide file tree
Showing 28 changed files with 39 additions and 49 deletions.
2 changes: 1 addition & 1 deletion gimel-dataapi/gimel-common/pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -150,7 +150,7 @@ under the License.
</dependency>
<dependency>
<groupId>org.apache.spark</groupId>
<artifactId>spark-streaming-kafka-${kafka.binary.version}_${scala.binary.version}</artifactId>
<artifactId>spark-streaming-kafka-${spark.kafka.connector.version}</artifactId>
<version>${spark.version}</version>
<scope>${spark.packaging.scope}</scope>
</dependency>
Expand Down
14 changes: 12 additions & 2 deletions gimel-dataapi/gimel-connectors/gimel-hbase/pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -47,8 +47,18 @@ under the License.
<dependency>
<groupId>com.hortonworks</groupId>
<artifactId>shc-core</artifactId>
<version>${hortonworks.shc.version}-${spark.binary.version}-s_${scala.binary.version}</version>
<version>1.1.1-2.1-s_2.11</version>
<scope>${packaging.scope}</scope>
<exclusions>
<exclusion>
<groupId>org.apache.spark</groupId>
<artifactId>*</artifactId>
</exclusion>
<exclusion>
<groupId>org.scala-lang</groupId>
<artifactId>*</artifactId>
</exclusion>
</exclusions>
</dependency>
<dependency>
<groupId>org.apache.hbase</groupId>
Expand Down Expand Up @@ -179,7 +189,7 @@ under the License.
<plugin>
<groupId>org.apache.maven.plugins</groupId>
<artifactId>maven-shade-plugin</artifactId>
<version>3.0.0</version>
<version>${maven.shade.plugin.version}</version>
<configuration>
<relocations>
<relocation>
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -98,7 +98,11 @@ class ExtendedJdbcRDD[T: ClassTag](
protected var finished = false
val logger = Logger(this.getClass.getName)

context.addTaskCompletionListener { context => closeIfNeeded() }
context.addTaskCompletionListener{
(context: org.apache.spark.TaskContext) =>
closeIfNeeded()
"dummy"
}

val conn: Connection = getConnection()

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -349,6 +349,9 @@ class JDBCUtilities(sparkSession: SparkSession) extends Serializable {
st
}

// private def handlePartition(partition:Iterator[Row]):Unit = {
//
// }
/**
* This method inserts into given table in given mode
*
Expand All @@ -374,10 +377,8 @@ class JDBCUtilities(sparkSession: SparkSession) extends Serializable {
}
case _ => // do nothing
}


// For each partition create a temp table to insert
dataFrame.foreachPartition { batch =>
dataFrame.foreachPartition { batch: Iterator[Row] =>

// create logger inside the executor
val logger = Logger(this.getClass.getName)
Expand Down Expand Up @@ -572,7 +573,7 @@ class JDBCUtilities(sparkSession: SparkSession) extends Serializable {
*/
private def updateTable(dataFrame: DataFrame, jdbcConnectionUtility: JDBCConnectionUtility,
jdbcHolder: JDBCArgsHolder) {
dataFrame.foreachPartition { batch =>
dataFrame.foreachPartition { batch: Iterator[Row] =>
if (batch.nonEmpty) {
// create logger inside the executor
val logger = Logger(this.getClass.getName)
Expand Down Expand Up @@ -630,7 +631,7 @@ class JDBCUtilities(sparkSession: SparkSession) extends Serializable {
*/
private def upsertTable(dataFrame: DataFrame, jDBCConnectionUtility: JDBCConnectionUtility,
jdbcHolder: JDBCArgsHolder) {
dataFrame.foreachPartition { batch =>
dataFrame.foreachPartition { batch: Iterator[Row] =>
// create logger inside the executor
val logger = Logger(this.getClass.getName)
if (batch.nonEmpty) {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,7 @@ under the License.
</parent>
<modelVersion>4.0.0</modelVersion>

<artifactId>gimel-kafka-2.2</artifactId>
<artifactId>gimel-kafka</artifactId>
<version>2.4.7-SNAPSHOT</version>

<dependencies>
Expand All @@ -37,6 +37,14 @@ under the License.
<artifactId>gimel-common</artifactId>
<version>${gimel.version}-SNAPSHOT</version>
<exclusions>
<exclusion>
<groupId>org.apache.hbase</groupId>
<artifactId>*</artifactId>
</exclusion>
<exclusion>
<groupId>org.apache.hadoop</groupId>
<artifactId>*</artifactId>
</exclusion>
<exclusion>
<groupId>com.fasterxml.jackson.core</groupId>
<artifactId>jackson-core</artifactId>
Expand All @@ -51,45 +59,18 @@ under the License.
</exclusion>
</exclusions>
</dependency>
<dependency>
<groupId>com.databricks</groupId>
<artifactId>spark-avro_${scala.binary.version}</artifactId>
<version>3.2.0</version>
<scope>${packaging.scope}</scope>
</dependency>
<dependency>
<groupId>org.apache.spark</groupId>
<artifactId>spark-sql-kafka-${spark.kafka.connector.version}</artifactId>
<version>${spark.version}</version>
<scope>${packaging.scope}</scope>
<exclusions>
<exclusion>
<groupId>org.apache.kafka</groupId>
<artifactId>kafka-clients</artifactId>
</exclusion>
</exclusions>
</dependency>
<!--kafka Clients-->
<dependency>
<groupId>org.apache.kafka</groupId>
<artifactId>kafka-clients</artifactId>
<version>${kafka.version}</version>
</dependency>
<dependency>
<groupId>com.fasterxml.jackson.core</groupId>
<artifactId>jackson-core</artifactId>
<version>${jackson.version}</version>
</dependency>
<dependency>
<groupId>com.fasterxml.jackson.core</groupId>
<artifactId>jackson-annotations</artifactId>
<version>${jackson.version}</version>
</dependency>
<dependency>
<groupId>com.fasterxml.jackson.core</groupId>
<artifactId>jackson-databind</artifactId>
<version>${jackson.version}</version>
</dependency>

<!-- Test dependencies -->
<!-- To reuse some of the common testing utilities -->
Expand Down Expand Up @@ -163,12 +144,6 @@ under the License.
<version>${confluent.version}</version>
<scope>test</scope>
</dependency>
<dependency>
<groupId>org.apache.avro</groupId>
<artifactId>avro</artifactId>
<version>1.7.7</version>
<scope>test</scope>
</dependency>
<!-- Kafka local testing utility needs Netty 3.x at test scope for the minicluster -->
<dependency>
<groupId>io.netty</groupId>
Expand Down Expand Up @@ -234,7 +209,7 @@ under the License.
<plugin>
<groupId>org.apache.maven.plugins</groupId>
<artifactId>maven-shade-plugin</artifactId>
<version>3.2.1</version>
<version>${maven.shade.plugin.version}</version>
<configuration>
<relocations>
<relocation>
Expand Down
10 changes: 5 additions & 5 deletions gimel-dataapi/pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -43,11 +43,11 @@ under the License.
<module>gimel-connectors/gimel-hive</module>
<module>gimel-connectors/gimel-restapi</module>
<module>gimel-connectors/gimel-s3</module>
<module>gimel-connectors/gimel-kafka</module>
<module>gimel-connectors/gimel-jdbc</module>
<module>gimel-connectors/gimel-hbase</module>
<module>gimel-connectors/gimel-cassandra-2.0</module>
<module>gimel-connectors/gimel-aerospike-3.14</module>
<module>gimel-connectors/gimel-kafka-2.2</module>
<module>gimel-connectors/gimel-druid-0.82</module>
<module>gimel-core</module>
<module>gimel-sql</module>
Expand All @@ -67,9 +67,9 @@ under the License.
<jackson.version>2.6.7</jackson.version>
<java.version>1.8</java.version>
<jersey.version>1.19.4</jersey.version>
<kafka.paypal.monitoring.version>1.3.2</kafka.paypal.monitoring.version>
<kafka.version>2.2.1</kafka.version>
<kafka.binary.version>0-10</kafka.binary.version>
<!-- <kafka.paypal.monitoring.version>1.3.2</kafka.paypal.monitoring.version>-->
<kafka.version>2.1.1</kafka.version>
<!-- <kafka.binary.version>0-10</kafka.binary.version>-->
<protobuf.javaformatter.version>1.4</protobuf.javaformatter.version>
<gimel.logging.spark.binary.version>2.3</gimel.logging.spark.binary.version>
<gimel.logging.version>0.4.3-SNAPSHOT</gimel.logging.version>
Expand All @@ -80,7 +80,7 @@ under the License.
<teradata.version>15.10.00.22</teradata.version>
<zookeeper.version>3.4.13</zookeeper.version>
<curator.version>2.13.0</curator.version>
<spark.kafka.connector.version>0-10_2.11</spark.kafka.connector.version>
<spark.kafka.connector.version>0-10_2.12</spark.kafka.connector.version>
<spark.sftp.version>1.1.3</spark.sftp.version>
<!-- These are added because of conflict in hbase-testing-utility-->
<netty.hadoop.version>3.9.9.Final</netty.hadoop.version>
Expand Down

0 comments on commit c4b6716

Please sign in to comment.