Skip to content

Commit 9fb185f

Browse files
authored
Bump to Spark 3.2.2 (#170)
* Bumping to Spark 3.2.2 * Page update * Fixing SPARK-35132 * Bumping netty to 4.1.68.Final
1 parent a0c9ad1 commit 9fb185f

13 files changed

Lines changed: 58 additions & 24 deletions

build.sbt

Lines changed: 15 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@ import sbtassembly.AssemblyPlugin.autoImport.ShadeRule
33
import scala.util.Properties
44

55
name := """sequila"""
6-
val DEFAULT_SPARK_3_VERSION = "3.1.2"
6+
val DEFAULT_SPARK_3_VERSION = "3.2.2"
77
lazy val sparkVersion = Properties.envOrElse("SPARK_VERSION", DEFAULT_SPARK_3_VERSION)
88

99
version := s"${sys.env.getOrElse("VERSION", "0.1.0")}"
@@ -18,6 +18,16 @@ val DEFAULT_HADOOP_VERSION = "3.1.2"
1818

1919
lazy val hadoopVersion = Properties.envOrElse("SPARK_HADOOP_VERSION", DEFAULT_HADOOP_VERSION)
2020

21+
val nettyVersion = "4.1.68.Final"
22+
dependencyOverrides += "io.netty" % "netty-all" % nettyVersion
23+
dependencyOverrides += "io.netty" % "netty-buffer" % nettyVersion
24+
dependencyOverrides += "io.netty" % "netty-codec" % nettyVersion
25+
dependencyOverrides += "io.netty" % "netty-common" % nettyVersion
26+
dependencyOverrides += "io.netty" % "netty-handler" % nettyVersion
27+
dependencyOverrides += "io.netty" % "netty-resolver" % nettyVersion
28+
dependencyOverrides += "io.netty" % "netty-transport" % nettyVersion
29+
dependencyOverrides += "io.netty" % "netty-transport-native-epoll" % nettyVersion
30+
dependencyOverrides += "io.netty" % "netty-transport-native-unix-common" % nettyVersion
2131
dependencyOverrides += "com.google.guava" % "guava" % "15.0"
2232
dependencyOverrides += "org.apache.orc" % "orc-core" % "1.6.9"
2333
dependencyOverrides += "org.apache.logging.log4j" % "log4j-core" % "2.3"
@@ -30,7 +40,7 @@ libraryDependencies += "org.apache.spark" %% "spark-core" % sparkVersion
3040
libraryDependencies += "org.apache.spark" %% "spark-sql" % sparkVersion
3141
libraryDependencies += "com.github.mrpowers" %% "spark-fast-tests" % "0.21.3"
3242
libraryDependencies += "com.github.mrpowers" %% "spark-daria" % "0.38.2"
33-
libraryDependencies += "com.holdenkarau" %% "spark-testing-base" % "3.1.2_1.1.0" % "test" excludeAll ExclusionRule(organization = "javax.servlet") excludeAll (ExclusionRule("org.apache.hadoop"))
43+
libraryDependencies += "com.holdenkarau" %% "spark-testing-base" % "3.2.0_1.2.0" % "test" excludeAll ExclusionRule(organization = "javax.servlet") excludeAll (ExclusionRule("org.apache.hadoop"))
3444
libraryDependencies += "org.bdgenomics.adam" %% "adam-core-spark3" % "0.36.0" excludeAll (ExclusionRule("org.seqdoop"))
3545
libraryDependencies += "org.bdgenomics.adam" %% "adam-apis-spark3" % "0.36.0" excludeAll (ExclusionRule("org.seqdoop"))
3646
libraryDependencies += "org.bdgenomics.adam" %% "adam-cli-spark3" % "0.36.0" excludeAll (ExclusionRule("org.seqdoop"))
@@ -156,7 +166,8 @@ publishTo := {
156166
if (!version.value.toLowerCase.contains("snapshot")) {
157167
sonatypePublishToBundle.value
158168
} else {
159-
val nexus = "http://zsibio.ii.pw.edu.pl/nexus/repository/"
169+
val nexus = "https://zsibio.ii.pw.edu.pl/nexus/repository/"
160170
Some("snapshots" at nexus + "maven-snapshots")
161171
}
162-
}
172+
}
173+
ThisBuild / useCoursier := true

page/content/en/_index.html

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -82,14 +82,14 @@ <h2 class="text-center">Getting started</h2>
8282
<div class="text-left">
8383
{{< highlight bash>}}
8484
# ensure you have Apache Spark and GraalVM installed
85-
sdk install spark 3.1.2
85+
sdk install spark 3.2.2
8686
sdk install java 21.3.0.r11-grl
8787
# set Apache Spark and JDK using sdkman
88-
sdk use spark 3.1.2
88+
sdk use spark 3.2.2
8989
# use GraalVM for best performance
9090
sdk use java 21.3.0.r11-grl
9191
# in case you prefer to use a Python interface
92-
pip install pysequila==0.3.3
92+
pip install pysequila==0.4.0
9393
# download sample data
9494
mkdir -p data
9595
#BAM
@@ -130,7 +130,7 @@ <h2 class="text-center">Getting started</h2>
130130
{{< highlight bash>}}
131131
pyspark --master local[1] \
132132
--driver-memory 4g \
133-
--packages org.biodatageeks:sequila_2.12:1.0.0
133+
--packages org.biodatageeks:sequila_2.12:1.1.0
134134
{{< / highlight >}}
135135
{{< highlight python>}}
136136
from pysequila import SequilaSession
@@ -187,7 +187,7 @@ <h2 class="text-center">Getting started</h2>
187187
{{< highlight bash>}}
188188
pyspark --master local[1] \
189189
--driver-memory 4g \
190-
--packages org.biodatageeks:sequila_2.12:1.0.0
190+
--packages org.biodatageeks:sequila_2.12:1.1.0
191191
{{< / highlight >}}
192192
{{< highlight python>}}
193193
from pysequila import SequilaSession
@@ -256,7 +256,7 @@ <h2 class="text-center">Getting started</h2>
256256
{{< highlight bash>}}
257257
pyspark --master local[1] \
258258
--driver-memory 4g \
259-
--packages org.biodatageeks:sequila_2.12:1.0.0
259+
--packages org.biodatageeks:sequila_2.12:1.1.0
260260
{{< / highlight >}}
261261
{{< highlight python>}}
262262
targets_df = ss.read\

project/plugins.sbt

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -9,3 +9,5 @@ addSbtPlugin("com.julianpeeters" % "sbt-avrohugger" % "2.0.0-RC19")
99
addSbtPlugin("org.xerial.sbt" % "sbt-sonatype" % "3.9.4")
1010
addSbtPlugin("com.jsuereth" % "sbt-pgp" % "2.0.1")
1111
addSbtPlugin("org.scalastyle" %% "scalastyle-sbt-plugin" % "1.0.0")
12+
13+
addSbtPlugin("net.virtual-void" % "sbt-dependency-graph" % "0.10.0-RC1")

src/main/scala/org/biodatageeks/sequila/datasources/BAM/SequilaDataSourceStrategy.scala

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -102,6 +102,7 @@ case class SequilaDataSourceStrategy(spark: SparkSession) extends Strategy
102102
l.output.toStructType,
103103
Set.empty,
104104
Set.empty,
105+
None,
105106
toCatalystRDD(l, baseRelation.buildScan()),
106107
baseRelation,
107108
None) :: Nil
@@ -215,6 +216,7 @@ case class SequilaDataSourceStrategy(spark: SparkSession) extends Strategy
215216
projects.map(_.toAttribute).toStructType,
216217
Set.empty,
217218
Set.empty,
219+
None,
218220
scanBuilder(requestedColumns, candidatePredicates, pushedFilters),
219221
relation.relation,
220222
relation.catalogTable.map(_.identifier))
@@ -229,6 +231,7 @@ case class SequilaDataSourceStrategy(spark: SparkSession) extends Strategy
229231
requestedColumns.toStructType,
230232
Set.empty,
231233
Set.empty,
234+
None,
232235
scanBuilder(requestedColumns, candidatePredicates, pushedFilters),
233236
relation.relation,
234237
relation.catalogTable.map(_.identifier))

src/main/scala/org/biodatageeks/sequila/pileup/PileupStrategy.scala

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -119,4 +119,5 @@ case class PileupPlan [T<:BDGAlignInputFormat](plan:LogicalPlan, spark:SparkSess
119119
conf
120120
}
121121

122+
override protected def withNewChildrenInternal(newChildren: IndexedSeq[SparkPlan]): SparkPlan = this
122123
}

src/main/scala/org/biodatageeks/sequila/rangejoins/methods/IntervalTree/IntervalTreeJoinOptim.scala

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -100,4 +100,6 @@ case class IntervalTreeJoinOptim(left: SparkPlan,
100100
}
101101

102102
}
103+
104+
override protected def withNewChildrenInternal(newLeft: SparkPlan, newRight: SparkPlan): SparkPlan = copy(left = newLeft, right = newRight)
103105
}

src/main/scala/org/biodatageeks/sequila/rangejoins/methods/IntervalTree/IntervalTreeJoinOptimChromosome.scala

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -115,4 +115,6 @@ case class IntervalTreeJoinOptimChromosome(left: SparkPlan,
115115
.stats
116116
.sizeInBytes != Long.MaxValue)
117117
}
118+
119+
override protected def withNewChildrenInternal(newLeft: SparkPlan, newRight: SparkPlan): SparkPlan = copy(left = newLeft, right = newRight)
118120
}

src/main/scala/org/biodatageeks/sequila/rangejoins/methods/genApp/IntervalTreeJoin.scala

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -62,4 +62,6 @@ case class IntervalTreeJoin(left: SparkPlan,
6262
}
6363

6464
}
65+
66+
override protected def withNewChildrenInternal(newLeft: SparkPlan, newRight: SparkPlan): SparkPlan = copy(left = newLeft, right = newRight)
6567
}

src/main/scala/org/biodatageeks/sequila/rangejoins/methods/genApp/IntervalTreeJoinChromosome.scala

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -65,4 +65,6 @@ IntervalTreeJoinChromosome(left: SparkPlan,
6565
}
6666

6767
}
68+
69+
override protected def withNewChildrenInternal(newLeft: SparkPlan, newRight: SparkPlan): SparkPlan = copy(left = newLeft, right = newRight)
6870
}

src/main/scala/org/biodatageeks/sequila/utvf/GenomicIntervalStrategy.scala

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -31,4 +31,6 @@ case class GenomicIntervalPlan(plan: LogicalPlan, spark: SparkSession,interval:G
3131
)
3232
}
3333
def children: Seq[SparkPlan] = Nil
34+
35+
override protected def withNewChildrenInternal(newChildren: IndexedSeq[SparkPlan]): SparkPlan = this
3436
}

0 commit comments

Comments
 (0)