Skip to content

Commit 46b0d77

Browse files
authored
Support Spark 2.4.7 & 3.0.1 (#667)
1 parent 54a42cf commit 46b0d77

File tree

4 files changed

+44
-3
lines changed

4 files changed

+44
-3
lines changed

azure-pipelines.yml

+40 -1
Original file line number | Diff line number | Diff line change
@@ -284,6 +284,15 @@ stages:
284284
env:
285285
SPARK_HOME: $(Build.BinariesDirectory)\spark-2.4.6-bin-hadoop2.7
286286

287+
- task: DotNetCoreCLI@2
288+
displayName: 'E2E tests for Spark 2.4.7'
289+
inputs:
290+
command: test
291+
projects: '**/Microsoft.Spark*.E2ETest/*.csproj'
292+
arguments: '--configuration $(buildConfiguration)'
293+
env:
294+
SPARK_HOME: $(Build.BinariesDirectory)\spark-2.4.7-bin-hadoop2.7
295+
287296
- task: DotNetCoreCLI@2
288297
displayName: 'E2E tests for Spark 3.0.0'
289298
inputs:
@@ -293,6 +302,16 @@ stages:
293302
env:
294303
SPARK_HOME: $(Build.BinariesDirectory)\spark-3.0.0-bin-hadoop2.7
295304

305+
306+
- task: DotNetCoreCLI@2
307+
displayName: 'E2E tests for Spark 3.0.1'
308+
inputs:
309+
command: test
310+
projects: '**/Microsoft.Spark*.E2ETest/*.csproj'
311+
arguments: '--configuration $(buildConfiguration)'
312+
env:
313+
SPARK_HOME: $(Build.BinariesDirectory)\spark-3.0.1-bin-hadoop2.7
314+
296315
- stage: ForwardCompatibility
297316
displayName: E2E Forward Compatibility Tests
298317
dependsOn: Build
@@ -558,7 +577,16 @@ stages:
558577
env:
559578
SPARK_HOME: $(Build.BinariesDirectory)\spark-2.4.6-bin-hadoop2.7
560579

561-
# Spark 3.0.0 uses Arrow 0.15.1, which contains a new Arrow spec. This breaks backward
580+
- task: DotNetCoreCLI@2
581+
displayName: 'E2E tests for Spark 2.4.7'
582+
inputs:
583+
command: test
584+
projects: '**/Microsoft.Spark*.E2ETest/*.csproj'
585+
arguments: '--configuration $(buildConfiguration) --filter $(TestsToFilterOut)'
586+
env:
587+
SPARK_HOME: $(Build.BinariesDirectory)\spark-2.4.7-bin-hadoop2.7
588+
589+
# Spark 3.0.* uses Arrow 0.15.1, which contains a new Arrow spec. This breaks backward
562590
# compatibility when using Microsoft.Spark.Worker with incompatible versions of Arrow.
563591
# Skip Arrow tests until the backward compatibility Worker version is updated.
564592
- task: DotNetCoreCLI@2
@@ -571,3 +599,14 @@ stages:
571599
(FullyQualifiedName!=Microsoft.Spark.E2ETest.IpcTests.DataFrameTests.TestVectorUdf)"
572600
env:
573601
SPARK_HOME: $(Build.BinariesDirectory)\spark-3.0.0-bin-hadoop2.7
602+
603+
- task: DotNetCoreCLI@2
604+
displayName: 'E2E tests for Spark 3.0.1'
605+
inputs:
606+
command: test
607+
projects: '**/Microsoft.Spark*.E2ETest/*.csproj'
608+
arguments: "--configuration $(buildConfiguration) --filter $(TestsToFilterOut)&\
609+
(FullyQualifiedName!=Microsoft.Spark.E2ETest.IpcTests.DataFrameTests.TestGroupedMapUdf)&\
610+
(FullyQualifiedName!=Microsoft.Spark.E2ETest.IpcTests.DataFrameTests.TestVectorUdf)"
611+
env:
612+
SPARK_HOME: $(Build.BinariesDirectory)\spark-3.0.1-bin-hadoop2.7

script/download-spark-distros.cmd

+2
Original file line number | Diff line number | Diff line change
@@ -24,6 +24,8 @@ curl -k -L -o spark-2.4.3.tgz https://archive.apache.org/dist/spark/spark-2.4.3/
2424
curl -k -L -o spark-2.4.4.tgz https://archive.apache.org/dist/spark/spark-2.4.4/spark-2.4.4-bin-hadoop2.7.tgz && tar xzvf spark-2.4.4.tgz
2525
curl -k -L -o spark-2.4.5.tgz https://archive.apache.org/dist/spark/spark-2.4.5/spark-2.4.5-bin-hadoop2.7.tgz && tar xzvf spark-2.4.5.tgz
2626
curl -k -L -o spark-2.4.6.tgz https://archive.apache.org/dist/spark/spark-2.4.6/spark-2.4.6-bin-hadoop2.7.tgz && tar xzvf spark-2.4.6.tgz
27+
curl -k -L -o spark-2.4.7.tgz https://archive.apache.org/dist/spark/spark-2.4.7/spark-2.4.7-bin-hadoop2.7.tgz && tar xzvf spark-2.4.7.tgz
2728
curl -k -L -o spark-3.0.0.tgz https://archive.apache.org/dist/spark/spark-3.0.0/spark-3.0.0-bin-hadoop2.7.tgz && tar xzvf spark-3.0.0.tgz
29+
curl -k -L -o spark-3.0.1.tgz https://archive.apache.org/dist/spark/spark-3.0.1/spark-3.0.1-bin-hadoop2.7.tgz && tar xzvf spark-3.0.1.tgz
2830

2931
endlocal

src/scala/microsoft-spark-2.4.x/src/main/scala/org/apache/spark/deploy/dotnet/DotnetRunner.scala

+1 -1
Original file line number | Diff line number | Diff line change
@@ -35,7 +35,7 @@ import scala.util.Try
3535
object DotnetRunner extends Logging {
3636
private val DEBUG_PORT = 5567
3737
private val supportedSparkVersions =
38-
Set[String]("2.4.0", "2.4.1", "2.4.3", "2.4.4", "2.4.5", "2.4.6")
38+
Set[String]("2.4.0", "2.4.1", "2.4.3", "2.4.4", "2.4.5", "2.4.6", "2.4.7")
3939

4040
val SPARK_VERSION = DotnetUtils.normalizeSparkVersion(spark.SPARK_VERSION)
4141

src/scala/microsoft-spark-3.0.x/src/main/scala/org/apache/spark/deploy/dotnet/DotnetRunner.scala

+1 -1
Original file line number | Diff line number | Diff line change
@@ -34,7 +34,7 @@ import scala.util.Try
3434
*/
3535
object DotnetRunner extends Logging {
3636
private val DEBUG_PORT = 5567
37-
private val supportedSparkVersions = Set[String]("3.0.0")
37+
private val supportedSparkVersions = Set[String]("3.0.0", "3.0.1")
3838

3939
val SPARK_VERSION = DotnetUtils.normalizeSparkVersion(spark.SPARK_VERSION)
4040

0 commit comments

Comments
 (0)