File tree 2 files changed +6
-4
lines changed
2 files changed +6
-4
lines changed Original file line number Diff line number Diff line change @@ -39,20 +39,21 @@ WORKDIR ${SPARK_HOME}
39
39
# Remember to also update `tests/conftest`'s spark setting
40
40
ENV SPARK_VERSION=3.5.4
41
41
ENV ICEBERG_SPARK_RUNTIME_VERSION=3.5_2.12
42
- ENV ICEBERG_VERSION=1.8.0
42
+ ENV ICEBERG_VERSION=1.7.2
43
43
ENV PYICEBERG_VERSION=0.9.0
44
44
45
+ ENV BASE_ARTIFACT_URL=https://repository.apache.org/content/repositories/orgapacheiceberg-1187
45
46
RUN curl --retry 5 -s -C - https://archive.apache.org/dist/spark/spark-${SPARK_VERSION}/spark-${SPARK_VERSION}-bin-hadoop3.tgz -o spark-${SPARK_VERSION}-bin-hadoop3.tgz \
46
47
&& tar xzf spark-${SPARK_VERSION}-bin-hadoop3.tgz --directory /opt/spark --strip-components 1 \
47
48
&& rm -rf spark-${SPARK_VERSION}-bin-hadoop3.tgz
48
49
49
50
# Download iceberg spark runtime
50
- RUN curl --retry 5 -s https://repo1.maven.org/maven2/org/apache/iceberg/iceberg-spark-runtime-${ICEBERG_SPARK_RUNTIME_VERSION}/${ICEBERG_VERSION}/iceberg-spark-runtime-${ICEBERG_SPARK_RUNTIME_VERSION}-${ICEBERG_VERSION}.jar \
51
+ RUN curl --retry 5 -s ${BASE_ARTIFACT_URL}/org/apache/iceberg/iceberg-spark-runtime-${ICEBERG_SPARK_RUNTIME_VERSION}/${ICEBERG_VERSION}/iceberg-spark-runtime-${ICEBERG_SPARK_RUNTIME_VERSION}-${ICEBERG_VERSION}.jar \
51
52
-Lo /opt/spark/jars/iceberg-spark-runtime-${ICEBERG_SPARK_RUNTIME_VERSION}-${ICEBERG_VERSION}.jar
52
53
53
54
54
55
# Download AWS bundle
55
- RUN curl --retry 5 -s https://repo1.maven.org/maven2/org/apache/iceberg/iceberg-aws-bundle/${ICEBERG_VERSION}/iceberg-aws-bundle-${ICEBERG_VERSION}.jar \
56
+ RUN curl --retry 5 -s ${BASE_ARTIFACT_URL}/org/apache/iceberg/iceberg-aws-bundle/${ICEBERG_VERSION}/iceberg-aws-bundle-${ICEBERG_VERSION}.jar \
56
57
-Lo /opt/spark/jars/iceberg-aws-bundle-${ICEBERG_VERSION}.jar
57
58
58
59
COPY spark-defaults.conf /opt/spark/conf
Original file line number Diff line number Diff line change @@ -2420,7 +2420,7 @@ def spark() -> "SparkSession":
2420
2420
# Remember to also update `dev/Dockerfile`
2421
2421
spark_version = ".".join(importlib.metadata.version("pyspark").split(".")[:2])
2422
2422
scala_version = "2.12"
2423
- iceberg_version = "1.8.0"
2423
+ iceberg_version = "1.7.2"
2424
2424
2425
2425
os.environ["PYSPARK_SUBMIT_ARGS"] = (
2426
2426
f"--packages org.apache.iceberg:iceberg-spark-runtime-{spark_version}_{scala_version}:{iceberg_version},"
@@ -2432,6 +2432,7 @@ def spark() -> "SparkSession":
2432
2432
2433
2433
spark = (
2434
2434
SparkSession.builder.appName("PyIceberg integration test")
2435
+ .config("spark.jars.repositories", "https://repository.apache.org/content/repositories/orgapacheiceberg-1187/")
2435
2436
.config("spark.sql.session.timeZone", "UTC")
2436
2437
.config("spark.sql.shuffle.partitions", "1")
2437
2438
.config("spark.default.parallelism", "1")
You can’t perform that action at this time.
0 commit comments