From 80fb9d04dc95aa0307c9eb5f3998c8f24a47d78d Mon Sep 17 00:00:00 2001 From: Dongjoon Hyun Date: Thu, 13 Feb 2025 18:31:48 +0800 Subject: [PATCH] [SPARK-51200][BUILD] Add SparkR deprecation info to `README.md` and `make-distribution.sh` help ### What changes were proposed in this pull request? This PR aims to add `SparkR` deprecation info additionally to the following for developers. - `README.md` - `make-distribution.sh` help message ### Why are the changes needed? `SparkR` is deprecated properly by the following. - #47842 This PR adds a little more because `README.md` and `make-distribution.sh` are the starting point for downstream Spark distribution developers. ### Does this PR introduce _any_ user-facing change? No behavior change. Only the documentation and help message of developer script. ### How was this patch tested? Manual review. ``` $ dev/make-distribution.sh --help 2> /dev/null make-distribution.sh - tool for making binary distributions of Spark usage: make-distribution.sh [--name] [--tgz] [--pip] [--r] [--connect] [--mvn <mvn-command>] <maven build options> See Spark's "Building Spark" doc for correct Maven options. SparkR is deprecated from Apache Spark 4.0.0 and will be removed in a future version. ``` ### Was this patch authored or co-authored using generative AI tooling? No Closes #49931 from dongjoon-hyun/SPARK-51200. Authored-by: Dongjoon Hyun Signed-off-by: Kent Yao --- README.md | 2 +- dev/make-distribution.sh | 1 + 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 552b71215cb92..e0f97a4ca51cb 100644 --- a/README.md +++ b/README.md @@ -1,7 +1,7 @@ # Apache Spark Spark is a unified analytics engine for large-scale data processing. It provides -high-level APIs in Scala, Java, Python, and R, and an optimized engine that +high-level APIs in Scala, Java, Python, and R (Deprecated), and an optimized engine that supports general computation graphs for data analysis. 
It also supports a rich set of higher-level tools including Spark SQL for SQL and DataFrames, pandas API on Spark for pandas workloads, MLlib for machine learning, GraphX for graph processing, diff --git a/dev/make-distribution.sh b/dev/make-distribution.sh index 081e6a1b97116..0fe4d95a24802 100755 --- a/dev/make-distribution.sh +++ b/dev/make-distribution.sh @@ -47,6 +47,7 @@ function exit_with_usage { cl_options="[--name] [--tgz] [--pip] [--r] [--connect] [--mvn <mvn-command>]" echo "make-distribution.sh $cl_options <maven build options>" echo "See Spark's \"Building Spark\" doc for correct Maven options." + echo "SparkR is deprecated from Apache Spark 4.0.0 and will be removed in a future version." echo "" exit 1 }