in scala-spark-sdk/src/main/scala/software/amazon/sagemaker/featurestore/sparksdk/helpers/DataFrameRepartitioner.scala [25:36]
/** Determines the parallelism to use for the given DataFrame.
  *
  * An explicitly configured `spark.default.parallelism` takes precedence; when that key is
  * not set, the Spark context's `defaultParallelism` is returned instead.
  *
  * @param inputDataFrame DataFrame whose Spark session supplies the configuration and context
  * @return the configured parallelism if the key is set, otherwise the context's default
  * @throws NumberFormatException if `spark.default.parallelism` is set to a non-integer value
  */
def getParallelism(inputDataFrame: DataFrame): Int = {
  val sparkContext = inputDataFrame.sparkSession.sparkContext
  // Honor the customer's configuration when present. getOption yields None for a missing
  // key, so no null sentinel is needed, and the context default is only read on fallback.
  sparkContext.getConf
    .getOption("spark.default.parallelism")
    .map(_.toInt)
    .getOrElse(sparkContext.defaultParallelism)
}