Spark 开发环境安装配置
https://downloads.lightbend.com/scala/2.11.12/scala-2.11.12.zip
https://www.scala-lang.org/download/all.html
https://www.python.org/ftp/python/3.8.6/python-3.8.6-amd64.exe
https://archive.apache.org/dist/spark/spark-2.4.6/
#########################################################################
# Submits the XXXXXToRedisSaddTask Spark job to YARN (cluster mode) for the
# day held in v_day, then exits with the accumulated job status.
#
# Run with bash: the script relies on `source`, `[[ ]]` and arrays.
# Inputs:  DAY_GEN script, which is expected to define v_day
#          (TODO confirm against day_gen.sh).
# Exit:    0 on success, spark-submit's status on failure, 1 when the day
#          value cannot be determined.
#########################################################################
JAR_PATH=/data1/XXXXX/jars/XXXXXToRedisTask_20221216.jar
DAY_GEN=/data1/XXXXXXX/day_gen.sh
export HADOOP_USER_NAME=XXXX
export SPARK_HOME=/usr/local/share/spark

echo "${JAR_PATH}"
echo "${DAY_GEN}"

# Fail fast instead of submitting a job with an empty --dayno value.
if [[ ! -r "${DAY_GEN}" ]]; then
  echo "cannot read day generator script: ${DAY_GEN}" >&2
  exit 1
fi
source "${DAY_GEN}"
if [[ -z "${v_day:-}" ]]; then
  echo "v_day is empty after sourcing ${DAY_GEN}" >&2
  exit 1
fi
echo "${v_day}"

v_job_stat=0

# Arguments are kept in an array so every value stays one word and each
# setting can carry its own comment.
spark_submit_args=(
  --class com.XXXXXToRedisSaddTask
  --queue xxxxxxxxx
  --master yarn
  --deploy-mode cluster
  --name XXXXXXXToRedisSaddTask
  --conf spark.serializer=org.apache.spark.serializer.KryoSerializer
  # NOTE(review): the Spark docs list spark.kryoserializer.buffer as the
  # current key; the ".mb" spelling looks like the legacy alias - confirm.
  --conf spark.kryoserializer.buffer.mb=256
  --conf spark.kryoserializer.buffer.max=1024
  --conf spark.sql.broadcastTimeout=6000
  # NOTE(review): the two memoryFraction keys below appear to be honoured
  # only in legacy memory mode on Spark 2.x - confirm they are still needed.
  --conf spark.storage.memoryFraction=0.6
  --conf spark.shuffle.memoryFraction=0.8
  --conf spark.default.parallelism=2000
  --conf spark.sql.shuffle.partitions=2000
  # NOTE(review): maxResultSize (88G) is larger than --driver-memory (20G)
  # - confirm this is intended.
  --conf spark.driver.maxResultSize=88G
  --conf spark.executor.memoryOverhead=4G
  --conf "spark.executor.extraJavaOptions=-XX:MaxDirectMemorySize=4096m"
  --conf spark.shuffle.registration.timeout=120000
  # Key name fixed: it was misspelled "maxAttempst", which is not the
  # documented property name.
  --conf spark.shuffle.registration.maxAttempts=10
  --conf spark.reducer.maxBlocksInFlightPerAddress=1000
  --conf spark.reducer.maxReqsInFlight=1000
  --conf spark.maxRemoteBlockSizeFetchToMem=512m
  --conf spark.shuffle.io.maxRetries=15
  --conf spark.shuffle.io.retryWait=6s
  --conf spark.yarn.maxAppAttempts=1
  --conf spark.shuffle.io.connectionTimeout=120000
  --conf spark.shuffle.service.index.cache.size=6144m
  # NOTE(review): executor memory overhead is set twice (4G above via
  # spark.executor.memoryOverhead, 6G here via the yarn-prefixed key) -
  # confirm which value is intended and drop the other.
  --conf spark.yarn.executor.memoryOverhead=6G
  --conf spark.dynamicAllocation.enabled=false
  --num-executors 50
  --driver-memory 20G
  --executor-memory 40G
  --executor-cores 20
)

"${SPARK_HOME}/bin/spark-submit" "${spark_submit_args[@]}" \
  "${JAR_PATH}" "--dayno=${v_day}"
# Must directly follow spark-submit so that $? is its exit status.
v_job_stat=$(( v_job_stat + $? ))

#########################################################################
# Return the job execution status code
#########################################################################
echo "v_job_stat = ${v_job_stat}"
exit "${v_job_stat}"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
人生在勤,不索何获,坚持自有收获
浙公网安备 33010602011771号