From 73ae9b135b188b1f5b3c9bf52b1679a42e3a4c3b Mon Sep 17 00:00:00 2001
From: fly6516
Date: Tue, 22 Apr 2025 13:39:30 +0800
Subject: [PATCH] =?UTF-8?q?fix:=20=E8=AE=BE=E7=BD=AE=20PySpark=20=E7=9A=84?=
 =?UTF-8?q?=20Python=E7=8E=AF=E5=A2=83=E5=8F=98=E9=87=8F?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- 添加 PYSPARK_PYTHON 和 PYSPARK_DRIVER_PYTHON 环境变量设置
- 指定 Python 3.6 作为 PySpark 的 Python 版本
---
 data_prepare.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/data_prepare.py b/data_prepare.py
index be45763..5c44f82 100644
--- a/data_prepare.py
+++ b/data_prepare.py
@@ -3,6 +3,8 @@ import os
 
 # Set Java environment variable
 os.environ['JAVA_HOME'] = '/opt/module/jdk1.8.0_171'
+os.environ["PYSPARK_PYTHON"]="/usr/local/bin/python3.6"
+os.environ["PYSPARK_DRIVER_PYTHON"]="/usr/local/bin/python3.6"
 
 # Parse ratings data into (userID, movieID, rating)
 def get_ratings_tuple(entry):