diff --git a/5-1.py b/5-1.py
index 2c76a21..ee8ef5f 100644
--- a/5-1.py
+++ b/5-1.py
@@ -158,12 +158,12 @@ print(similaritiesFullRDD.count())
 print("Number of similarity records: {}".format(similaritiesFullRDD.count()))
 
 # 计算并测试相似度
-similarity_test = similarities_full_rdd.filter(lambda x: x[0][0] == 'b00005lzly' and x[0][
+similarity_test = similaritiesFullRDD.filter(lambda x: x[0][0] == 'b00005lzly' and x[0][
     1] == 'http://www.google.com/base/feeds/snippets/13823221823254120257').collect()
 print(len(similarity_test))
 
 # 测试
 assert len(similarity_test) == 1, "incorrect len(similarity_test)"
-assert similarities_full_rdd.count() == 2441088, "incorrect similarities_full_rdd.count()"
+assert similaritiesFullRDD.count() == 2441088, "incorrect similaritiesFullRDD.count()"
 
 sc.stop()