Создайте объединение списка RDD
# Build the union of a list of RDDs.
# NOTE(review): `os`, `tempdir`, and `sc` are not defined in this snippet;
# presumably `sc` is an active SparkContext and `tempdir` is a writable
# directory -- confirm against the surrounding file.
path = os.path.join(tempdir, "union-text.txt")
# Write a one-line text file that backs the first RDD. The write must sit
# inside the `with` body so the handle is flushed and closed before it is read.
with open(path, "w") as testFile:
    _ = testFile.write("Hello")
textFile = sc.textFile(path)
textFile.collect()
# ['Hello']
parallelized = sc.parallelize(["World!"])
# sorted() puts the collected elements in a fixed order for comparison with
# the expected output shown below.
sorted(sc.union([textFile, parallelized]).collect())
# ['Hello', 'World!']
Ethercourt.ml