def create_python_rdd(jrdd, serializer):
    """Build a Python ``RDD`` around an RDD handed over from Scala.

    Args:
        jrdd (org.apache.spark.api.java.JavaRDD): The RDD that came from Scala.
        serializer (:class:`~geopyspark.AvroSerializer` or pyspark.serializers.AutoBatchedSerializer(AvroSerializer)):
            An ``AvroSerializer`` instance, either bare or already wrapped in
            an ``AutoBatchedSerializer``.

    Returns:
        RDD: Constructed from ``jrdd``, the context returned by
        ``get_spark_context()``, and an ``AutoBatchedSerializer``.
    """
    # Resolve the context before looking at the serializer.
    pysc = get_spark_context()

    # A bare serializer gets wrapped; an already-batched one is used as given.
    batched = serializer
    if not isinstance(batched, AutoBatchedSerializer):
        batched = AutoBatchedSerializer(batched)

    return RDD(jrdd, pysc, batched)
评论列表
文章目录