isogram · June 2, 2020 07:33
diff --git a/create_empty_dataframe_pyspark.py b/create_empty_dataframe_pyspark.py
 from pyspark.sql.types import StringType, FloatType, StructField, StructType
 from pyspark.sql import SparkSession, SQLContext, Row
 import pyspark

 # Spark initialization.
 # Build the session through the class-level builder so enableHiveSupport()
 # is configured before any session exists. Instantiating
 # SparkSession(spark_context) first creates a plain session that
 # getOrCreate() may then simply hand back.
 spark_session = (
     SparkSession.builder
     .enableHiveSupport()
     .getOrCreate()
 )
 # Reuse the context owned by the session instead of creating one separately.
 spark_context = spark_session.sparkContext
 # Kept so existing code that refers to sqlContext keeps working.
 sqlContext = SQLContext(spark_context)

 # Schema of the empty DataFrame: three nullable columns.
 field = [
     StructField("FIELDNAME_1", StringType(), True),
     StructField("FIELDNAME_2", FloatType(), True),
     StructField("FIELDNAME_3", StringType(), True),
 ]
 schema = StructType(field)
 # An empty RDD combined with an explicit schema gives a DataFrame that has
 # the declared columns but no rows.
 df = spark_session.createDataFrame(spark_context.emptyRDD(), schema)

 df.printSchema()
	from pyspark.sql.types import StringType, FloatType, StructField, StructType
	from pyspark.sql import SparkSession, SQLContext, Row
	import pyspark

	# Spark initialization.
	# Build the session through the class-level builder so enableHiveSupport()
	# is configured before any session exists. Instantiating
	# SparkSession(spark_context) first creates a plain session that
	# getOrCreate() may then simply hand back.
	spark_session = (
	    SparkSession.builder
	    .enableHiveSupport()
	    .getOrCreate()
	)
	# Reuse the context owned by the session instead of creating one separately.
	spark_context = spark_session.sparkContext
	# Kept so existing code that refers to sqlContext keeps working.
	sqlContext = SQLContext(spark_context)

	# Schema of the empty DataFrame: three nullable columns.
	field = [
	    StructField("FIELDNAME_1", StringType(), True),
	    StructField("FIELDNAME_2", FloatType(), True),
	    StructField("FIELDNAME_3", StringType(), True),
	]
	schema = StructType(field)
	# An empty RDD combined with an explicit schema gives a DataFrame that has
	# the declared columns but no rows.
	df = spark_session.createDataFrame(spark_context.emptyRDD(), schema)

	df.printSchema()
No results found