Creates a streaming DataFrame with Structured Streaming and renames all of its columns
// Gets the schema from the CSV files
val crimesSchema = spark.read
  .option("inferSchema", true)
  .option("header", "true")
  .csv(dataPath)
  .schema

// Creates a Structured Stream over the CSV files
val crimes = spark.readStream
  .schema(crimesSchema)
  .csv(dataPath)

import spark.implicits._

// Map of (oldColumnName -> newColumnName)
val columnsToBottom = crimes.columns
  .map(col => (col, col.replace(" ", "_")))
  .toMap
// Rename the columns according to the columnsToBottom map
val renamedCrimes = columnsToBottom.foldLeft(crimes)((acc, pair) => acc.withColumnRenamed(pair._1, pair._2))
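
The renamed streaming DataFrame still needs a sink and a started query before anything actually runs. A minimal sketch, assuming the console sink is sufficient for inspecting the output (the sink, options, and variable name below are illustrative additions, not part of the original gist):

// Illustrative only: start a streaming query over the renamed DataFrame
// and print each micro-batch to the console.
val query = renamedCrimes.writeStream
  .format("console")
  .option("truncate", "false")
  .outputMode("append")
  .start()

// Block until the query is stopped or fails
query.awaitTermination()

As a design note, crimes.toDF(crimes.columns.map(_.replace(" ", "_")): _*) would rename every column in a single call; the foldLeft above keeps each rename explicit and works identically on batch and streaming DataFrames.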