@Zifah
Created February 9, 2019 21:26
Write data directly to an Azure blob storage container from an Azure Databricks notebook
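The script below assumes a few variables are defined earlier in the notebook: storage_name, sas_key, output_container_name and dataframe. A minimal, hypothetical setup (placeholder names and values, not part of the original gist) might look like this:

# Hypothetical setup assumed by the script below (placeholder values only)
storage_name = "mystorageaccount"      # Azure storage account name (hypothetical)
sas_key = dbutils.secrets.get(scope="my-scope", key="storage-key")  # account key or SAS token, ideally from a secret scope (hypothetical scope/key names)
output_container_name = "output"       # target blob container (hypothetical)
dataframe = spark.read.csv("/mnt/input/raw.csv", header=True)  # any Spark DataFrame to write out (hypothetical path)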
# Configure blob storage account access key globally
spark.conf.set(
    "fs.azure.account.key.%s.blob.core.windows.net" % storage_name,
    sas_key)

output_container_path = "wasbs://%s@%s.blob.core.windows.net" % (output_container_name, storage_name)
output_blob_folder = "%s/wrangled_data_folder" % output_container_path

# Write the dataframe as a single CSV file to blob storage
(dataframe
    .coalesce(1)
    .write
    .mode("overwrite")
    .option("header", "true")
    .format("com.databricks.spark.csv")
    .save(output_blob_folder))

# Get the name of the wrangled-data CSV file that was just saved to Azure blob storage (it starts with 'part-')
files = dbutils.fs.ls(output_blob_folder)
output_file = [x for x in files if x.name.startswith("part-")]

# Move the wrangled-data CSV file from a sub-folder (wrangled_data_folder) to the root of the blob container,
# renaming it in the process
dbutils.fs.mv(output_file[0].path, "%s/predict-transform-output.csv" % output_container_path)
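As a quick sanity check (not part of the original gist), the renamed file can be read straight back from the container root:

# Optional: read the renamed CSV back from the container root to confirm the move worked
check_df = spark.read.option("header", "true").csv("%s/predict-transform-output.csv" % output_container_path)
display(check_df.limit(5))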
@Sarvesh-CSE

This code creates a lot of temporary files, for instance _committed....., _started........... and _SUCCESS. How can I avoid this?

@Zifah (Author) commented Feb 21, 2020

I believe that was also the case when I ran the script myself. One thing I would suggest is to write an additional step that deletes the temporary files from the Azure blob container once the data frame has been written successfully. There should be a simple way to achieve that with another dbutils method.
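For example, a cleanup step along these lines could be added after the move (a sketch, not from the original gist; it reuses output_blob_folder from the script above):

# Sketch: once the part file has been moved out, delete the staging folder
# together with the _started_*, _committed_* and _SUCCESS marker files inside it
dbutils.fs.rm(output_blob_folder, True)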
