We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 48c8b66, commit 7969010 (Copy full SHA for 7969010)
scripts/spark/setup/load_data_to_hdfs.py
@@ -70,13 +70,14 @@ def get_schema(self):
70
return self.parse_schema_file()
71
72
def transfer_data(self):
73
+ spinner = Halo(text=f"Reading and writing data from /data/output.csv to {self.hdfs_path}")
74
+ spinner.start()
75
try:
76
self.start_spark_session()
77
schema = self.get_schema()
78
79
logging.info(f"Reading and writing data from /data/output.csv to {self.hdfs_path}")
- spinner = Halo(text=f"Reading and writing data from /data/output.csv to {self.hdfs_path}")
- spinner.start()
80
+
81
df = (self.spark.read.option("header", "true")
82
.option("mode", "DROPMALFORMED")
83
.option("overwrite", "true")
0 commit comments