# Binary files
# Load the JPEG files found under `path` into a DataFrame using Spark's
# "binaryFile" data source, then print a preview of the result.
# NOTE: `spark` is expected to be an already-available SparkSession
# (e.g. the one a notebook environment provides); it is not created here.
path = "your_file_path"  # e.g. "/databricks-datasets/learning-spark/cctvVideos/train_images/"
binary_files_df = spark.read.load(
    path,
    format="binaryFile",
    pathGlobFilter="*.jpg",  # only pick up files whose name matches *.jpg
)
binary_files_df.show()
# Same read as above, but with recursiveFileLookup enabled so that Spark
# ignores partition data discovery in the directory.
# The option value is passed as the string "true", as Spark reader options are.
binary_files_df = spark.read.load(
    path,
    format="binaryFile",
    pathGlobFilter="*.jpg",
    recursiveFileLookup="true",
)
binary_files_df.show()