import daft


            
# Load a dataframe of file paths from the local images/ directory
# Listing the matched files as a dataframe makes it easy to browse the
# images in table form.
df = daft.from_glob_path("images/")

# Separate example: browse the videos stored in a WeChat folder by reading
# their frames. It is bound to its own name so that it does not replace the
# image dataframe `df` that the steps below operate on.
video_df = daft.read_video_frames(
    r"D:\installed\WeChat_Files\WeChat Files\***\FileStorage\Video\2023-06",
    image_height=480,
    image_width=640,
    is_key_frame=True,  # select only the key frames
)

# 1. Download column of image URLs as a column of bytes
# 2. Decode the column of bytes into a column of images
df = df.with_column("image", df["path"].url.download().image.decode())

# Resize each image into 32x32
df = df.with_column("resized", df["image"].image.resize(32, 32))

# Display up to 30 rows of the resulting dataframe.
df.show(30)

path Utf8	size Int64	num_rows Int64	image Image[MIXED]	resized Image[MIXED]
file://images/04f74b7e993e63e14585ba2910b3e621.jpg	28232	None
file://images/06be93e2f39d125b9613c52e30f6c869.png	1190735	None
file://images/0883060accc117cbbfd8e3fa5ac8cf76.jpg	20942	None
file://images/0ab7961a2a845ddb60a70d1c752daefd.png	6570	None
file://images/10f932613dfc7fc269383721a6582ecc.jpg	20610	None
...	...	...	...	...
file://images/97cbb121fcca528db938da5e45b8614a.png	21522	None
file://images/98510fd03b6e6f1ed8654c93d45b3865.png	30553	None
file://images/99052cb843dea940169f21645b94c07b.jpg	54497	None
file://images/9fd70385aa6d5e757795a4c9fb44308c.jpg	77239	None
file://images/a0927e56a04be9b8a17b977c01fba775.jpg	36374	None

Daft：简化多模态数据处理