import pandas as pd
d = {
'Image Index':
['00000013_005.jpeg', '00000013_026.jpeg',
'00000017_001.jpeg', '00000042_002.jpg',
'00000084_000.jpg', '00000099_003.jpg'],
'labels':
['Emphysima', 'Emphysima',
'No finding', 'No finding',
'Effusion', 'Effusion']}
df = pd.DataFrame(data=d)
df.head()
Image Index labels
0 00000013_005.jpeg Emphysima
1 00000013_026.jpeg Emphysima
2 00000017_001.jpeg No finding
3 00000042_002.jpg No finding
4 00000084_000.jpg Effusion
现在,根据你的需要,你可以试试这个
from pathlib import Path
from PIL import Image
# iterate over the unique label
for item_name in df.labels.unique():
# create folder according to the label name
item_folder = Path(f"{item_name}/")
item_folder.mkdir(parents=True, exist_ok=True)
# store id and gt for unique labels
id = []
gt = []
# iterate over all possible number of unique labels
for id_label in df.loc[df['labels'] == item_name].values.tolist():
# id_label :['image_id', 'label']
id.append(id_label[0]) # image_id
gt.append(id_label[1]) # label
img = Image.open(id_label[0]) # read the image
img.save(f'{item_folder}/{id_label[0]}') # and save to target folder
# save the individual ground truth
# to the concern directory
label = pd.DataFrame({
'Image Index': id,
'labels': gt
})
label.to_csv(f'{item_folder}/{item_folder}.csv', index=False)
如果我理解您的要求,您可以按以下方式之一进行:
数据
现在,根据你的需要,你可以试试这个
它将按
labels
名称创建一个目录,并将相应的映像保存到此目录,并仅使用它们的标签创建一个新的data frame
相关问题 更多 >
编程相关推荐