UnidentifiedImageError:无法识别图像文件

# Build Keras directory iterators for the PetImages data set.
# ImageDataGenerator is expected to be imported by the surrounding code
# (the import is not part of this snippet).
batch_size = 16

# Data augmentation and preprocess
train_datagen = ImageDataGenerator(
    rescale=1./255,
    shear_range=0.2,
    zoom_range=0.2,
    horizontal_flip=True,
    validation_split=0.20)  # set validation split

# Train dataset
train_generator = train_datagen.flow_from_directory(
    'PetImages/train',
    target_size=(244, 244),
    batch_size=batch_size,
    class_mode='binary',
    subset='training')  # set as training data

# Validation dataset (same directory and generator, other subset)
validation_generator = train_datagen.flow_from_directory(
    'PetImages/train',
    target_size=(244, 244),
    batch_size=batch_size,
    class_mode='binary',
    subset='validation')  # set as validation data

# The test images are only rescaled, not augmented.
test_datagen = ImageDataGenerator(rescale=1./255)

# Test dataset
# NOTE(review): this rebinds test_datagen from the generator to the directory
# iterator, and unlike the train/validation calls it passes no target_size,
# batch_size or class_mode -- confirm that the library defaults are intended.
test_datagen = test_datagen.flow_from_directory(
    'PetImages/test')

3条回答

网友

1楼 · 编辑于 2024-10-16 17:21:21

我以前遇到过这个问题。因此，我写了一个 Python 脚本，用来检查训练（train）和测试（test）目录中的图像文件是否有效。文件扩展名必须是 jpg、png、bmp 或 gif 之一，因此脚本首先检查扩展名是否正确；然后尝试使用 cv2 读取图像，如果无法读取为有效图像，该文件就会被判定为无效。在这两种情况下，都会打印出有问题的文件名。最后，名为 bad_list 的列表中保存了所有坏文件的路径。注意：子目录名称必须为“test”和“train”。

import os
import cv2
# Scan the 'train' and 'test' sub directories of data_dir, one class directory
# at a time, and collect every file that either has an unexpected extension or
# cannot be decoded by OpenCV. The offending paths end up in bad_list.
VALID_EXTENSIONS = ('jpg', 'png', 'bmp', 'gif')
bad_list = []
data_dir = r'c:\PetImages'  # root directory holding the train/test folders

for d in os.listdir(data_dir):  # sub directories of the root, ie train or test
    if d not in ('test', 'train'):
        continue
    dpath = os.path.join(data_dir, d)  # path to the train/test directory
    for klass in os.listdir(dpath):  # class directories, ie dog or cat
        class_path = os.path.join(dpath, klass)
        if not os.path.isdir(class_path):
            # A stray file next to the class directories would make
            # os.listdir() raise; it is not a class, so skip it.
            continue
        for f in os.listdir(class_path):  # files of one class
            fpath = os.path.join(class_path, f)
            # Text after the last period; the whole name when there is none.
            ext = f.rpartition('.')[2]
            # Compare case-insensitively so that e.g. 'JPG' is accepted.
            if ext.lower() not in VALID_EXTENSIONS:
                print(f'file {fpath}  has an invalid extension {ext}')
                bad_list.append(fpath)
                continue
            # cv2.imread() signals an unreadable file by returning None;
            # a decoder error raised by OpenCV is treated the same way.
            try:
                img = cv2.imread(fpath)
            except cv2.error:
                img = None
            if img is None:
                print(f'file {fpath} is not a valid image file ')
                bad_list.append(fpath)

print(bad_list)

网友

2楼 · 编辑于 2024-10-16 17:21:21

我不知道这是否仍然相关，但对于将来会遇到同样问题的人：

在此特定情况下，dog_cat数据集中有两个损坏的文件：

cats/666.jpg
dogs/11702.jpg

只要移除这两个文件，程序就能正常运行。

网友

3楼 · 编辑于 2024-10-16 17:21:21

可以尝试用下面这段脚本检查图像的格式是否正确

import os
from PIL import Image
# Walk every sub folder of folder_path, try to open and convert each file with
# PIL, and record which files fail as well as which file extensions occur
# among the readable images.
folder_path = r'data\img'  # raw string: '\i' is not a valid escape sequence
extensions = []  # distinct extensions (without the dot) of readable images
bad_files = []   # paths PIL could not open or decode

for fldr in os.listdir(folder_path):
    sub_folder_path = os.path.join(folder_path, fldr)
    if not os.path.isdir(sub_folder_path):
        # Plain files directly under folder_path are not class folders.
        continue
    for filee in os.listdir(sub_folder_path):
        file_path = os.path.join(sub_folder_path, filee)
        # Progress line, overwritten in place thanks to the carriage return.
        print('** Path: {}  **'.format(file_path), end="\r", flush=True)
        try:
            # The context manager closes the underlying file handle;
            # convert() forces the pixel data to be decoded.
            with Image.open(file_path) as im:
                im.convert('RGB')
        except OSError as err:
            # PIL.UnidentifiedImageError is an OSError subclass, so files PIL
            # cannot identify are caught here along with other read errors.
            # Report the file and keep scanning instead of aborting the run.
            print()
            print('invalid image {}: {}'.format(file_path, err))
            bad_files.append(file_path)
            continue
        # splitext() copes with names that have no dot or several dots.
        ext = os.path.splitext(filee)[1].lstrip('.')
        if ext and ext not in extensions:
            extensions.append(ext)

print()
print('extensions found: {}'.format(extensions))
print('invalid images: {}'.format(bad_files))

相关问题更多 >

编程相关推荐

热门问题

热门文章