训练 CNN 时数据基数不明确

Question

我正在尝试训练 CNN 进行图像分类。当我要训练模型时，我遇到了一个问题，它说我的数据基数不明确。

我已经检查过图像和标签集的大小是否相同，所以我不确定为什么会这样。这是我的代码：

import numpy as np
import os, shutil
import tensorflow as tf
from PIL import Image
import matplotlib.pyplot as plt
import glob

dataset_path = '/Users/eliasbrasildesouza/Downloads/Male_and_Female_face_dataset'

male_faces = os.path.join(dataset_path, 'Male_Faces')
female_faces = os.path.join(dataset_path, 'Female_Faces')

batch_size = 32
img_height = 180
img_width = 180

plt.figure(figsize=(10, 10))


image_files = os.listdir(male_faces)

# Loop for displaying only the first 9 images
for i in range(9):
    img_path = os.path.join(male_faces, image_files[i])
    
    # Read the image using PIL and convert it to a NumPy array
    img_array = np.asarray(Image.open(img_path))
    
    ax = plt.subplot(3, 3, i+1)
    plt.imshow(img_array.astype("uint8"))
    plt.title(f"Male {i+1}")  # You can modify this title as needed
    plt.axis('off')

plt.show()

plt.figure(figsize=(10, 10))


image_files = os.listdir(female_faces)

# Loop for displaying only the first 9 images
for i in range(9):
    img_path = os.path.join(female_faces, image_files[i])
    
    # Read the image using PIL and convert it to a NumPy array
    img_array = np.asarray(Image.open(img_path))
    
    ax = plt.subplot(3, 3, i+1)
    plt.imshow(img_array.astype("uint8"))
    plt.title(f"female {i+1}")  # You can modify this title as needed
    plt.axis('off')

plt.show()

male_file_types = set()
female_file_types = set()

for img in os.listdir(male_faces):
    img_path = os.path.join(male_faces, img)
    file_extension = os.path.splitext(img_path)[1]
    
    if file_extension not in male_file_types:
        male_file_types.add(file_extension)

male_file_types

for img in os.listdir(female_faces):
    img_path = os.path.join(female_faces, img)
    file_extension = os.path.splitext(img_path)[1]
    
    if file_extension not in female_file_types:
        female_file_types.add(file_extension)
    
female_file_types

male_file_types

female_file_types

male_images = []
female_images = []
labels = []

for file in os.listdir(male_faces):
    file_path = os.path.join(male_faces, file)
    file = np.asarray(Image.open(file_path))
    male_images.append(file)
    labels.append('male')   
        
for file in os.listdir(female_faces):
    file_path = os.path.join(female_faces, file)
    file = np.asarray(Image.open(file_path))
    female_images.append(file)
    labels.append('female')

len(male_images)

len(female_images)

X = male_images + female_images
y = labels

len(X)

len(y)

from sklearn.model_selection import train_test_split

print(y[0])

one_hot_labels = np.array([[1, 0] if label == 'female' else [0, 1] for label in y])

print(one_hot_labels)

y = one_hot_labels

for i in range(5):
    print(X[i].shape)

import cv2

X_resized = []

for array in X:
    X_resize = cv2.resize(array, (200, 200), interpolation=cv2.INTER_AREA)
    X_resized.append(X_resize)
        

X = X_resized

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

X_train, X_val, y_train, y_val = train_test_split(X_train, y_train, test_size=0.25, random_state=1)

model = tf.keras.Sequential([
    tf.keras.layers.InputLayer(input_shape=(200, 200, 3)),
    tf.keras.layers.Conv2D(32, kernel_size=(3, 3), activation='relu'),
    tf.keras.layers.MaxPooling2D(pool_size=(2, 2)),
    tf.keras.layers.Flatten(),
    tf.keras.layers.Dense(64, activation='relu'),
    tf.keras.layers.Dense(2, activation='softmax')
])

# Compile the model
model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# Train the model
history = model.fit(X_train, y_train, epochs=10, batch_size=32, validation_data=(X_val, y_val))

# Evaluate the model on the validation set
loss, accuracy = model.evaluate(X_val, y_val)
print(f'Validation accuracy: {accuracy}')

这里是使用的数据集：https://www.kaggle.com/datasets/ashwingupta3012/male-and-female-faces-dataset

Answer 1

错误是因为传递给

X_train

方法的

model.fit

的维度和数据类型不正确。

X_train 应该是形状为

(n,200,200,3)

的张量，y_train 应该是

(n,2)

。

是例子的数量。

将列表转换为张量使用 -

X_train = [tf.convert_to_tensor(img_array) for img_array in X_train]
X_train = tf.stack(X_train)

训练 CNN 时数据基数不明确

问题描述投票：0回答：1

1个回答

最新问题

训练 CNN 时数据基数不明确

问题描述 投票：0回答：1

1个回答

最新问题

问题描述投票：0回答：1