ValueError: `labels.shape` должен быть равен `logits.shape`, за исключением последнего измерения. Получено: labels.shape

ValueError: `labels.shape` должен быть равен `logits.shape`, за исключением последнего измерения. Получено: labels.shape ⇐ Python

1 сообщение • Страница 1 из 1

Anonymous

ValueError: `labels.shape` должен быть равен `logits.shape`, за исключением последнего измерения. Получено: labels.shape

Цитата

Сообщение Anonymous » 15 июл 2024, 23:18

Я столкнулся с ошибкой несоответствия формы во время обучения сверточной нейронной сети (CNN) с использованием TensorFlow и Keras.
Я использую специальную архитектуру LeNet-5, определенную следующим образом:

Код: Выделить всё

import tensorflow as tf
from keras import layers, models

def create_lenet5(input_shape, num_classes):
model = models.Sequential([
layers.Conv2D(6, kernel_size=(5, 5), strides=(1, 1), activation='relu', input_shape=input_shape),
layers.MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),
layers.Conv2D(16, kernel_size=(5, 5), strides=(1, 1), activation='relu'),
layers.MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),
layers.Flatten(),
layers.Dense(120, activation='relu'),
layers.Dense(84, activation='relu'),
layers.Dense(num_classes, activation='softmax')
])
return model

В сообщении об ошибке указано, что метки имеют форму (240), что означает, что передается 240 меток вместо меньшего размера пакета.
Логиты (прогнозы) из модели) имеют форму (16, 14), что указывает на то, что модель выводит прогнозы для пакета размером 16 и 14 классов.
скрипт data_preprocessing:

Код: Выделить всё

import os
import cv2
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
import re

class DataPreprocessor:
def __init__(self, image_dir, annotation_file, target_size=(256, 256)):
self.image_dir = image_dir
self.annotation_file = annotation_file
self.target_size = target_size

# Load annotations
print("Loading annotations...")
self.annotations = pd.read_csv(annotation_file, encoding='utf-8')
print(f"Loaded {len(self.annotations)} annotations.")

def load_and_preprocess_image(self, file_path):
image = cv2.imread(file_path, cv2.IMREAD_GRAYSCALE)
if image is None:
print(f"Failed to load image: {file_path}")
return None
image = cv2.resize(image, self.target_size)
return image.astype(np.float32) / 255.0  # Normalize to [0, 1]

def batch_generator(self, X, y, batch_size):
num_samples = len(X)
while True:
indices = np.arange(num_samples)
np.random.shuffle(indices)
for start in range(0, num_samples, batch_size):
batch_indices = indices[start:start + batch_size]
batch_images = []
batch_labels = []

for idx in batch_indices:
image_path = X[idx]

if os.path.exists(image_path):
image = self.load_and_preprocess_image(image_path)
if image is not None:
batch_images.append(image)
label = self.process_labels(y[idx])
batch_labels.append(label)
else:
print(f"Processed image is None for: {image_path}")
else:
print(f"Image not found for: {image_path}.  Skipping...")

if batch_images and batch_labels:
batch_images = np.array(batch_images)  # Shape: (batch_size, 256, 256)
batch_labels = np.array(batch_labels)  # Shape: (batch_size, num_classes)

# Ensure correct shapes
if batch_images.ndim == 3:
batch_images = np.expand_dims(batch_images, axis=-1)  # Shape: (batch_size, 256, 256, 1)

# Ensure batch_labels are 2D
if batch_labels.ndim == 1:
batch_labels = np.expand_dims(batch_labels, axis=0)  # Shape: (1, num_classes)

if batch_labels.ndim == 2 and batch_labels.shape[0] == 1:
batch_labels = np.repeat(batch_labels, len(batch_images), axis=0)

print(f"Yielding batch: images shape {batch_images.shape}, labels shape {batch_labels.shape}")  # Debug output

if batch_images.shape[0] == batch_labels.shape[0]:  # Ensure batch sizes match
yield batch_images, batch_labels
else:
print(f"Warning: Batch size mismatch - images: {batch_images.shape[0]}, labels: {batch_labels.shape[0]}")
else:
print("Warning: Empty batch detected, skipping this batch...")

def load_dataset_paths_and_labels(self):
print("Loading dataset paths and labels...")
image_paths = []
labels = []
total_images = len(self.annotations)

for i in range(total_images):
image_name = self.annotations.iloc[i]['Image Index']
image_path = os.path.join(self.image_dir, image_name)
if os.path.exists(image_path):
image_paths.append(image_path)
labels.append(self.annotations.iloc[i]['Finding Labels'])  # Store as is
else:
print(f"Image not found for {image_name}. Skipping...")

# Print progress every 100 images
if (i + 1) % 100 == 0 or (i + 1) == total_images:
print(f"Loaded {i + 1}/{total_images} images and labels.")

return image_paths, labels

def process_labels(self, labels_str):
if isinstance(labels_str, bytes):
labels_str = labels_str.decode('utf-8')

label_list = re.split(r'\||,', labels_str)
label_dict = {
'Atelectasis': 0,
'Cardiomegaly': 1,
'Effusion': 2,
'Infiltration': 3,
'Mass': 4,
'Nodule': 5,
'Pneumonia': 6,
'Pneumothorax': 7,
'Consolidation': 8,
'Edema': 9,
'Emphysema': 10,
'Fibrosis': 11,
'Pleural_Thickening': 12,
'Hernia': 13,
'No Finding': 14
}

# Initialize an array for the one-hot encoded labels
label_array = np.zeros((len(label_dict),), dtype=np.int32)

# Process the labels
for label in label_list:
label = label.strip()
if label in label_dict:
label_array[label_dict[label]] = 1  # One-hot encoding

return label_array

def split_data(self, images, labels, test_size=0.3):
print("Splitting data...")
X_train, X_temp, y_train, y_temp = train_test_split(images, labels, test_size=test_size, random_state=42)
X_val, X_test, y_val, y_test = train_test_split(X_temp, y_temp, test_size=0.5, random_state=42)
print(f"Data split complete: {len(X_train)} training samples, {len(X_val)} validation samples, {len(X_test)} test samples.")
return X_train, X_val, X_test, y_train, y_val, y_test`

train:

Код: Выделить всё

import os
import tensorflow as tf
from utils.config import Config
from data_preprocessing import DataPreprocessor
from models.classification_model import create_lenet5

def main():
# Initialize DataPreprocessor
preprocessor = DataPreprocessor(Config.IMAGE_DIR, Config.ANNOTATION_FILE)

if preprocessor.annotations is None or preprocessor.annotations.empty:
print("Error: Annotations not loaded or empty.  Exiting...")
return

# Load dataset paths and labels
image_paths, labels = preprocessor.load_dataset_paths_and_labels()
X_train, X_val, X_test, y_train, y_val, y_test = preprocessor.split_data(image_paths, labels, test_size=0.3)
print(f"Data split complete: {len(X_train)} training samples, {len(X_val)} validation samples, {len(X_test)} test samples.")

# Create LeNet-5 model
model = create_lenet5(input_shape=preprocessor.target_size + (1,), num_classes=Config.NUM_CLASSES)

# Compile the model
model.compile(optimizer=tf.keras.optimizers.Adam(),
loss=tf.keras.losses.SparseCategoricalCrossentropy(),
metrics=[tf.keras.metrics.SparseCategoricalAccuracy()])

# Define callbacks (optional)
checkpoint_callback = tf.keras.callbacks.ModelCheckpoint(filepath='models/best_model.keras', save_best_only=True)
early_stopping_callback = tf.keras.callbacks.EarlyStopping(patience=10, restore_best_weights=True)

# Train the model using generators
train_generator = preprocessor.batch_generator(X_train, y_train, batch_size=Config.BATCH_SIZE)

# Training loop
for epoch in range(Config.EPOCHS):
print(f"Epoch {epoch + 1}/{Config.EPOCHS}")
epoch_loss = 0
epoch_accuracy = 0
steps = 0

# Debug: Check if the generator is yielding batches
try:
for batch_images, batch_labels in train_generator:
if batch_images is None or batch_labels is None:
print("Received None for batch_images or batch_labels. Skipping...")
continue

steps += 1
print(f"Training on batch: images shape {batch_images.shape}, labels shape {batch_labels.shape}")

# Train on the current batch
history = model.train_on_batch(batch_images, batch_labels)

epoch_loss += history[0]
epoch_accuracy += history[1]

print(f"Step {steps}: Loss = {history[0]}, Accuracy = {history[1]}")

# Optionally, break after a few steps for testing
if steps >= 10:  # Adjust this to control how many steps you want to test
break

except Exception as e:
print(f"Error during training: {e}")
break

avg_loss = epoch_loss / steps if steps > 0 else 0
avg_accuracy = epoch_accuracy / steps if steps > 0 else 0
print(f"Epoch {epoch + 1} completed: Avg Loss = {avg_loss}, Avg Accuracy = {avg_accuracy}")

# Save the final model
model.save('models/final_model.keras')

if __name__ == "__main__":
main()

Я создал пакетный генератор для пакетной обработки изображений и меток. Я включил операторы печати для отладки и проверки формы изображений и меток перед передачей их в модель.
Я использовал метод train_on_batch для обучения модели пакетами из генератора. Перед каждым этапом обучения я проверял, совпадают ли формы Batch_images и Batch_labels.

Подробнее здесь: https://stackoverflow.com/questions/787 ... st-dimensi

1721074734

Anonymous

Я столкнулся с ошибкой несоответствия формы во время обучения сверточной нейронной сети (CNN) с использованием TensorFlow и Keras.
Я использую специальную архитектуру LeNet-5, определенную следующим образом: 
[code]import tensorflow as tf
from keras import layers, models

def create_lenet5(input_shape, num_classes):
model = models.Sequential([
layers.Conv2D(6, kernel_size=(5, 5), strides=(1, 1), activation='relu', input_shape=input_shape),
layers.MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),
layers.Conv2D(16, kernel_size=(5, 5), strides=(1, 1), activation='relu'),
layers.MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),
layers.Flatten(),
layers.Dense(120, activation='relu'),
layers.Dense(84, activation='relu'),
layers.Dense(num_classes, activation='softmax')
])
return model
[/code]
В сообщении об ошибке указано, что метки имеют форму (240), что означает, что передается 240 меток вместо меньшего размера пакета.
Логиты (прогнозы) из модели) имеют форму (16, 14), что указывает на то, что модель выводит прогнозы для пакета размером 16 и 14 классов.
скрипт data_preprocessing:
[code]import os
import cv2
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
import re

class DataPreprocessor:
def __init__(self, image_dir, annotation_file, target_size=(256, 256)):
self.image_dir = image_dir
self.annotation_file = annotation_file
self.target_size = target_size

# Load annotations
print("Loading annotations...")
self.annotations = pd.read_csv(annotation_file, encoding='utf-8')
print(f"Loaded {len(self.annotations)} annotations.")

def load_and_preprocess_image(self, file_path):
image = cv2.imread(file_path, cv2.IMREAD_GRAYSCALE)
if image is None:
print(f"Failed to load image: {file_path}")
return None
image = cv2.resize(image, self.target_size)
return image.astype(np.float32) / 255.0  # Normalize to [0, 1]

def batch_generator(self, X, y, batch_size):
num_samples = len(X)
while True:
indices = np.arange(num_samples)
np.random.shuffle(indices)
for start in range(0, num_samples, batch_size):
batch_indices = indices[start:start + batch_size]
batch_images = []
batch_labels = []

for idx in batch_indices:
image_path = X[idx]

if os.path.exists(image_path):
image = self.load_and_preprocess_image(image_path)
if image is not None:
batch_images.append(image)
label = self.process_labels(y[idx])
batch_labels.append(label)
else:
print(f"Processed image is None for: {image_path}")
else:
print(f"Image not found for: {image_path}.  Skipping...")

if batch_images and batch_labels:
batch_images = np.array(batch_images)  # Shape: (batch_size, 256, 256)
batch_labels = np.array(batch_labels)  # Shape: (batch_size, num_classes)

# Ensure correct shapes
if batch_images.ndim == 3:
batch_images = np.expand_dims(batch_images, axis=-1)  # Shape: (batch_size, 256, 256, 1)

# Ensure batch_labels are 2D
if batch_labels.ndim == 1:
batch_labels = np.expand_dims(batch_labels, axis=0)  # Shape: (1, num_classes)

if batch_labels.ndim == 2 and batch_labels.shape[0] == 1:
batch_labels = np.repeat(batch_labels, len(batch_images), axis=0)

print(f"Yielding batch: images shape {batch_images.shape}, labels shape {batch_labels.shape}")  # Debug output

if batch_images.shape[0] == batch_labels.shape[0]:  # Ensure batch sizes match
yield batch_images, batch_labels
else:
print(f"Warning: Batch size mismatch - images: {batch_images.shape[0]}, labels: {batch_labels.shape[0]}")
else:
print("Warning: Empty batch detected, skipping this batch...")

def load_dataset_paths_and_labels(self):
print("Loading dataset paths and labels...")
image_paths = []
labels = []
total_images = len(self.annotations)

for i in range(total_images):
image_name = self.annotations.iloc[i]['Image Index']
image_path = os.path.join(self.image_dir, image_name)
if os.path.exists(image_path):
image_paths.append(image_path)
labels.append(self.annotations.iloc[i]['Finding Labels'])  # Store as is
else:
print(f"Image not found for {image_name}. Skipping...")

# Print progress every 100 images
if (i + 1) % 100 == 0 or (i + 1) == total_images:
print(f"Loaded {i + 1}/{total_images} images and labels.")

return image_paths, labels

def process_labels(self, labels_str):
if isinstance(labels_str, bytes):
labels_str = labels_str.decode('utf-8')

label_list = re.split(r'\||,', labels_str)
label_dict = {
'Atelectasis': 0,
'Cardiomegaly': 1,
'Effusion': 2,
'Infiltration': 3,
'Mass': 4,
'Nodule': 5,
'Pneumonia': 6,
'Pneumothorax': 7,
'Consolidation': 8,
'Edema': 9,
'Emphysema': 10,
'Fibrosis': 11,
'Pleural_Thickening': 12,
'Hernia': 13,
'No Finding': 14
}

# Initialize an array for the one-hot encoded labels
label_array = np.zeros((len(label_dict),), dtype=np.int32)

# Process the labels
for label in label_list:
label = label.strip()
if label in label_dict:
label_array[label_dict[label]] = 1  # One-hot encoding

return label_array

def split_data(self, images, labels, test_size=0.3):
print("Splitting data...")
X_train, X_temp, y_train, y_temp = train_test_split(images, labels, test_size=test_size, random_state=42)
X_val, X_test, y_val, y_test = train_test_split(X_temp, y_temp, test_size=0.5, random_state=42)
print(f"Data split complete: {len(X_train)} training samples, {len(X_val)} validation samples, {len(X_test)} test samples.")
return X_train, X_val, X_test, y_train, y_val, y_test`
[/code]
train:
[code]import os
import tensorflow as tf
from utils.config import Config
from data_preprocessing import DataPreprocessor
from models.classification_model import create_lenet5

def main():
# Initialize DataPreprocessor
preprocessor = DataPreprocessor(Config.IMAGE_DIR, Config.ANNOTATION_FILE)

if preprocessor.annotations is None or preprocessor.annotations.empty:
print("Error: Annotations not loaded or empty.  Exiting...")
return

# Load dataset paths and labels
image_paths, labels = preprocessor.load_dataset_paths_and_labels()
X_train, X_val, X_test, y_train, y_val, y_test = preprocessor.split_data(image_paths, labels, test_size=0.3)
print(f"Data split complete: {len(X_train)} training samples, {len(X_val)} validation samples, {len(X_test)} test samples.")

# Create LeNet-5 model
model = create_lenet5(input_shape=preprocessor.target_size + (1,), num_classes=Config.NUM_CLASSES)

# Compile the model
model.compile(optimizer=tf.keras.optimizers.Adam(),
loss=tf.keras.losses.SparseCategoricalCrossentropy(),
metrics=[tf.keras.metrics.SparseCategoricalAccuracy()])

# Define callbacks (optional)
checkpoint_callback = tf.keras.callbacks.ModelCheckpoint(filepath='models/best_model.keras', save_best_only=True)
early_stopping_callback = tf.keras.callbacks.EarlyStopping(patience=10, restore_best_weights=True)

# Train the model using generators
train_generator = preprocessor.batch_generator(X_train, y_train, batch_size=Config.BATCH_SIZE)

# Training loop
for epoch in range(Config.EPOCHS):
print(f"Epoch {epoch + 1}/{Config.EPOCHS}")
epoch_loss = 0
epoch_accuracy = 0
steps = 0

# Debug: Check if the generator is yielding batches
try:
for batch_images, batch_labels in train_generator:
if batch_images is None or batch_labels is None:
print("Received None for batch_images or batch_labels. Skipping...")
continue

steps += 1
print(f"Training on batch: images shape {batch_images.shape}, labels shape {batch_labels.shape}")

# Train on the current batch
history = model.train_on_batch(batch_images, batch_labels)

epoch_loss += history[0]
epoch_accuracy += history[1]

print(f"Step {steps}: Loss = {history[0]}, Accuracy = {history[1]}")

# Optionally, break after a few steps for testing
if steps >= 10:  # Adjust this to control how many steps you want to test
break

except Exception as e:
print(f"Error during training: {e}")
break

avg_loss = epoch_loss / steps if steps > 0 else 0
avg_accuracy = epoch_accuracy / steps if steps > 0 else 0
print(f"Epoch {epoch + 1} completed: Avg Loss = {avg_loss}, Avg Accuracy = {avg_accuracy}")

# Save the final model
model.save('models/final_model.keras')

if __name__ == "__main__":
main()
[/code]
Я создал пакетный генератор для пакетной обработки изображений и меток. Я включил операторы печати для отладки и проверки формы изображений и меток перед передачей их в модель.
Я использовал метод train_on_batch для обучения модели пакетами из генератора. Перед каждым этапом обучения я проверял, совпадают ли формы Batch_images и Batch_labels. 

Подробнее здесь: [url]https://stackoverflow.com/questions/78751134/valueerror-labels-shape-must-equal-logits-shape-except-for-the-last-dimensi[/url]

Ответить Пред. тема След. тема

1 сообщение • Страница 1 из 1

Быстрый ответ

Заголовок:

Имя пользователя:

Изменение регистра текста:

Смайлики

Ещё смайлики…

К этому ответу прикреплено по крайней мере одно вложение.

Если вы не хотите добавлять вложения, оставьте поля пустыми. Можно прикреплять файлы, перетаскивая их в окно сообщения.

Максимально разрешённый размер вложения: 15 МБ.

Имя файла:

Комментарий к файлу:

Имя файла	Комментарий к файлу	Размер	Статус

Похожие темы

Ответы

Просмотры

Последнее сообщение

InvalidargumentError: должен иметь updates.shape = indicse.shape + params.shape [1:] или обновления.shape = [] в TF-Agen

Последнее сообщение Anonymous « 14 авг 2025, 17:56
Добавлено в форуме Python

Anonymous » 14 авг 2025, 17:56 » в форуме Python

У меня есть проблема с этим простым кодом.
Я ищу код воспродажа, совместим с графическими операциями и функциями TF.

import tensorflow as tf
import numpy as np
!pip install tf_agents
import tf_agents

from tf_agents.replay_buffers import...

0 Ответы

2 Просмотры

Последнее сообщение Anonymous
14 авг 2025, 17:56
Проблема в моем коде из-за tf.shape и Tensor.shape. `tf.shape` и `Tensor.shape`, оба не работают

Последнее сообщение Anonymous « 04 янв 2024, 19:57
Добавлено в форуме Python

Anonymous » 04 янв 2024, 19:57 » в форуме Python

Я написал конвейер обнаружения объектов DETR с нуля в Tensorflow.
DETR: Ссылка на Kaggle Notebook: содержит весь код; Создайте собственную копию блокнота, чтобы воспроизвести проблему

DETR: ссылка на Github

Я протестировал все отдельные...

0 Ответы

63 Просмотры

Последнее сообщение Anonymous
04 янв 2024, 19:57
ValueError: аргументы «target» и «output» должны иметь одинаковую форму. Получено: target.shape=(Нет, 512), output.shape

Последнее сообщение Anonymous « 13 май 2024, 10:32
Добавлено в форуме Python

Anonymous » 13 май 2024, 10:32 » в форуме Python

Я пытался обучить модель bert для решения проблемы мультиклассификации:

Я получил эту ошибку при запуске кода ниже

Целевой и выходной аргументы должны иметь одинаковую форму. Получено: target.shape=(Нет, 512), output.shape=(Нет, 3)

import...

0 Ответы

180 Просмотры

Последнее сообщение Anonymous
13 май 2024, 10:32
Аргументы `target` и` output 'должны иметь одинаковый ранг (ndim). Получено: target.shape = (none,), output.shape = (нет

Последнее сообщение Anonymous « 14 апр 2025, 00:09
Добавлено в форуме Python

Anonymous » 14 апр 2025, 00:09 » в форуме Python

Я пытался создать нейронную сеть, которая может идентифицировать изображения, но когда я иду и пытаюсь подготовить свою модель, я получаю следующую ошибку:
ValueError Traceback (most recent call last)
in ()
1 # Train the model
----> 2 history =...

0 Ответы

28 Просмотры

Последнее сообщение Anonymous
14 апр 2025, 00:09
Ошибка: метод add(Shape) в типе ArrayList неприменим для аргументов (Shape.Rectangle).

Последнее сообщение Anonymous « 27 апр 2024, 23:05
Добавлено в форуме JAVA

Anonymous » 27 апр 2024, 23:05 » в форуме JAVA

Я пытаюсь добавить новую фигуру в ArrayList, но получаю сообщение об ошибке: Метод add(Shape) в типе ArrayList неприменим для аргументов (Shape.Rectangle)
Shape.Rectangle — это созданный мной собственный класс. Аргументами для него являются...

0 Ответы

54 Просмотры

Последнее сообщение Anonymous
27 апр 2024, 23:05

Вернуться в «Python»