Почему моя ИНС на C# не сходится, несмотря на настройку гиперпараметров? - Цифровое Кемерово

Почему моя ИНС на C# не сходится, несмотря на настройку гиперпараметров? ⇐ C#

Ответить Пред. тема След. тема

1 сообщение • Страница 1 из 1

Anonymous

Почему моя ИНС на C# не сходится, несмотря на настройку гиперпараметров?

Цитата

Сообщение Anonymous » 22 май 2024, 02:33

У меня есть ИНС, реализованная с нуля на C#. Однако не сходилось, в чем может быть проблема? Я пробовал разные функции активации, другой набор данных. Набор данных генерируется случайным образом, но ИНС в Python работает с тем же набором данных, поэтому можно обучить нейронную сеть данным.

Код: Выделить всё

private NeuralNetworkData ReLU(NeuralNetworkData x)
{
double[,] res = new double[x.Data.GetLength(0), x.Data.GetLength(1)];
for (int i = 0; i < res.Length; i++)
{
res[i, 0] = MathF.Max(0, (float)x.Data[i,0]);
}
return new NeuralNetworkData( res);
}
private NeuralNetworkData Softmax(NeuralNetworkData x)
{
double[,] res = new double[x.Data.GetLength(0), x.Data.GetLength(1)];
double max = x.ToVector().Max(x => x);
double[] exps = x.ToVector().Select(x => Math.Exp(x - max)).ToArray();
double sumExps = exps.Sum();

for (int i = 0; i < res.Length; i++)
{
res[i, 0] = exps[i] / sumExps;
}
return new NeuralNetworkData(res);
}
private NeuralNetworkData ReLUDerivative(NeuralNetworkData x)
{
double[,] res = new double[x.Data.GetLength(0), x.Data.GetLength(1)];
for (int i = 0; i < res.Length; i++)
{
res[i, 0] = x.Data[i, 0] > 0 ? 1 : 0;
}
return new NeuralNetworkData(res);
}
private void FeedForward(int index, int epoch)
{
if (epoch is 0 && index is 0)
{
Weights1 = Weights1.Transpose();
Weights2 = Weights2.Transpose();
}
Input = Scale(DataFile.Data[index].Values).ToMatrix();
Z1 = (Weights1 * Input) + Bias1;
Hidden = ReLU(Z1);
Z2 = (Weights2 * Hidden) + Bias2;
Output =  Softmax(Z2);

//Console.WriteLine($"N1: {Output[0]}, N2: {Output[1]}, N3: {Output[2]}");
}
private double Error(int index)
{
double localError = 0;
for (int i = 0; i < Output.Data.GetLength(0); i++)
{
localError -= (DataFile.Data[index].Label[i] * Math.Log(Output.Data[i, 0] + 1e-9));
}

return localError;
}
private NeuralNetworkData ElementWiseMultiply(NeuralNetworkData first, NeuralNetworkData second)
{
if (first.Data.GetLength(0) == second.Data.GetLength(0))
{
double[] res = new double[first.Data.GetLength(0)];
for (int i = 0; i < res.Length; i++)
{
res[i] = first.Data[i, 0] * second.Data[i, 0];
}
return res.ToMatrix();
}
else
{
throw new Exception("Two vectors are not the same length!");
}
}
private void Backpropagate(int index)
{
Delta2 = Output - DataFile.Data[index].Label.ToMatrix();
Output_Gradient = Delta2 * Hidden.Transpose();
Bias2_Gradient = Delta2;

Delta1 = ElementWiseMultiply(Weights2.Transpose() * Delta2 , ReLUDerivative(Z1));

Hidden_Gradient = Delta1 * Input.Transpose();
Bias1_Gradient = Delta1;

Weights2 = Weights2 - (LearningRate * Output_Gradient);
Bias2 = Bias2 - (LearningRate * Bias2_Gradient);

Weights1 = Weights1 - (LearningRate * Hidden_Gradient);
Bias1 = Bias1 - (LearningRate * Bias1_Gradient);
}
private double[] Scale(double[] data)
{
double[] res = new double[data.Length];
double sum = data.Sum();
for (int i = 0; i < res.Length; i++)
{
res[i] = data[i] / sum;
}
return res;
}
}
public static class DoubleExtensions
{
public static bool Any(this double[,] matrix, Func func)
{
for (int i = 0; i < matrix.GetLength(0); i++)
{
for (int j = 0; j < matrix.GetLength(1); j++)
{
if (!func.Invoke(matrix[i, j]))
{
return true;
}
}
}
return false;
}
public static bool All(this double[,] matrix, Func func)
{
List isTrue = new List();
for (int i = 0; i < matrix.GetLength(0); i++)
{
for (int j = 0; j < matrix.GetLength(1);  j++)
{
if (func.Invoke(matrix[i, j]))
{
isTrue.Add(true);
}
else
{
isTrue.Add(false);
}
}
}
return isTrue.All(x => x is true);
}
public static NeuralNetworkData ToMatrix(this double[] vector)
{
if (vector.Any(x => x != 0))
{
double[,] res = new double[vector.Length,1];
for (int i = 0; i < res.GetLength(0); i++)
{
res[i, 0] = vector[i];
}
return new NeuralNetworkData(res);
}
else
{
throw new Exception("No input.");
}
}
public static NeuralNetworkData Transpose(this NeuralNetworkData matrix)
{
if (matrix != null)
{
double[,] res = new double[matrix.Data.GetLength(1), matrix.Data.GetLength(0)];
for (int i = 0; i < matrix.Data.GetLength(0); i++)
{
for (int j = 0; j < matrix.Data.GetLength(1); j++)
{
res[j, i] = matrix.Data[i, j];
}
}
return new NeuralNetworkData(res);
}
else
{
throw new Exception("No input provided!");
}
}
public static double[] ToVector(this NeuralNetworkData matrix)
{
if (matrix.Data.GetLength(1) == 1)
{
double[] res = new double[matrix.Data.GetLength(0)];
for (int i = 0; i < res.Length; i++)
{
res[i] = matrix.Data[i, 0];
}

return (res);
}
else
{
throw new Exception("Matrix too big!");
}
}
public static double[] Multiply(this double[] first, double second)
{
double[] res = new double[first.Length];
for (int i = 0; i < res.Length; i++)
{
res[i] = first[i] * second;
}
return res;
}
}

Вот данные NeuralNetworkData:

Код: Выделить всё

public class NeuralNetworkData
{

private void FillMatrix()
{
for (int i = 0; i < Data.GetLength(0); i++)
{
for (int j = 0; j < Data.GetLength(1); j++)
{
Data[i, j] = rnd.NextDouble() * 0.01;
}
}
}
public static NeuralNetworkData operator *(NeuralNetworkData first, NeuralNetworkData second)
{
if (first.Data.GetLength(1) != second.Data.GetLength(0))
throw new Exception("Matrices cannot be multiplied!");

double[,] res = new double[first.Data.GetLength(0), second.Data.GetLength(1)];

for (int i = 0; i < res.GetLength(0); i++)
{
for (int j = 0; j < res.GetLength(1); j++)
{
double sum = 0;
for (int k = 0; k < first.Data.GetLength(1); k++)
{
sum += first.Data[i, k] * second.Data[k, j];
}
res[i, j] = sum;
}
}

return new NeuralNetworkData(res);
}
public static NeuralNetworkData operator *(double first, NeuralNetworkData second)
{
double[,] res = new double[second.Data.GetLength(0), second.Data.GetLength(1)];
for (int i = 0; i < second.Data.GetLength(0); i++)
{
for (int j = 0; j < second.Data.GetLength(1); j++)
{
res[i, j] = second.Data[i, j] * first;
}
}
return new NeuralNetworkData(res);
}
public static NeuralNetworkData operator +(NeuralNetworkData first, NeuralNetworkData second)
{
if (first.Data.GetLength(1) == second.Data.GetLength(1) &&
first.Data.GetLength(0) == second.Data.GetLength(0))
{
double[,] res = new double[first.Data.GetLength(0), second.Data.GetLength(1)];
for (int i = 0; i < res.GetLength(0); i++)
{
for (int j = 0; j < res.GetLength(1);  j++)
{
res[i, j] = first.Data[i, j] + second.Data[i, j];
}
}
return new NeuralNetworkData(res);
}
else
{
throw new Exception("Not the same length.");
}
}
public static NeuralNetworkData operator -(NeuralNetworkData first, NeuralNetworkData second)
{
if (first.Data.GetLength(1) == second.Data.GetLength(1) &&
first.Data.GetLength(0) == second.Data.GetLength(0))
{
double[,] res = new double[first.Data.GetLength(0), second.Data.GetLength(1)];
for (int i = 0; i < res.GetLength(0); i++)
{
for (int j = 0; j < res.GetLength(1); j++)
{
res[i, j] = first.Data[i, j] - second.Data[i, j];
}
}
return new NeuralNetworkData(res);
}
else
{
throw new Exception("Not the same length.");
}
}
}

Заранее спасибо за все советы.
Я пробовал разные скорости обучения, разное количество нейронов в скрытом слое. К сожалению, ничего не помогло.

Подробнее здесь: https://stackoverflow.com/questions/785 ... parameters

Реклама

1716334419

Anonymous

У меня есть ИНС, реализованная с нуля на C#. Однако не сходилось, в чем может быть проблема? Я пробовал разные функции активации, другой набор данных.  Набор данных генерируется случайным образом, но ИНС в Python работает с тем же набором данных, поэтому можно обучить нейронную сеть данным.
[code]
private NeuralNetworkData ReLU(NeuralNetworkData x)
{
double[,] res = new double[x.Data.GetLength(0), x.Data.GetLength(1)];
for (int i = 0; i < res.Length; i++)
{
res[i, 0] = MathF.Max(0, (float)x.Data[i,0]);
}
return new NeuralNetworkData( res);
}
private NeuralNetworkData Softmax(NeuralNetworkData x)
{
double[,] res = new double[x.Data.GetLength(0), x.Data.GetLength(1)];
double max = x.ToVector().Max(x => x);
double[] exps = x.ToVector().Select(x => Math.Exp(x - max)).ToArray();
double sumExps = exps.Sum();

for (int i = 0; i < res.Length; i++)
{
res[i, 0] = exps[i] / sumExps;
}
return new NeuralNetworkData(res);
}
private NeuralNetworkData ReLUDerivative(NeuralNetworkData x)
{
double[,] res = new double[x.Data.GetLength(0), x.Data.GetLength(1)];
for (int i = 0; i < res.Length; i++)
{
res[i, 0] = x.Data[i, 0] > 0 ? 1 : 0;
}
return new NeuralNetworkData(res);
}
private void FeedForward(int index, int epoch)
{
if (epoch is 0 && index is 0)
{
Weights1 = Weights1.Transpose();
Weights2 = Weights2.Transpose();
}
Input = Scale(DataFile.Data[index].Values).ToMatrix();
Z1 = (Weights1 * Input) + Bias1;
Hidden = ReLU(Z1);
Z2 = (Weights2 * Hidden) + Bias2;
Output =  Softmax(Z2);

//Console.WriteLine($"N1: {Output[0]}, N2: {Output[1]}, N3: {Output[2]}");
}
private double Error(int index)
{
double localError = 0;
for (int i = 0; i < Output.Data.GetLength(0); i++)
{
localError -= (DataFile.Data[index].Label[i] * Math.Log(Output.Data[i, 0] + 1e-9));
}

return localError;
}
private NeuralNetworkData ElementWiseMultiply(NeuralNetworkData first, NeuralNetworkData second)
{
if (first.Data.GetLength(0) == second.Data.GetLength(0))
{
double[] res = new double[first.Data.GetLength(0)];
for (int i = 0; i < res.Length; i++)
{
res[i] = first.Data[i, 0] * second.Data[i, 0];
}
return res.ToMatrix();
}
else
{
throw new Exception("Two vectors are not the same length!");
}
}
private void Backpropagate(int index)
{
Delta2 = Output - DataFile.Data[index].Label.ToMatrix();
Output_Gradient = Delta2 * Hidden.Transpose();
Bias2_Gradient = Delta2;

Delta1 = ElementWiseMultiply(Weights2.Transpose() * Delta2 , ReLUDerivative(Z1));

Hidden_Gradient = Delta1 * Input.Transpose();
Bias1_Gradient = Delta1;

Weights2 = Weights2 - (LearningRate * Output_Gradient);
Bias2 = Bias2 - (LearningRate * Bias2_Gradient);

Weights1 = Weights1 - (LearningRate * Hidden_Gradient);
Bias1 = Bias1 - (LearningRate * Bias1_Gradient);
}
private double[] Scale(double[] data)
{
double[] res = new double[data.Length];
double sum = data.Sum();
for (int i = 0; i < res.Length; i++)
{
res[i] = data[i] / sum;
}
return res;
}
}
public static class DoubleExtensions
{
public static bool Any(this double[,] matrix, Func func)
{
for (int i = 0; i < matrix.GetLength(0); i++)
{
for (int j = 0; j < matrix.GetLength(1); j++)
{
if (!func.Invoke(matrix[i, j]))
{
return true;
}
}
}
return false;
}
public static bool All(this double[,] matrix, Func func)
{
List isTrue = new List();
for (int i = 0; i < matrix.GetLength(0); i++)
{
for (int j = 0; j < matrix.GetLength(1);  j++)
{
if (func.Invoke(matrix[i, j]))
{
isTrue.Add(true);
}
else
{
isTrue.Add(false);
}
}
}
return isTrue.All(x => x is true);
}
public static NeuralNetworkData ToMatrix(this double[] vector)
{
if (vector.Any(x => x != 0))
{
double[,] res = new double[vector.Length,1];
for (int i = 0; i < res.GetLength(0); i++)
{
res[i, 0] = vector[i];
}
return new NeuralNetworkData(res);
}
else
{
throw new Exception("No input.");
}
}
public static NeuralNetworkData Transpose(this NeuralNetworkData matrix)
{
if (matrix != null)
{
double[,] res = new double[matrix.Data.GetLength(1), matrix.Data.GetLength(0)];
for (int i = 0; i < matrix.Data.GetLength(0); i++)
{
for (int j = 0; j < matrix.Data.GetLength(1); j++)
{
res[j, i] = matrix.Data[i, j];
}
}
return new NeuralNetworkData(res);
}
else
{
throw new Exception("No input provided!");
}
}
public static double[] ToVector(this NeuralNetworkData matrix)
{
if (matrix.Data.GetLength(1) == 1)
{
double[] res = new double[matrix.Data.GetLength(0)];
for (int i = 0; i < res.Length; i++)
{
res[i] = matrix.Data[i, 0];
}

return (res);
}
else
{
throw new Exception("Matrix too big!");
}
}
public static double[] Multiply(this double[] first, double second)
{
double[] res = new double[first.Length];
for (int i = 0; i < res.Length; i++)
{
res[i] = first[i] * second;
}
return res;
}
}

[/code]
Вот данные NeuralNetworkData:
[code]public class NeuralNetworkData
{

private void FillMatrix()
{
for (int i = 0; i < Data.GetLength(0); i++)
{
for (int j = 0; j < Data.GetLength(1); j++)
{
Data[i, j] = rnd.NextDouble() * 0.01;
}
}
}
public static NeuralNetworkData operator *(NeuralNetworkData first, NeuralNetworkData second)
{
if (first.Data.GetLength(1) != second.Data.GetLength(0))
throw new Exception("Matrices cannot be multiplied!");

double[,] res = new double[first.Data.GetLength(0), second.Data.GetLength(1)];

for (int i = 0; i < res.GetLength(0); i++)
{
for (int j = 0; j < res.GetLength(1); j++)
{
double sum = 0;
for (int k = 0; k < first.Data.GetLength(1); k++)
{
sum += first.Data[i, k] * second.Data[k, j];
}
res[i, j] = sum;
}
}

return new NeuralNetworkData(res);
}
public static NeuralNetworkData operator *(double first, NeuralNetworkData second)
{
double[,] res = new double[second.Data.GetLength(0), second.Data.GetLength(1)];
for (int i = 0; i < second.Data.GetLength(0); i++)
{
for (int j = 0; j < second.Data.GetLength(1); j++)
{
res[i, j] = second.Data[i, j] * first;
}
}
return new NeuralNetworkData(res);
}
public static NeuralNetworkData operator +(NeuralNetworkData first, NeuralNetworkData second)
{
if (first.Data.GetLength(1) == second.Data.GetLength(1) &&
first.Data.GetLength(0) == second.Data.GetLength(0))
{
double[,] res = new double[first.Data.GetLength(0), second.Data.GetLength(1)];
for (int i = 0; i < res.GetLength(0); i++)
{
for (int j = 0; j < res.GetLength(1);  j++)
{
res[i, j] = first.Data[i, j] + second.Data[i, j];
}
}
return new NeuralNetworkData(res);
}
else
{
throw new Exception("Not the same length.");
}
}
public static NeuralNetworkData operator -(NeuralNetworkData first, NeuralNetworkData second)
{
if (first.Data.GetLength(1) == second.Data.GetLength(1) &&
first.Data.GetLength(0) == second.Data.GetLength(0))
{
double[,] res = new double[first.Data.GetLength(0), second.Data.GetLength(1)];
for (int i = 0; i < res.GetLength(0); i++)
{
for (int j = 0; j < res.GetLength(1); j++)
{
res[i, j] = first.Data[i, j] - second.Data[i, j];
}
}
return new NeuralNetworkData(res);
}
else
{
throw new Exception("Not the same length.");
}
}
}
[/code]
Заранее спасибо за все советы.
Я пробовал разные скорости обучения, разное количество нейронов в скрытом слое. К сожалению, ничего не помогло. 

Подробнее здесь: [url]https://stackoverflow.com/questions/78514773/why-is-my-ann-in-c-sharp-not-converging-despite-tuning-hyperparameters[/url]

Ответить Пред. тема След. тема

1 сообщение • Страница 1 из 1

Быстрый ответ

Заголовок:

Имя пользователя:

Изменение регистра текста:

Смайлики

Ещё смайлики…

К этому ответу прикреплено по крайней мере одно вложение.

Если вы не хотите добавлять вложения, оставьте поля пустыми. Можно прикреплять файлы, перетаскивая их в окно сообщения.

Максимально разрешённый размер вложения: 15 МБ.

Имя файла:

Комментарий к файлу:

Имя файла	Комментарий к файлу	Размер	Статус

Похожие темы

Ответы

Просмотры

Последнее сообщение

Модель всегда классифицирует изображения как кошек с высокой уверенностью, несмотря на настройку гиперпараметров

Последнее сообщение Anonymous « 10 ноя 2024, 03:01
Добавлено в форуме Python

Anonymous » 10 ноя 2024, 03:01 » в форуме Python

Я пытаюсь обучить модель на изображениях, используя приведенный ниже код. Моя структура каталогов следующая:

Папка PetImages размером примерно 1 ГБ расположена рядом с моим файлом main.py скрипт.
Внутри папки PetImages есть две подпапки: Cats и...

0 Ответы

10 Просмотры

Последнее сообщение Anonymous
10 ноя 2024, 03:01
Получение гиперпараметров LightGBM после обучения модели

Последнее сообщение Гость « 21 сен 2023, 22:48
Добавлено в форуме Python

Гость » 21 сен 2023, 22:48 » в форуме Python

Я использовал optuna для создания сотен моделей для набора данных. Несколько моделей оказались полезными, я случайно не сохранил гиперпараметры для хороших.

Я сохранил модель в формате .txt. Можно ли как-нибудь извлечь гиперпараметры из уже...

0 Ответы

57 Просмотры

Последнее сообщение Гость
21 сен 2023, 22:48
Оптимизация гиперпараметров Optuna во вложенном цикле CV предполагает идентичные гиперпараметры.

Последнее сообщение Anonymous « 02 янв 2024, 20:46
Добавлено в форуме Python

Anonymous » 02 янв 2024, 20:46 » в форуме Python

Я выполняю вложенное CV, при этом Optuna работает во внутреннем цикле, а лучшая модель затем оценивается на оставшихся данных внешнего цикла.

Однако Optuna предлагает одни и те же параметры для всех разделений CV, несмотря на разные данные.

я =...

0 Ответы

46 Просмотры

Последнее сообщение Anonymous
02 янв 2024, 20:46
ElasticNetCV в Python: получить полную сетку гиперпараметров с соответствующим MSE?

Последнее сообщение Anonymous « 26 июн 2024, 11:49
Добавлено в форуме Python

Anonymous » 26 июн 2024, 11:49 » в форуме Python

Я установил ElasticNetCV в Python с тремя разбиениями:
import numpy as np
from sklearn.linear_model import LinearRegression

#Sample data:
num_samples = 100 # Number of samples
num_features = 1000 # Number of features
X = np.random.rand(num_samples,...

0 Ответы

9 Просмотры

Последнее сообщение Anonymous
26 июн 2024, 11:49
Оптимизация гиперпараметров для повышения точности классификации с использованием набора данных NSL-KDD в scikit-learn

Последнее сообщение Anonymous « 30 окт 2024, 23:16
Добавлено в форуме Python

Anonymous » 30 окт 2024, 23:16 » в форуме Python

Я работаю с набором данных NSL-KDD, и моя задача — повысить точность алгоритмов классификации с помощью scikit-learn. В частности, я заинтересован в достижении показателя точности более 80%.
Я реализовал различные алгоритмы классификации из...

0 Ответы

13 Просмотры

Последнее сообщение Anonymous
30 окт 2024, 23:16

Вернуться в «C#»

Programmiererforum