2022-04-07 22:07:32 +02:00
|
|
|
#include <stdlib.h>
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <string.h>
|
|
|
|
|
2022-04-08 15:53:29 +02:00
|
|
|
#include "neural_network.c"
|
|
|
|
#include "neuron_io.c"
|
|
|
|
#include "mnist.c"
|
|
|
|
|
|
|
|
|
2022-04-07 22:07:32 +02:00
|
|
|
void help(char* call) {
|
|
|
|
printf("Usage: %s ( train | recognize ) [OPTIONS]\n\n", call);
|
|
|
|
printf("OPTIONS:\n");
|
|
|
|
printf("\ttrain:\n");
|
2022-04-08 15:53:29 +02:00
|
|
|
printf("\t\t--batches | -b [int]\tNombre de batches.\n");
|
|
|
|
printf("\t\t--couches | -c [int]\tNombres de couches.\n");
|
|
|
|
printf("\t\t--neurons | -n [int]\tNombre de neurones sur la première couche.\n");
|
|
|
|
printf("\t\t--recover | -r [FILENAME]\tRécupérer depuis un modèle existant.\n");
|
|
|
|
printf("\t\t--images | -i [FILENAME]\tFichier contenant les images.\n");
|
|
|
|
printf("\t\t--labels | -l [FILENAME]\tFichier contenant les labels.\n");
|
|
|
|
printf("\t\t--out | -o [FILENAME]\tFichier où écrire le réseau de neurones.\n");
|
2022-04-07 22:07:32 +02:00
|
|
|
printf("\trecognize:\n");
|
2022-04-08 15:53:29 +02:00
|
|
|
printf("\t\t--modele | -m [FILENAME]\tFichier contenant le réseau de neurones.\n");
|
|
|
|
printf("\t\t--in | -i [FILENAME]\tFichier contenant les images à reconnaître.\n");
|
|
|
|
printf("\t\t--out | -o (text|json)\tFormat de sortie.\n");
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void ecrire_image_dans_reseau(int** image, Reseau* reseau, int height, int width) {
|
|
|
|
for (int i=0; i < height; i++) {
|
|
|
|
for (int j=0; j < width; j++) {
|
|
|
|
reseau->couches[0]->neurones[i*height+j]->activation = (float)image[i][j] / 255.0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void train(int batches, int couches, int neurons, char* recovery, char* image_file, char* label_file, char* out) {
|
2022-04-08 16:07:44 +02:00
|
|
|
// Entraînement du réseau sur le set de données MNIST
|
2022-04-08 15:53:29 +02:00
|
|
|
Reseau* reseau;
|
|
|
|
|
|
|
|
//int* repartition = malloc(sizeof(int)*couches);
|
|
|
|
int* sortie_voulue;
|
|
|
|
int repartition[5] = {784, 100, 75, 40, 10};
|
|
|
|
//generer_repartition(couches, repartition);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* On repart d'un réseau déjà créée stocké dans un fichier
|
|
|
|
* ou on repart de zéro si aucune backup n'est fournie
|
|
|
|
* */
|
|
|
|
if (! recovery) {
|
|
|
|
reseau = malloc(sizeof(Reseau));
|
|
|
|
creation_du_reseau_neuronal(reseau, repartition, couches);
|
|
|
|
} else {
|
|
|
|
reseau = lire_reseau(recovery);
|
|
|
|
printf("Backup restorée.\n");
|
|
|
|
}
|
|
|
|
|
|
|
|
// Chargement des images du set de données MNIST
|
|
|
|
int* parameters = read_mnist_images_parameters(image_file);
|
|
|
|
int nb_images = parameters[0];
|
|
|
|
int height = parameters[1];
|
|
|
|
int width = parameters[2];
|
|
|
|
|
|
|
|
int*** images = read_mnist_images(image_file);
|
|
|
|
unsigned int* labels = read_mnist_labels(label_file);
|
|
|
|
|
|
|
|
for (int i=0; i < batches; i++) {
|
|
|
|
printf("Batch [%d/%d]\n", i, batches);
|
|
|
|
for (int j=0; j < nb_images; j++) {
|
|
|
|
printf("\rImage [%d/%d]", j, nb_images);
|
|
|
|
ecrire_image_dans_reseau(images[j], reseau, height, width);
|
|
|
|
sortie_voulue = creation_de_la_sortie_voulue(reseau, labels[j]);
|
|
|
|
forward_propagation(reseau);
|
|
|
|
backward_propagation(reseau, sortie_voulue);
|
|
|
|
}
|
|
|
|
printf("\n");
|
2022-04-08 16:07:44 +02:00
|
|
|
modification_du_reseau_neuronal(reseau);
|
2022-04-08 15:53:29 +02:00
|
|
|
ecrire_reseau(out, reseau);
|
|
|
|
}
|
2022-04-07 22:07:32 +02:00
|
|
|
}
|
|
|
|
|
2022-04-08 16:07:44 +02:00
|
|
|
void recognize(char* modele, char* entree, char* sortie) {
|
|
|
|
Reseau* reseau = lire_reseau(modele);
|
|
|
|
|
|
|
|
int* parameters = read_mnist_images_parameters(entree);
|
|
|
|
int nb_images = parameters[0];
|
|
|
|
int height = parameters[1];
|
|
|
|
int width = parameters[2];
|
|
|
|
|
|
|
|
int*** images = read_mnist_images(entree);
|
|
|
|
|
|
|
|
for (int i=0; i < nb_images; i++) {
|
|
|
|
printf("Image %d\n", i);
|
|
|
|
ecrire_image_dans_reseau(images[i], reseau, height, width);
|
|
|
|
forward_propagation(reseau);
|
|
|
|
for (int j=0; j < reseau->couches[reseau->nb_couches-1]->nb_neurones; j++) {
|
|
|
|
printf("Probabilité %d: %f\n", j, reseau->couches[reseau->nb_couches-1]->neurones[j]->activation);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2022-04-08 15:53:29 +02:00
|
|
|
|
2022-04-07 22:07:32 +02:00
|
|
|
int main(int argc, char* argv[]) {
|
|
|
|
if (argc < 2) {
|
|
|
|
printf("Pas d'action spécifiée\n");
|
|
|
|
help(argv[0]);
|
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
if (! strcmp(argv[1], "train")) {
|
|
|
|
int batches = 5;
|
|
|
|
int couches = 5;
|
|
|
|
int neurons = 784;
|
|
|
|
char* images = NULL;
|
|
|
|
char* labels = NULL;
|
2022-04-08 15:53:29 +02:00
|
|
|
char* recovery = NULL;
|
2022-04-07 22:07:32 +02:00
|
|
|
char* out = NULL;
|
|
|
|
int i=2;
|
|
|
|
while (i < argc) {
|
|
|
|
// Utiliser un switch serait sans doute plus élégant
|
|
|
|
if ((! strcmp(argv[i], "--batches"))||(! strcmp(argv[i], "-b"))) {
|
|
|
|
batches = strtol(argv[i+1], NULL, 10);
|
|
|
|
i += 2;
|
|
|
|
} else
|
|
|
|
if ((! strcmp(argv[i], "--couches"))||(! strcmp(argv[i], "-c"))) {
|
|
|
|
couches = strtol(argv[i+1], NULL, 10);
|
|
|
|
i += 2;
|
|
|
|
} else if ((! strcmp(argv[i], "--neurons"))||(! strcmp(argv[i], "-n"))) {
|
|
|
|
neurons = strtol(argv[i+1], NULL, 10);
|
|
|
|
i += 2;
|
|
|
|
} else if ((! strcmp(argv[i], "--images"))||(! strcmp(argv[i], "-i"))) {
|
|
|
|
images = argv[i+1];
|
|
|
|
i += 2;
|
|
|
|
} else if ((! strcmp(argv[i], "--labels"))||(! strcmp(argv[i], "-l"))) {
|
|
|
|
labels = argv[i+1];
|
|
|
|
i += 2;
|
2022-04-08 15:53:29 +02:00
|
|
|
} else if ((! strcmp(argv[i], "--recover"))||(! strcmp(argv[i], "-r"))) {
|
|
|
|
recovery = argv[i+1];
|
|
|
|
i += 2;
|
2022-04-07 22:07:32 +02:00
|
|
|
} else if ((! strcmp(argv[i], "--out"))||(! strcmp(argv[i], "-o"))) {
|
|
|
|
out = argv[i+1];
|
|
|
|
i += 2;
|
|
|
|
} else {
|
|
|
|
printf("%s : Argument non reconnu\n", argv[i]);
|
|
|
|
i++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (! images) {
|
|
|
|
printf("Pas de fichier d'images spécifié\n");
|
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
if (! labels) {
|
|
|
|
printf("Pas de fichier de labels spécifié\n");
|
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
if (! out) {
|
|
|
|
printf("Pas de fichier de sortie spécifié, default: out.bin\n");
|
|
|
|
out = "out.bin";
|
|
|
|
}
|
|
|
|
// Entraînement en sourçant neural_network.c
|
2022-04-08 15:53:29 +02:00
|
|
|
train(batches, couches, neurons, recovery, images, labels, out);
|
2022-04-07 22:07:32 +02:00
|
|
|
exit(0);
|
|
|
|
}
|
|
|
|
if (! strcmp(argv[1], "recognize")) {
|
|
|
|
char* in = NULL;
|
|
|
|
char* modele = NULL;
|
|
|
|
char* out = NULL;
|
|
|
|
int i=2;
|
|
|
|
while(i < argc) {
|
|
|
|
if ((! strcmp(argv[i], "--in"))||(! strcmp(argv[i], "-i"))) {
|
|
|
|
in = argv[i+1];
|
|
|
|
i += 2;
|
|
|
|
} else if ((! strcmp(argv[i], "--modele"))||(! strcmp(argv[i], "-m"))) {
|
|
|
|
modele = argv[i+1];
|
|
|
|
i += 2;
|
|
|
|
} else if ((! strcmp(argv[i], "--out"))||(! strcmp(argv[i], "-o"))) {
|
|
|
|
out = argv[i+1];
|
|
|
|
i += 2;
|
|
|
|
} else {
|
|
|
|
printf("%s : Argument non reconnu\n", argv[i]);
|
|
|
|
i++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (! in) {
|
|
|
|
printf("Pas d'entrée spécifiée\n");
|
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
if (! modele) {
|
|
|
|
printf("Pas de modèle spécifié\n");
|
|
|
|
exit(1);
|
|
|
|
}
|
|
|
|
if (! out) {
|
|
|
|
out = "text";
|
|
|
|
}
|
2022-04-08 16:07:44 +02:00
|
|
|
recognize(modele, in, out);
|
2022-04-07 22:07:32 +02:00
|
|
|
// Reconnaissance puis affichage des données sous le format spécifié
|
|
|
|
exit(0);
|
|
|
|
}
|
|
|
|
printf("Option choisie non reconnue: %s\n", argv[1]);
|
|
|
|
help(argv[0]);
|
|
|
|
return 1;
|
|
|
|
}
|