2025-04-22 21:23:53 +02:00
11 changed files with 39 additions and 98 deletions
--- a/src/cnn/free.c
+++ b/src/cnn/free.c
@ -181,7 +181,6 @@ void free_network(Network* network) {
        // et que cela soit le cas UNIQUEMENT pour la mémoire allouée au réseau
        // Représente un gain de 45mn sur VGG16
        (void)network;
        free_all_memory();
    #else
        for (int i=network->size-2; i>=0; i--) {
--- a/src/cnn/test_network.c
+++ b/src/cnn/test_network.c
@ -1,8 +1,7 @@
 #include <stdbool.h>
 #include <assert.h>
 #include <string.h>
 #include <stdlib.h>
 #include <stdio.h>
 #include <stdbool.h>
 #include <string.h>
 #include "../common/include/memory_management.h"
 #include "../common/include/mnist.h"
@ -184,13 +183,12 @@ void recognize_mnist(Network* network, char* input_file, char* out) {
 }
 void recognize_jpg(Network* network, char* input_file, char* out) {
-    int width; // Dimensions de l'image, qui doit être carrée
+    int width, height; // Dimensions de l'image
    int maxi;
    imgRawImage* image = loadJpegImageFile(input_file);
    width = image->width;
-
+    height = image->height;
    assert(image->width == image->height);
    if (! strcmp(out, "json")) {
        printf("{\n");
--- a/src/cnn/train.c
+++ b/src/cnn/train.c
@ -127,7 +127,7 @@ void* train_thread(void* parameters) {
 void train(int dataset_type, char* images_file, char* labels_file, char* data_dir, int epochs, char* out, char* recover) {
    #ifdef USE_CUDA
-    bool compatibility = cuda_setup(true);
+    bool compatibility = check_cuda_compatibility();
    if (!compatibility) {
        printf("Exiting.\n");
        exit(1);
--- a/src/common/include/utils.h
+++ b/src/common/include/utils.h
@ -60,10 +60,8 @@ extern "C"
 #endif
 /*
 * Vérification de la compatibilité CUDA
 * spécifier avec "verbose" si il faut afficher
 * la carte utilisée notamment
 */
-bool cuda_setup(bool verbose);
+bool check_cuda_compatibility();
 #ifdef __CUDACC__
 extern "C"
--- a/src/common/utils.c
+++ b/src/common/utils.c
@ -1,7 +1,6 @@
 #include <stdbool.h>
 #include <stdlib.h>
 #include <stdio.h>
 #ifdef USE_CUDA
    #ifndef __CUDACC__
        #include "cuda_runtime.h"
@ -43,65 +42,39 @@ int i_div_up(int a, int b) { // Partie entière supérieure de a/b
 #ifdef __CUDACC__
 extern "C"
 #endif
-bool cuda_setup(bool verbose) {
+bool check_cuda_compatibility() {
    #ifdef __CUDACC__
    int nDevices;
    int selected_device = 0;
    cudaDeviceProp selected_prop;
    cudaDeviceProp prop;
    cudaGetDeviceCount(&nDevices);
-    if (nDevices <= 0) { // I've seen weird issues when there is no GPU at all
+    if (nDevices == 0) {
-        if (verbose) {
+        printf("Pas d'utilisation du GPU\n\n");
            printf("Pas d'utilisation du GPU\n\n");
        }
        return false;
    }
-    if (verbose) {
+    printf("GPUs disponibles:\n");
        printf("GPUs disponibles:\n");
    }
    cudaGetDeviceProperties(&selected_prop, selected_device);
    for (int i=0; i < nDevices; i++) {
        cudaGetDeviceProperties(&prop, i);
-
+        printf(" - %s\n\t - Compute Capability: %d.%d\n\t - Memory available: ", prop.name, prop.major, prop.minor);
-        if (verbose) {
+        printf_memory(prop.totalGlobalMem);
-            printf(" - %s\n\t - Compute Capability: %d.%d\n\t - Memory available: ", prop.name, prop.major, prop.minor);
+        printf("\n\t - Shared Memory per block: ");
-            printf_memory(prop.totalGlobalMem);
+        printf_memory(prop.sharedMemPerBlock);
-            printf("\n\t - Shared Memory per block: ");
+        printf("\n\n");
            printf_memory(prop.sharedMemPerBlock);
            printf("\n\n");
        }
        if (prop.clockRate*prop.multiProcessorCount >= selected_prop.clockRate*selected_prop.multiProcessorCount) { // This criteria approximately matches the best device
            selected_prop = prop;
            selected_device = i;
        }
    }
-    cudaSetDevice(selected_device); // Select the best device for computation
+    cudaGetDeviceProperties(&prop, 0);
-    if (verbose) {
+    printf("Utilisation du GPU: " BLUE "%s" RESET "\n\n", prop.name);
        printf("Utilisation du GPU: " BLUE "%s" RESET "\n\n", selected_prop.name);
    }
-    if (BLOCKSIZE_x*BLOCKSIZE_y*BLOCKSIZE_z > prop.maxThreadsPerBlock) {
+    if (prop.sharedMemPerBlock != MEMORY_BLOCK) {
        printf_error((char*)"La taille de bloc sélectionnée est trop grande.\n");
        printf("\tMaximum accepté: %d\n", selected_prop.maxThreadsPerBlock);
        exit(1);
    }
    if (selected_prop.sharedMemPerBlock != MEMORY_BLOCK) { // C'est un warning, on l'affiche dans tous les cas
        printf_warning((char*)"La taille des blocs mémoire du GPU et celle utilisée dans le code diffèrent.\n");
        printf("\tCela peut mener à une utilisation supplémentaire de VRAM.\n");
-        printf("\tChanger MEMORY_BLOCK à %ld dans src/include/memory_management.h\n", selected_prop.sharedMemPerBlock);
+        printf("\tChanger MEMORY_BLOCK à %ld dans src/include/memory_management.h\n", prop.sharedMemPerBlock);
    }
    return true;
    #else
-    if (verbose) {
+    printf("Pas d'utilisation du GPU\n\n");
        printf("Pas d'utilisation du GPU\n\n");
    }
    return false;
    #endif
 }
--- a/src/common/utils.cu
+++ b/src/common/utils.cu
@ -1,7 +1,6 @@
 #include <stdbool.h>
 #include <stdlib.h>
 #include <stdio.h>
 #ifdef USE_CUDA
    #ifndef __CUDACC__
        #include "cuda_runtime.h"
@ -43,65 +42,39 @@ int i_div_up(int a, int b) { // Partie entière supérieure de a/b
 #ifdef __CUDACC__
 extern "C"
 #endif
-bool cuda_setup(bool verbose) {
+bool check_cuda_compatibility() {
    #ifdef __CUDACC__
    int nDevices;
    int selected_device = 0;
    cudaDeviceProp selected_prop;
    cudaDeviceProp prop;
    cudaGetDeviceCount(&nDevices);
-    if (nDevices <= 0) { // I've seen weird issues when there is no GPU at all
+    if (nDevices == 0) {
-        if (verbose) {
+        printf("Pas d'utilisation du GPU\n\n");
            printf("Pas d'utilisation du GPU\n\n");
        }
        return false;
    }
-    if (verbose) {
+    printf("GPUs disponibles:\n");
        printf("GPUs disponibles:\n");
    }
    cudaGetDeviceProperties(&selected_prop, selected_device);
    for (int i=0; i < nDevices; i++) {
        cudaGetDeviceProperties(&prop, i);
-
+        printf(" - %s\n\t - Compute Capability: %d.%d\n\t - Memory available: ", prop.name, prop.major, prop.minor);
-        if (verbose) {
+        printf_memory(prop.totalGlobalMem);
-            printf(" - %s\n\t - Compute Capability: %d.%d\n\t - Memory available: ", prop.name, prop.major, prop.minor);
+        printf("\n\t - Shared Memory per block: ");
-            printf_memory(prop.totalGlobalMem);
+        printf_memory(prop.sharedMemPerBlock);
-            printf("\n\t - Shared Memory per block: ");
+        printf("\n\n");
            printf_memory(prop.sharedMemPerBlock);
            printf("\n\n");
        }
        if (prop.clockRate*prop.multiProcessorCount >= selected_prop.clockRate*selected_prop.multiProcessorCount) { // This criteria approximately matches the best device
            selected_prop = prop;
            selected_device = i;
        }
    }
-    cudaSetDevice(selected_device); // Select the best device for computation
+    cudaGetDeviceProperties(&prop, 0);
-    if (verbose) {
+    printf("Utilisation du GPU: " BLUE "%s" RESET "\n\n", prop.name);
        printf("Utilisation du GPU: " BLUE "%s" RESET "\n\n", selected_prop.name);
    }
-    if (BLOCKSIZE_x*BLOCKSIZE_y*BLOCKSIZE_z > prop.maxThreadsPerBlock) {
+    if (prop.sharedMemPerBlock != MEMORY_BLOCK) {
        printf_error((char*)"La taille de bloc sélectionnée est trop grande.\n");
        printf("\tMaximum accepté: %d\n", selected_prop.maxThreadsPerBlock);
        exit(1);
    }
    if (selected_prop.sharedMemPerBlock != MEMORY_BLOCK) { // C'est un warning, on l'affiche dans tous les cas
        printf_warning((char*)"La taille des blocs mémoire du GPU et celle utilisée dans le code diffèrent.\n");
        printf("\tCela peut mener à une utilisation supplémentaire de VRAM.\n");
-        printf("\tChanger MEMORY_BLOCK à %ld dans src/include/memory_management.h\n", selected_prop.sharedMemPerBlock);
+        printf("\tChanger MEMORY_BLOCK à %ld dans src/include/memory_management.h\n", prop.sharedMemPerBlock);
    }
    return true;
    #else
-    if (verbose) {
+    printf("Pas d'utilisation du GPU\n\n");
        printf("Pas d'utilisation du GPU\n\n");
    }
    return false;
    #endif
 }
--- a/src/scripts/convolution_benchmark.cu
+++ b/src/scripts/convolution_benchmark.cu
@ -217,7 +217,7 @@ int main(int argc, char* argv[]) {
    /*
    printf("Checking CUDA compatibility.\n");
-    bool cuda_compatible = cuda_setup(true);
+    bool cuda_compatible = check_cuda_compatibility();
    if (!cuda_compatible) {
        printf(RED "CUDA not compatible, skipping tests.\n" RESET);
        return 0;
--- a/test/cnn_convolution.cu
+++ b/test/cnn_convolution.cu
@ -192,7 +192,7 @@ void run_convolution_test(int input_width, int output_width, int rows, int colum
 int main() {
    printf("Checking CUDA compatibility.\n");
-    bool cuda_compatible = cuda_setup(true);
+    bool cuda_compatible = check_cuda_compatibility();
    if (!cuda_compatible) {
        printf(RED "CUDA not compatible, skipping tests.\n" RESET);
        return 0;
--- a/test/cnn_function.cu
+++ b/test/cnn_function.cu
@ -91,7 +91,7 @@ void test1(int activation, bool use_local_kernel) {
 int main() {
    printf("Checking CUDA compatibility.\n");
-    bool cuda_compatible = cuda_setup(true);
+    bool cuda_compatible = check_cuda_compatibility();
    if (!cuda_compatible) {
        printf(RED "CUDA not compatible, skipping tests.\n" RESET);
        return 0;
--- a/test/cnn_matrix_multiplication.cu
+++ b/test/cnn_matrix_multiplication.cu
@ -127,7 +127,7 @@ void run_matrices_test(int n, int p, int q) {
 int main() {
    printf("Checking CUDA compatibility.\n");
-    bool cuda_compatible = cuda_setup(true);
+    bool cuda_compatible = check_cuda_compatibility();
    if (!cuda_compatible) {
        printf(RED "CUDA not compatible, skipping tests.\n" RESET);
        return 0;
--- a/test/memory_management.cu
+++ b/test/memory_management.cu
@ -18,7 +18,7 @@ __global__ void check_access(int* array, int range) {
 int main() {
    printf("Checking CUDA compatibility.\n");
-    bool cuda_compatible = cuda_setup(true);
+    bool cuda_compatible = check_cuda_compatibility();
    if (!cuda_compatible) {
        printf(RED "CUDA not compatible, skipping tests.\n" RESET);
        return 0;