avec tensorflow

cyberax64 · Sep 7, 2020 · 9502a1d · 9502a1d
1 parent c3c72fd
commit 9502a1d
Show file tree

Hide file tree

Showing 2 changed files with 239 additions and 30 deletions.
diff --git a/main_numpy.py b/main_numpy.py
@@ -122,40 +122,39 @@ def get_data(data_file, train, test):
 class AIExampleNumpy:
     """Réseau de neuronnes Perceptron multicouches avec numpy."""
 
-    def __init__(self, data, learningrate):
-        """ data = datas mis en forme
-            learningrate = coeff important
-        """
-
-        self.learningrate = learningrate
+    def __init__(self, data):
 
+        print("Création de l'objet ...")
         # Les datas
         [self.x_train, self.y_train, self.x_test, self.y_test] = data
 
         # Réseau de neurones: colonne 16 en entrée, 2 nodes de 100, sortie de 26 caractères
         self.layers = [16, 100, 100, 26]
+
         # Fonction d'activation: imite l'activation d'un neuronne
         self.activations = [relu, relu, sigmoid]
 
-    def training(self):
-        """Apprentissage avec 16 000 lignes"""
-
-        # Matrice diagonale de 1
-        diagonale = np.eye(26, 26)
+        # Matrice self.diagonale de 1
+        self.diagonale = np.eye(26, 26)
 
         # globals() Return a dictionary representing the current global symbol table.
         self.activations_prime = [globals()[fonction.__name__ + '_prime'] \
                                             for fonction in self.activations]
 
-        node_dict = {}
-
         # Liste des poids
         # Initialisation des poids des nodes, pour ne pas à être à 0
         # Construit 3 matrices (100x16, 100x100, 26x100)
         # /np.sqrt() résultat expérimental de l'initialisation de Xavier Glorot et He
-        weight_list = [np.random.randn(self.layers[k+1], self.layers[k]) / \
+        self.weight_init = [np.random.randn(self.layers[k+1], self.layers[k]) / \
                        np.sqrt(self.layers[k]) for k in range(len(self.layers)-1)]
 
+    def training(self, learningrate):
+        """Apprentissage avec 16 000 lignes"""
+
+        node_dict = {}
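+        # Start from the initial weights.
+        # NOTE(review): this binds the same list object as self.weight_init,
+        # and the in-place `-=` update further down modifies its arrays; a
+        # later training() call on the same object would then not restart
+        # from the initial weights - confirm and copy the arrays if needed.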
+        weight_list = self.weight_init
+
         # vecteur_ligne = image en ligne à la 1ère itération
         # nombre_lettre = nombre correspondant à la lettre de l'image
         # i pour itération, vecteur_colonne = x_train de i, nombre_lettre = y_train de i
@@ -178,7 +177,7 @@ def training(self):
                 node_dict[k+1] = vecteur_colonne
 
             # Retro propagation, delta_a = écart entre la sortie réelle et attendue
-            delta_a = vecteur_colonne - diagonale[:,[nombre_lettre]]
+            delta_a = vecteur_colonne - self.diagonale[:,[nombre_lettre]]
             # Parcours des nodes en sens inverse pour corriger proportionnellemnt
             # les poids en fonction de l'erreur par rapport à la valeur souhaitée
             # Descente du Gradient stochastique
@@ -187,14 +186,13 @@ def training(self):
                 delta_w = np.dot(delta_z, node_dict[k].T)
                 delta_a = np.dot(weight_list[k].T, delta_z)
                 # Pour converger vers le minimum d'erreur
-                weight_list[k] -= self.learningrate * delta_w
+                weight_list[k] -= learningrate * delta_w
 
         return weight_list
 
     def testing(self, weight_list):
         """Teste avec les images de testing, retourne le ratio de bon résultats"""
 
-        # #print("Testing...")
         # Nombre de bonnes reconnaissance
         success = 0
 
@@ -223,8 +221,8 @@ def testing(self, weight_list):
     test = 4000
     data = get_data(data_file, train, test)
     print(f"Get data done. {data[0].shape, data[1].shape, data[2].shape, data[3].shape}")
-    for i in range(10):
-        print(f"Train Value {i} = {data[0][i]}")
+    for i in range(3):
+        print(f"\nTrain Value {i} = {data[0][i]}")
         print(f"Train Label {i} = {data[1][i]}")
         print(f"Test Value {i} = {data[2][i]}")
         print(f"Test Label {i} = {data[3][i]}")
@@ -234,17 +232,19 @@ def testing(self, weight_list):
     # 0.0222  # meilleur résultat
     t = time()
     result = []
-    for k in range(100):
-        learningrate = 0.0200 + (k * 0.00005)
+    print()
+    for j in range(10):
+        print(f"Initialisation {j}:")
+        aie = AIExampleNumpy(data)
+        for k in range(10):
+            learningrate = 0.021 + (k * 0.0005)
+            weight_list = aie.training(learningrate)
+            resp = aie.testing(weight_list)
+            result.append([learningrate, resp])
+
+            print(f"    {k}: Learningrate: {round(learningrate, 4)} Résultat {round(resp, 2)} %")
+        print()
 
-        aie = AIExampleNumpy(data, learningrate)
-
-        weight_list = aie.training()
-        resp = aie.testing(weight_list)
-        result.append([learningrate, resp])
-
-        print(f"Learningrate: {learningrate} Résultat {round(resp, 2)} %")
     print("Temps de calcul par cycle:", round((time()-t)/100, 2), "s")
-
     best = sorted(result, key=operator.itemgetter(1), reverse=True)
-    print(f"Meilleur résultat: learningrate={best[0][0]} efficacité={best[0][1]}")
+    print(f"Meilleur résultat: learningrate = {best[0][0]} efficacité = {round(best[0][1], 4)}")
diff --git a/main_tensorflow.py b/main_tensorflow.py
@@ -0,0 +1,209 @@
+#!/usr/bin/env python3
+
+########################################################################
+# This file is part of AI Example.
+#
+# AI Example is free software: you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+#
+# AI Example is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+########################################################################
+
+
+import os
+from time import time
+import operator
+import numpy as np
+from tensorflow import keras
+
+"""
+Exemple construit sur documentation tensorflow:
+    https://www.tensorflow.org/tutorials/keras/classification
+"""
+
+# Value handed to the model's fit call as its `epochs` argument.
+epochs = 50
+
+
+# Maps each capital letter "A".."Z" to its class index 0..25.
+CHARS_DICT = {letter: index
+              for index, letter in enumerate("ABCDEFGHIJKLMNOPQRSTUVWXYZ")}
+
+
+def main(data):
+    """Build, train and evaluate the Keras classifier on the given dataset.
+
+    Args:
+        data: Four-item sequence, unpacked as
+            [train_images, train_labels, test_images, test_labels].
+
+    Prints the accuracy returned by ``model.evaluate`` on the test data,
+    rounded to 4 decimals. Returns None.
+    """
+    train_images, train_labels, test_images, test_labels = data
+
+    # A network is first configured layer by layer, then compiled.
+    model = build_the_model()
+    model = compile_the_model(model)
+
+    # Training
+    model = training_the_model(model, train_images, train_labels, epochs)
+
+    # Accuracy check on the test data; the loss value is not reported.
+    _, test_acc = model.evaluate(test_images, test_labels)
+    print("\nTesting ......    \nEfficacité sur les tests:", round(test_acc, 4))
+
+
+def get_data(data_file, train, test):
+    """Load the letter-recognition file and split it into train/test arrays.
+
+    Each non-blank line holds a capital letter followed by 16 integer
+    features, comma separated, for example:
+        T,2,8,3,5,1,8,13,0,6,6,10,8,0,8,0,8
+
+    Args:
+        data_file: Path of the text file to read.
+        train: Number of leading rows stored in the training arrays.
+        test: Number of following rows stored in the testing arrays.
+
+    Returns:
+        [x_train, y_train, x_test, y_test], all uint8 numpy arrays:
+            x_train: features for training, shape (train, 16)
+            y_train: labels for training, shape (train,)
+            x_test: features for testing, shape (test, 16)
+            y_test: labels for testing, shape (test,)
+        Blank lines are skipped and rows beyond train + test are ignored.
+        Rows the file does not provide stay filled with zeros.
+
+    Raises:
+        KeyError: if a line does not start with a key of CHARS_DICT.
+        ValueError: if a feature cannot be converted with int().
+        IndexError: if a line has fewer than 17 comma-separated fields.
+    """
+
+    print("\nGet datas ...")
+    # The with block closes the file itself; no explicit close() is needed.
+    with open(data_file) as f:
+        text = f.read()
+
+    # Output arrays, filled row by row below
+    x_train = np.zeros((train, 16), dtype=np.uint8)
+    x_test = np.zeros((test, 16), dtype=np.uint8)
+    y_train = np.zeros((train), dtype=np.uint8)
+    y_test = np.zeros((test), dtype=np.uint8)
+
+    rows_wanted = train + test
+    row = 0
+    for line in text.splitlines():
+        # Stop once both arrays are full instead of indexing past x_test.
+        if row >= rows_wanted:
+            break
+
+        # Tolerate blank lines (for instance at the end of the file).
+        if not line.strip():
+            continue
+
+        fields = line.split(',')
+
+        # Letter converted to its integer class index
+        label = CHARS_DICT[fields[0]]
+
+        # The 16 feature values of the letter (fields 1 to 16)
+        values = [int(fields[i]) for i in range(1, 17)]
+
+        # The first `train` rows go to training, the following ones to testing.
+        if row < train:
+            x_train[row] = values
+            y_train[row] = label
+        else:
+            x_test[row - train] = values
+            y_test[row - train] = label
+        row += 1
+
+    return [x_train, y_train, x_test, y_test]
+
+
+def get_class_names():
+    """Return the 26 class names: the capital letters "A" to "Z", in order."""
+
+    return [letter for letter in "ABCDEFGHIJKLMNOPQRSTUVWXYZ"]
+
+
+def build_the_model():
+    """Create the (not yet compiled) Keras model.
+
+    The model is a `keras.Sequential` stack of three layers:
+
+        1. `keras.layers.Flatten(input_shape=(16, 1))` only reformats its
+           input; this layer has no parameters to learn.
+        2. `keras.layers.Dense(128, activation='relu')` is a densely
+           (fully) connected layer of 128 nodes.
+        3. `keras.layers.Dense(26, activation='softmax')` is the output
+           layer: 26 nodes, one score per class.
+
+    Returns:
+        The `keras.Sequential` model holding these layers.
+    """
+
+    print("\nBuild the model ...")
+    model = keras.Sequential()
+    model.add(keras.layers.Flatten(input_shape=(16, 1)))
+    model.add(keras.layers.Dense(128, activation='relu'))
+    model.add(keras.layers.Dense(26, activation='softmax'))
+    return model
+
+
+def compile_the_model(model):
+    """Configure the model for training and return it.
+
+    Args:
+        model: Object exposing a Keras-style ``compile`` method.
+
+    The settings passed to ``model.compile`` are:
+        * optimizer: 'adam'
+        * loss: 'sparse_categorical_crossentropy'
+        * metrics: ['accuracy']
+
+    Returns:
+        The same model object, after ``compile`` was called on it.
+    """
+
+    print("\nCompile the model ...")
+    settings = {
+        "optimizer": 'adam',
+        "loss": 'sparse_categorical_crossentropy',
+        "metrics": ['accuracy'],
+    }
+    model.compile(**settings)
+    return model
+
+
+def training_the_model(model, train_images, train_labels, epochs):
+    """Fit the model on the training data and return it.
+
+    Args:
+        model: Object exposing a Keras-style ``fit`` method.
+        train_images: Training inputs, passed to ``fit`` as first argument.
+        train_labels: Expected labels, passed to ``fit`` as second argument.
+        epochs: Forwarded to ``fit`` as the ``epochs`` keyword.
+
+    Returns:
+        The same model object, after ``fit`` was called on it.
+    """
+
+    print("\nTraining the model ...")
+    fit_options = {"epochs": epochs}
+    model.fit(train_images, train_labels, **fit_options)
+    return model
+
+
+if __name__ == "__main__":
+
+    # Data file location and the sizes of the train/test split
+    data_file = './letter-recognition.data'
+    train, test = 16000, 4000
+
+    data = get_data(data_file, train, test)
+
+    # Only the model work in main() is timed, not the data loading.
+    t = time()
+    main(data)
+    elapsed = round(time() - t, 1)
+    print(f"Calcul en {elapsed} secondes")