feat: add learning program
main.py (54 changed lines)
@@ -1 +1,53 @@
-import network
+from network import *
+
+
+def data(size: int, max_val: int):
+    def int_to_bits(n: int):
+        return [(n >> i) & 1
+                for i in reversed(range(size))
+                ]
+
+    return [(int_to_bits(i), [i / max_val])
+            for i in range(max_val + 1)
+            ]
+
+
+def train_network(network: NeuralNetwork, epochs=10000, learning_rate=0.1,
+                  verbose: bool = False, size_data: int = 8, max_val: int = 255):
+
+    train_data = data(size_data, max_val)
+
+    for epoch in range(epochs):
+        for bits, target in train_data:
+            network.backward(bits, target, learning_rate)
+
+        # reports the squared error on the last sample seen this epoch
+        if verbose and epoch % 100 == 0:
+            output = network.forward(bits)[0]
+            loss = (output - target[0]) ** 2
+
+            print(f"Epoch: {epoch}, Loss: {loss:.6f}")
+
+
+def main():
+    size = 8
+    max_val = (1 << size) - 1
+
+    network = NeuralNetwork([8, 16, 1])
+
+    print("Start training...")
+    train_network(network, verbose=True, size_data=size, epochs=45_000)
+    print("End training...")
+
+    while True:
+        string = input("Enter an 8-bit number (ex: 01101001) or 'quit' to close: ") \
+            .strip().lower()
+
+        if string == 'quit': break
+        if len(string) != 8 or any(char not in '01' for char in string):
+            print("Error: please enter exactly 8 bits (only 0 or 1).")
+            continue
+
+        bits_input = [int(char) for char in string]
+        output = network.forward(bits_input)[0] * max_val
+
+        print(f"Estimated value: {output} (approx: {round(output)})\n")
+
+
+if __name__ == "__main__":
+    main()
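For reference, data() pairs each integer's fixed-width bit pattern with its value scaled into [0, 1]. A quick standalone check, using small illustrative arguments (size=3, max_val=7, not the commit's defaults), shows the shape of one training pair:

# Minimal sketch of what data() produces, assuming the definition above;
# size=3 and max_val=7 are illustrative values only.
def int_to_bits(n, size=3):
    return [(n >> i) & 1 for i in reversed(range(size))]

pairs = [(int_to_bits(i), [i / 7]) for i in range(8)]
print(pairs[5])  # ([1, 0, 1], [0.7142857142857143]) -> 0b101 == 5, scaled as 5/7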
network.py (20 changed lines)
@@ -30,14 +30,16 @@ class Neuron:
         # last output sigmoid(z)
         self.last_output = 0
 
-    def forward(self, x):
+    def forward(self, x, activate=True):
         """
         x : list of input values to the neuron
         """
         # computes the weighted sum of the inputs and adds the bias
         self.z = sum(w * xi for w, xi in zip(self.weight, x)) + self.bias
         # normalize the output between 0 and 1
-        self.last_output = sigmoid(self.z)
+        if activate: self.last_output = sigmoid(self.z)
+        else: self.last_output = self.z
 
         return self.last_output
 
     # adjust weight and bias of neuron
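This hunk relies on the sigmoid and sigmoid_deriv helpers defined elsewhere in network.py and not shown in this diff. A sketch assuming they follow the standard logistic definitions:

import math

# Standard logistic sigmoid and its derivative; an assumption about
# network.py's helpers, which this hunk references but does not show.
def sigmoid(z):
    return 1 / (1 + math.exp(-z))

def sigmoid_deriv(z):
    s = sigmoid(z)
    return s * (1 - s)  # d/dz sigmoid(z) = sigmoid(z) * (1 - sigmoid(z))

print(sigmoid(0.0))        # 0.5
print(sigmoid_deriv(0.0))  # 0.25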
@@ -54,6 +56,9 @@ class Neuron:
         dy_dz = sigmoid_deriv(self.z)
         # dz/dw = x
         dz_dw = x
+
+        assert len(dz_dw) >= self.isize, "input has fewer values than the neuron's input size"
+
         # dz/db = 1
         dz_db = 1
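The dy_dz, dz_dw, and dz_db factors implement the chain rule for a single neuron: with z = w · x + b and y = sigmoid(z), the gradient for each weight is dC/dw_i = dC/dy · dy/dz · dz/dw_i, where dz/dw_i = x_i and dz/db = 1. A hedged standalone sketch of how the factors combine (weight_gradients is a hypothetical helper, not part of the repo):

# How the chain-rule factors above combine for the weights of one neuron.
def weight_gradients(dcost_dy, dy_dz, x):
    return [dcost_dy * dy_dz * xi for xi in x]  # one gradient per weight

print(weight_gradients(0.5, 0.25, [1, 0, 1]))  # [0.125, 0.0, 0.125]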
@@ -78,10 +83,10 @@ class Layer:
         # list of neurons
         self.neurons = [Neuron(input_size) for _ in range(output_size)]
 
-    def forward(self, inputs):
+    def forward(self, inputs, activate=True):
         self.inputs = inputs
         # give the same inputs to each neuron in the layer
-        return [neuron.forward(inputs) for neuron in self.neurons]
+        return [neuron.forward(inputs, activate) for neuron in self.neurons]
 
     # adjust weight and bias of the layer (all neurons)
     def backward(self, dcost_dy_list, learning_rate=0.1):
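Layer.forward broadcasts the same input vector to every neuron and collects one output per neuron, which is how the [8, 16, 1] network in main.py maps 8 inputs to 16 hidden activations to 1 output. A toy illustration of that fan-out, with made-up weights and none of the repo's classes:

# Every neuron sees the same inputs and contributes one output.
weights = [[0.1, 0.2], [0.3, -0.4], [-0.5, 0.6]]  # 3 neurons, 2 inputs each
biases = [0.0, 0.1, -0.1]
inputs = [1.0, 2.0]

outputs = [sum(w * x for w, x in zip(ws, inputs)) + b
           for ws, b in zip(weights, biases)]
print(outputs)  # [0.5, -0.4, 0.6] -> one pre-activation per neuron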
@@ -105,8 +110,9 @@ class NeuralNetwork:
 
     def forward(self, inputs):
         output = inputs
-        for layer in self.layers:
-            output = layer.forward(output)
+        for i, layer in enumerate(self.layers):
+            activate = (i != len(self.layers) - 1)  # skip the sigmoid on the last layer
+            output = layer.forward(output, activate=activate)
         return output
 
     def backward(self, inputs, targets, learning_rate=0.1):
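Making the last layer linear matters for this regression task: a sigmoid output is confined to (0, 1) and saturates near the ends, so the target for 255 (255/255 == 1.0) is only reachable asymptotically and its gradient vanishes. A small numeric illustration of that saturation:

import math

# Sigmoid can only approach 1.0, and its gradient collapses as it gets close.
z = 5.0
s = 1 / (1 + math.exp(-z))
print(s)            # ~0.9933, still short of the target 1.0
print(s * (1 - s))  # ~0.0066, tiny gradient -> slow learning near saturation
# A linear output (y = z) has gradient 1 everywhere and can hit 1.0 exactly.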
@@ -117,7 +123,7 @@ class NeuralNetwork:
         output = self.forward(inputs)
 
         # computes the initial gradient of the cost function for each neuron
-        # by using Mean Squared Error: dC/dy = 2 * (output - target)
+        # using the Mean Squared Error's derivative: dC/dy = 2 * (output - target)
         dcost_dy_list = [2 * (o - t) for o, t in zip(output, targets)]
 
         grad = dcost_dy_list
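The corrected comment refers to the derivative of the squared error C = (y - t)^2 with respect to the output y. A quick finite-difference check confirms dC/dy = 2 * (y - t):

# Finite-difference check that d/dy (y - t)^2 == 2 * (y - t).
y, t, eps = 0.8, 0.5, 1e-6
numeric = (((y + eps) - t) ** 2 - ((y - eps) - t) ** 2) / (2 * eps)
analytic = 2 * (y - t)
print(numeric, analytic)  # both ~0.6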