Initial work on genetic algorithm for tris

2022-12-22 21:35:16 +01:00 · 2022-12-22 21:35:16 +01:00 · 1f875e6f2b
parent d6e5e148aa
commit 1f875e6f2b
6 changed files with 418 additions and 60 deletions
--- a/src/main.nim
+++ b/src/main.nim
@ -3,7 +3,11 @@ import nn/util/activations
 import nn/util/losses


-var net = newNeuralNetwork(@[2, 3, 2], activationFunc=newActivation(sigmoid, func (x, y: float): float = 0.0), 
-                          lossFunc=newLoss(mse, mse), weightRange=(-1.0, +1.0), learnRate=0.05)
-var prediction = net.predict(newMatrix[float](@[2.7, 3.0]))
-echo prediction
+const InitialSize = 50
+
+
+var networks: seq[NeuralNetwork] = @[]
+for _ in 0..<InitialSize:
+    networks.add(newNeuralNetwork(@[9, 8, 10, 9], activationFunc=newActivation(sigmoid, func (x, y: float): float = 0.0), 
+                          lossFunc=newLoss(mse, func (x, y: float): float = 0.0), weightRange=(-1.0, +1.0), learnRate=0.05))
+
--- a/src/nn/layer.nim
+++ b/src/nn/layer.nim
@ -74,10 +74,12 @@ proc compute*(self: Layer, data: Matrix[float]): Matrix[float] =
    ## Computes the output of a given layer with
    ## the given input data and returns it as a
    ## one-dimensional array
-    result = ((self.weights * data).sum() + self.biases).apply(self.activation.function, axis= -1)
+    result = (self.weights.dot(data).sum() + self.biases).apply(self.activation.function, axis= -1)


-proc cost*(self: Layer, x: Matrix[float], Y: Matrix[float]): float =
+proc cost*(self: Layer, x, y: Matrix[float]): float =
    ## Returns the total cost of this layer
-    
+    for i in 0..x.shape.cols:
+        result += self.loss.function(x[0, i], y[0, i])
+    result /= float(x.shape.cols)
    
--- a/src/nn/network.nim
+++ b/src/nn/network.nim
@ -26,8 +26,9 @@ import std/strformat

 type 
    NeuralNetwork* = ref object
-        ## A generic neural network
-        layers*: seq[Layer]
+        ## A generic feed-forward 
+        ## neural network
+        layers: seq[Layer]


 proc newNeuralNetwork*(layers: seq[int], activationFunc: Activation, lossFunc: Loss, learnRate: float, 
@ -57,3 +58,10 @@ proc classify*(self: NeuralNetwork, data: Matrix[float]): int =
    ## Performs a prediction and returns the label
    ## with the highest likelyhood
    result = maxIndex(self.predict(data).raw[])
+
+
+proc cost*(self: NeuralNetwork, x, y: Matrix[float]): float =
+    ## Returns the total average cost of the network
+    for layer in self.layers:
+        result += layer.cost(x, y)
+    result /= float(self.layers.len())
--- a/src/nn/util/matrix.nim
+++ b/src/nn/util/matrix.nim
@ -13,7 +13,10 @@
 # limitations under the License.

 from std/strformat import `&`
-from std/sequtils import zip
+import std/random
+
+
+randomize()


 type
@ -34,8 +37,8 @@ proc getSize(shape: tuple[rows, cols: int]): int =
    ## Helper to get the size required for the
    ## underlying data array for a matrix of the
    ## given shape
-    if shape.cols == 0:
-        return shape.rows
+    if shape.rows == 0:
+        return shape.cols
    return shape.cols * shape.rows


@ -53,7 +56,7 @@ proc newMatrix*[T](data: seq[T]): Matrix[T] =
    result.order = RowMajor


-proc newMatrix*[T](data: seq[seq[T]], order: MatrixOrder = RowMajor): Matrix[T] {.raises: [ValueError].} =
+proc newMatrix*[T](data: seq[seq[T]], order: MatrixOrder = RowMajor): Matrix[T] =
    ## Initializes a new matrix from a given 
    ## 2D sequence
    new(result)
@ -81,12 +84,52 @@ proc newMatrix*[T](data: seq[seq[T]], order: MatrixOrder = RowMajor): Matrix[T]
                idx = col


-proc zeros*[T](shape: tuple[rows, cols: int], order: MatrixOrder = RowMajor): Matrix[T] =
+proc zeros*[T: int | float](shape: tuple[rows, cols: int], order: MatrixOrder = RowMajor): Matrix[T] =
    ## Creates a new matrix of the given shape
    ## filled with zeros
    new(result)
    new(result.data)
    result.data[] = @[]
+    let size = shape.getSize()
+    result.shape = shape
+    when T is int:
+        for _ in 0..<size:
+            result.data[].add(0)
+    when T is float:
+        for _ in 0..<size:
+            result.data[].add(0.0)
+
+
+proc ones*[T: int | float](shape: tuple[rows, cols: int], order: MatrixOrder = RowMajor): Matrix[T] =
+    ## Creates a new matrix of the given shape
+    ## filled with ones
+    new(result)
+    new(result.data)
+    result.data[] = @[]
+    let size = shape.getSize()
+    result.shape = shape
+    when T is int:
+        for _ in 0..<size:
+            result.data[].add(1)
+    when T is float:
+        for _ in 0..<size:
+            result.data[].add(1.0)
+
+proc rand*[T: int | float](shape: tuple[rows, cols: int], order: MatrixOrder = RowMajor): Matrix[T] =
+    ## Creates a new matrix of the given shape
+    ## filled with random values between 0 and
+    ## 1
+    new(result)
+    new(result.data)
+    result.data[] = @[]
+    let size = shape.getSize()
+    result.shape = shape
+    when T is int:
+        for _ in 0..<size:
+            result.data[].add(rand(0..1))
+    when T is float:
+        for _ in 0..<size:
+            result.data[].add(rand(0.0..1.0))


 # Simple one-line helpers and forward declarations
@ -105,7 +148,7 @@ func getIndex[T](self: Matrix[T], row, col: int): int =
        result = col * self.shape.rows + row


-proc `[]`*[T](self: Matrix[T], row, col: int): T {.raises: [IndexDefect, ValueError].} =
+proc `[]`*[T](self: Matrix[T], row, col: int): T =
    ## Gets the element the given row and
    ## column into the matrix
    var idx = self.getIndex(row, col)
@ -115,7 +158,7 @@ proc `[]`*[T](self: Matrix[T], row, col: int): T {.raises: [IndexDefect, ValueEr
    return self.data[idx]


-proc `[]`*[T](self: Matrix[T], row: int): MatrixView[T] {.raises: [IndexDefect, ValueError].} =
+proc `[]`*[T](self: Matrix[T], row: int): MatrixView[T] =
    ## Gets a single row in the matrix. No data copies
    ## occur and a view into the original matrix is
    ## returned
@ -128,7 +171,7 @@ proc `[]`*[T](self: Matrix[T], row: int): MatrixView[T] {.raises: [IndexDefect,
    result.row = row


-proc `[]`*[T](self: MatrixView[T], col: int): T {.raises: [IndexDefect, ValueError].} =
+proc `[]`*[T](self: MatrixView[T], col: int): T =
    ## Gets the element the given row into
    ## the matrix view
    var idx = self.m.getIndex(self.row, col)
@ -138,7 +181,7 @@ proc `[]`*[T](self: MatrixView[T], col: int): T {.raises: [IndexDefect, ValueErr
    result = self.m.data[idx]


-proc `[]=`*[T](self: Matrix[T], row, col: int, val: T) {.raises: [IndexDefect, ValueError].} =
+proc `[]=`*[T](self: Matrix[T], row, col: int, val: T) =
    ## Sets the element at the given row and
    ## column into the matrix to value val
    var idx = self.getIndex(row, col)
@ -148,7 +191,7 @@ proc `[]=`*[T](self: Matrix[T], row, col: int, val: T) {.raises: [IndexDefect, V
    self.data[idx] = val


-proc `[]=`*[T](self: MatrixView[T], col: int, val: T) {.raises: [IndexDefect, ValueError].} =
+proc `[]=`*[T](self: MatrixView[T], col: int, val: T) =
    ## Sets the element at the given row 
    ## into the matrix view to the value 
    ## val
@ -161,7 +204,7 @@ proc `[]=`*[T](self: MatrixView[T], col: int, val: T) {.raises: [IndexDefect, Va
    

 # Shape management
-proc reshape*[T](self: Matrix[T], shape: tuple[rows, cols: int]): Matrix[T] {.raises: [ValueError].} =
+proc reshape*[T](self: Matrix[T], shape: tuple[rows, cols: int]): Matrix[T] =
    ## Reshapes the given matrix. No data copies occur
    when not defined(release):
        if shape.getSize() != self.data[].len():
@ -170,7 +213,7 @@ proc reshape*[T](self: Matrix[T], shape: tuple[rows, cols: int]): Matrix[T] {.ra
    result.shape = shape


-proc reshape*[T](self: Matrix[T], rows, cols: int): Matrix[T] {.raises: [ValueError].} =
+proc reshape*[T](self: Matrix[T], rows, cols: int): Matrix[T] =
    ## Reshapes the given matrix. No data copies occur
    result = self.reshape((rows, cols))

@ -183,11 +226,14 @@ proc transpose*[T](self: Matrix[T]): Matrix[T] =


 proc flatten*[T](self: Matrix[T]): Matrix[T] =
-    ## Flattens the matrix into a vector. No
-    ## data copies occur
-    result = self.dup()
-    result.data = self.data
-    result = result.reshape(0, len(self))
+    ## Flattens the matrix into a vector
+    new(result)
+    new(result.data)
+    for row in self:
+        for element in row:
+            result.data[].add(element)
+    result.order = RowMajor
+    result.shape = (0, len(self))


 # Helpers for fast applying of operations along an axis
@ -218,7 +264,7 @@ proc apply*[T](self: Matrix[T], op: proc (a, b: T): T {.noSideEffect.}, b: T, co


 proc apply*[T](self: Matrix[T], op: proc (a: T): T {.noSideEffect.}, copy: bool = false, axis: int): Matrix[T] =
-    ## Applies a binary operator to every
+    ## Applies a unary operator to every
    ## element in the given axis of the
    ## given matrix (0 = rows, 1 = columns, 
    ## -1 = both). No copies occur unless 
@ -362,6 +408,7 @@ proc dup*[T](self: MatrixView[T]): MatrixView[T] =
    new(result)
    result.m = self.m
    result.shape = self.shape
+    result.row = self.row

 # matrix/scalar operations

@ -407,7 +454,7 @@ proc `+`*[T](a, b: MatrixView[T]): Matrix[T] =
        result.data[].add(a[i] + b[i])


-proc `+`*[T](a, b: Matrix[T]): Matrix[T] {.raises: [ValueError].} =
+proc `+`*[T](a, b: Matrix[T]): Matrix[T] =
    when not defined(release):
        if a.shape.rows > 0 and b.shape.rows > 0 and a.shape != b.shape:
            raise newException(ValueError, &"incompatible argument shapes for addition")
@ -445,7 +492,7 @@ proc `*`*[T](a, b: MatrixView[T]): Matrix[T] =
        result.data[].add(a[i] * b[i])


-proc `*`*[T](a, b: Matrix[T]): Matrix[T] {.raises: [ValueError].} =
+proc `*`*[T](a, b: Matrix[T]): Matrix[T] =
    when not defined(release):
        if a.shape.rows > 0 and b.shape.rows > 0 and a.shape.cols != b.shape.rows:
            raise newException(ValueError, &"incompatible argument shapes for multiplication")
@ -468,6 +515,12 @@ proc `*`*[T](a, b: Matrix[T]): Matrix[T] {.raises: [ValueError].} =
                    for m in r1 * r2:
                        for element in m:
                            result.data[].add(element)
+        else:
+            for r1 in a:
+                for r2 in b:
+                    for m in r1 * r2:
+                        for element in m:
+                            result.data[].add(element)
    else:
        result = a[0] * b[0]

@ -521,7 +574,53 @@ proc `>=`*[T](a: Matrix[T], b: T): Matrix[bool] =
        result.data[].add(e >= b)


-proc `==`*[T](a, b: Matrix[T]): Matrix[bool] {.raises: [ValueError].} =
+proc `==`*[T](a: MatrixView[T], b: MatrixView[T]): Matrix[bool] =
+    when not defined(release):
+        if a.len() != b.len():
+            raise newException(ValueError, "invalid shapes for comparison")
+    new(result)
+    new(result.data)
+    result.shape = a.shape
+    result.order = RowMajor
+    result.data[] = newSeqOfCap[bool](result.shape.getSize())
+    var col = 0
+    while col < result.shape.cols:
+        result.data[].add(a[col] == b[col])
+        inc(col)
+
+
+proc `==`*[T](a: Matrix[T], b: MatrixView[T]): Matrix[bool] =
+    when not defined(release):
+        if a.shape.cols != b.len() or a.shape.rows > 0:
+            raise newException(ValueError, "invalid shapes for comparison")
+    return a[0] == b
+
+
+proc diag*[T](a: Matrix[T], diagonal: int): Matrix[T] =
+    ## Returns the chosen diagonal of the given
+    ## matrix as a linear array. Diagonal 0 means left, 
+    ## 1 means right
+    when not defined(release):
+        if a.shape.rows != a.shape.cols:
+            raise newException(ValueError, "only square matrices have diagonals")
+    var res = newSeqOfCap[T](a.shape.getSize())
+    case diagonal:
+        of 0:
+            for i in 0..<a.shape.rows:
+                res.add(a[i, i])
+        of 1:
+            for i in 0..<a.shape.rows:
+                res.add(a[i, a.shape.rows - i])
+        else:
+            when not defined(release):
+                raise newException(ValueError, &"invalid diagonal {diagonal} for matrix")
+            else:
+                discard
+    result = newMatrix(res)
+
+
+
+proc `==`*[T](a, b: Matrix[T]): Matrix[bool] =
    when not defined(release):
        if a.shape != b.shape:
            raise newException(ValueError, "can't compare matrices of different shapes")
@ -530,12 +629,14 @@ proc `==`*[T](a, b: Matrix[T]): Matrix[bool] {.raises: [ValueError].} =
    result.shape = a.shape
    result.order = RowMajor
    result.data[] = newSeqOfCap[bool](result.shape.getSize())
+    if a.shape.rows == 0:
+        result = a[0] == b[0]
    for r in 0..<a.shape.rows:
        for c in 0..<a.shape.cols:
            result.data[].add(a[r, c] == b[r, c])


-proc `>`*[T](a, b: Matrix[T]): Matrix[bool] {.raises: [ValueError].} =
+proc `>`*[T](a, b: Matrix[T]): Matrix[bool] =
    when not defined(release):
        if a.shape != b.shape:
            raise newException(ValueError, "can't compare matrices of different shapes")
@ -544,12 +645,14 @@ proc `>`*[T](a, b: Matrix[T]): Matrix[bool] {.raises: [ValueError].} =
    result.shape = a.shape
    result.order = RowMajor
    result.data[] = newSeqOfCap[bool](result.shape.getSize())
+    if a.shape.rows == 0:
+        result = a[0] > b[0]
    for r in 0..<a.shape.rows:
        for c in 0..<a.shape.cols:
            result.data[].add(a[r, c] > b[r, c])


-proc `>=`*[T](a, b: Matrix[T]): Matrix[bool] {.raises: [ValueError].} =
+proc `>=`*[T](a, b: Matrix[T]): Matrix[bool] =
    when not defined(release):
        if a.shape != b.shape:
            raise newException(ValueError, "can't compare matrices of different shapes")
@ -558,12 +661,14 @@ proc `>=`*[T](a, b: Matrix[T]): Matrix[bool] {.raises: [ValueError].} =
    result.shape = a.shape
    result.order = RowMajor
    result.data[] = newSeqOfCap[bool](result.shape.getSize())
+    if a.shape.rows == 0:
+        result = a[0] >= b[0]
    for r in 0..<a.shape.rows:
        for c in 0..<a.shape.cols:
            result.data[].add(a[r, c] >= b[r, c])


-proc `<=`*[T](a, b: Matrix[T]): Matrix[bool] {.raises: [ValueError].} =
+proc `<=`*[T](a, b: Matrix[T]): Matrix[bool] =
    when not defined(release):
        if a.shape != b.shape:
            raise newException(ValueError, "can't compare matrices of different shapes")
@ -572,6 +677,8 @@ proc `<=`*[T](a, b: Matrix[T]): Matrix[bool] {.raises: [ValueError].} =
    result.shape = a.shape
    result.order = RowMajor
    result.data[] = newSeqOfCap[bool](result.shape.getSize())
+    if a.shape.rows == 0:
+        result = a[0] <= b[0]
    for r in 0..<a.shape.rows:
        for c in 0..<a.shape.cols:
            result.data[].add(a[r, c] <= b[r, c])
@ -585,40 +692,49 @@ proc all*(a: Matrix[bool]): bool =
    return true


+proc any*(a: Matrix[bool]): bool =
+    # Helper for boolean comparisons
+    for e in a.data[]:
+        if e:
+            return true
+    return false
+
+
 # Specular definitions of commutative operators
-proc `<`*[T](a, b: Matrix[T]): Matrix[bool] {.raises: [ValueError].} = b > a
-proc `!=`*[T](a, b: Matrix[T]): Matrix[bool] {.raises: [ValueError].} = not a == b
-proc `*`*[T](a: Matrix[T], b: MatrixView[T]): Matrix[T] {.raises: [ValueError].} = b * a
+proc `<`*[T](a, b: Matrix[T]): Matrix[bool] = b > a
+proc `!=`*[T](a, b: Matrix[T]): Matrix[bool] = not a == b
+proc `*`*[T](a: Matrix[T], b: MatrixView[T]): Matrix[T] = b * a
 proc `==`*[T](a: T, b: Matrix[T]): Matrix[bool] = b == a
+proc `==`*[T](a: MatrixView[T], b: Matrix[T]): Matrix[bool] = b == a
 proc `!=`*[T](a: Matrix[T], b: T): Matrix[bool] = not a == b
 proc `!=`*[T](a: T, b: Matrix[T]): Matrix[bool] = not b == a


-proc toRowMajor*[T](self: Matrix[T]): Matrix[T] =
+proc toRowMajor*[T](self: Matrix[T], copy: bool = true): Matrix[T] =
    ## Converts a column-major matrix to a
-    ## row-major one
+    ## row-major one. Returns a copy unless
+    ## copy equals false
    if self.order == RowMajor:
-        return
-    self.order = RowMajor
-    let orig = self.data[]
-    self.data[] = @[]
-    var idx = 0
-    var col = 0
-    while col < self.shape.cols:
-        self.data[].add(orig[idx])
-        idx += self.shape.cols
-        if idx > orig.high():
-            inc(col)
-            idx = col
-    result = self
+        return self
+    if copy:
+        result = self.copy()
+    else:
+        result = self
+    result.order = RowMajor
+    for row in self:
+        for element in row:
+            self.data[].add(element)


-proc toColumnMajor*[T](self: Matrix[T]): Matrix[T] =
+proc toColumnMajor*[T](self: Matrix[T], copy: bool = true): Matrix[T] =
    ## Converts a row-major matrix to a
    ## column-major one
-    new(result)
    if self.order == ColumnMajor:
-        return
+        return self
+    if copy:
+        result = self.copy()
+    else:
+        result = self
    self.order = ColumnMajor
    let orig = self.data[]
    self.data[] = @[]
@ -674,7 +790,7 @@ proc `$`*[T](self: MatrixView[T]): string =
 proc `$`*[T](self: Matrix[T]): string =
    ## Stringifies the matrix
    if self.shape.rows == 0:
-        return $self[0]
+        return $(self[0])
    result &= "["
    for i, row in self:
        result &= "["
@ -693,10 +809,34 @@ proc `$`*[T](self: Matrix[T]): string =
 proc dot*[T](self, other: Matrix[T]): Matrix[T] =
    ## Computes the dot product of the two
    ## input matrices
-    when not defined(release):
-        if a.shape.cols != b.shape.rows:
-            raise newException(ValueError, &"incompatible argument shapes for dot product")
-    # TODO
+    if self.shape.rows > 1 and other.shape.rows > 1:
+        when not defined(release):
+            if self.shape.rows != other.shape.cols:
+                raise newException(ValueError, &"incompatible argument shapes for dot product")
+        result = zeros[T]((self.shape.rows, other.shape.cols))
+        echo self
+        var other = other.transpose()
+        echo other
+        for i in 0..<result.shape.rows:
+            for j in 0..<result.shape.cols:
+                result[i, j] = (self[i] * other[j]).sum()
+    elif self.shape.rows > 1:
+        when not defined(release):
+            if self.shape.cols != other.shape.cols:
+                raise newException(ValueError, &"incompatible argument shapes for dot product")
+        result = zeros[T]((0, self.shape.rows))
+        for i in 0..<result.shape.cols:
+            result[0, i] = (self[i] * other[0]).sum()
+    elif other.shape.rows > 1:
+        when not defined(release):
+            if self.shape.cols != other.shape.cols:
+                raise newException(ValueError, &"incompatible argument shapes for dot product")
+        result = zeros[T]((0, self.shape.cols))
+        var other = other.transpose()
+        for i in 0..<result.shape.cols:
+            result[0, i] = (self[0] * other[i]).sum()
+    else:
+        return self * other


 proc where*[T](cond: Matrix[bool], x, y: Matrix[T]): Matrix[T] =
@ -721,6 +861,50 @@ proc where*[T](cond: Matrix[bool], x, y: Matrix[T]): Matrix[T] =
        inc(row)
        col = 0

+
+# Just a helper to avoid mistakes and so that x.where(x > 10, y) works as expected
+proc where*[T](self: Matrix[T], cond: Matrix[bool], other: Matrix[T]): Matrix[T] = cond.where(self, other)
+
+
+proc max*[T](self: Matrix[T]): T =
+    ## Returns the largest element
+    ## into the matrix
+    var m: T = self[0, 0]
+    for row in self:
+        for element in row:
+            if m < element:
+                m = element
+    return m
+
+
+proc argmax*[T](self: Matrix[T]): T =
+    ## Returns the index largest element
+    ## into the matrix
+    var m: T = self[0, 0]
+    var 
+        row = 0
+        col = 0
+    while row < self.shape.rows:
+        while col < self.shape.cols:
+            if self[row, col] > m:
+                m = self[row, col]
+    if self.shape.rows == 0:
+        while col < self.shape.cols:
+            if self[0, col] > m:
+                m = self[0, col]
+            inc(col)
+    return m
+
+
+proc contains*[T](self: Matrix[T], e: T): bool =
+    ## Returns wherher the matrix contains
+    ## the element e
+    for row in self:
+        for element in row:
+            if element == e:
+                return true
+    return false
+
 when isMainModule:
    import math

@ -729,6 +913,7 @@ when isMainModule:

    var m = newMatrix[int](@[@[1, 2, 3], @[4, 5, 6]])
    var k = m.transpose()
+    assert k[2, 1] == m[1, 2], "transpose mismatch"
    assert all(m.transpose() == k), "transpose mismatch"
    assert k.sum() == m.sum(), "element sum mismatch"
    assert all(k.sum(axis=1) == m.sum(axis=0)), "sum over axis mismatch"
@ -741,4 +926,9 @@ when isMainModule:
    assert (m * z).sum() == 46, "matrix multiplication mismatch"
    assert all(z * z == z.apply(pow, 2, axis = -1, copy=true)), "matrix multiplication mismatch"
    var x = newMatrix[int](@[0, 1, 2, 3, 4, 5, 6, 7, 8, 9])
-    assert (x < 5).where(x, x * 10).sum() == 360, "where mismatch"
+    assert (x < 5).where(x, x * 10).sum() == 360, "where mismatch"
+    assert all((x < 5).where(x, x * 10) == x.where(x < 5, x * 10)), "where mismatch"
+    assert x.max() == 9, "max mismatch"
+    assert x.argmax() == 9, "argmax mismatch"
+    discard newMatrix[int](@[12, 23]).dot(newMatrix[int](@[@[11, 22], @[33, 44]]))
+    discard newMatrix[int](@[@[1, 2, 3], @[2, 3, 4]]).dot(newMatrix[int](@[1, 2, 3]))
--- a/src/nn/util/preprocessing.nim
+++ b/src/nn/util/preprocessing.nim
@ -0,0 +1,76 @@
+# Copyright 2022 Mattia Giambirtone
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+## Various data preprocessing tools
+
+import matrix
+
+
+import strformat
+import sets
+
+
+type
+    LabelEncoder* = ref object
+        ## An encoder to assign a numerical value in the
+        ## range from 0 to n_labels - 1 to the labels
+        # of some categorical data, reversibly
+        isFit: bool
+        labels: Matrix[string]
+
+
+proc newLabelEncoder*: LabelEncoder =
+    ## Initializes a new LabelEncoder object
+    new(result)
+
+
+proc toOrderedSet[T](m: Matrix[T]): OrderedSet[T] =
+    result = initOrderedSet[T]()
+    for row in m:
+        for element in row:
+            result.incl(element)
+
+
+proc fit*(self: LabelEncoder, labels: Matrix[string]) =
+    # Fits the encoder to the given labels
+    var lbl: seq[string] = @[]
+    for label in toOrderedSet(labels):
+        lbl.add(label)
+    self.labels = newMatrix(lbl)
+    self.is_fit = true
+
+
+proc transform*(self: LabelEncoder, labels: Matrix[string]): Matrix[int] =
+    ## Transforms a vector of labels into a vector of encoded
+    ## integers. Duplicate labels are assigned the same integer
+    assert self.isFit, "The estimator must be fit!"
+    var res: seq[int] = @[]
+    for row in labels:
+        for label in row: 
+            if label notin self.labels:
+                raise newException(ValueError, &"Unknown label '{label}'")
+            res.add(self.labels.raw[].find(label))
+    result = newMatrix(res)
+
+
+proc reverseTransform*(self: LabelEncoder, labels: Matrix[int]): Matrix[string] =
+    ## Reverses the transformation of the integer labels back to a string
+    assert self.is_fit, "The estimator must be fit!"
+    var res: seq[string] = @[]
+    for row in labels:
+        for label in row:
+            if label notin 0..<self.labels.len():
+                raise newException(ValueError, &"Unknown encoded label '{label}'")
+            res.add(self.labels[0, label])
+    result = newMatrix(res)
--- a/src/nn/util/tris.nim
+++ b/src/nn/util/tris.nim
@ -0,0 +1,78 @@
+import matrix
+
+
+type 
+    TileKind* = enum
+        ## A tile enumeration kind
+        Empty = 0,
+        Self,
+        Enemy
+    GameStatus* = enum
+        ## A game status enumeration
+        Playing,
+        Win,
+        Lose,
+        Draw
+    TrisGame* = ref object
+        map*: Matrix[int]
+
+
+proc newTrisGame*: TrisGame =
+    ## Creates a new TrisGame object
+    new(result)
+    result.map = zeros[int]((3, 3))
+
+
+proc get*(self: TrisGame): GameStatus =
+    ## Returns the game status
+    # Checks for rows
+    for _, row in self.map:
+        if all(row == newMatrix[int](@[1, 1, 1])):
+            return Win
+        elif all(row == newMatrix[int](@[2, 2, 2])):
+            return Lose
+    # Checks for columns
+    for _, col in self.map.transpose:
+        if all(col == newMatrix[int](@[1, 1, 1])):
+            return Win
+        elif all(col == newMatrix[int](@[2, 2, 2])):
+            return Lose
+    # Checks for diagonals
+    for i in 0..<2:
+        if all(self.map.diag(i) == newMatrix[int](@[1, 1, 1])):
+            return Win
+        elif all(self.map.diag(i) == newMatrix[int](@[2, 2, 2])):
+            return Lose
+    # No check was successful and there's no empty slots: draw!
+    if not any(self.map == 0):
+        return Draw
+    # There are empty slots and no one won yet, we're still in game!
+    return Playing
+
+
+proc `$`*(self: TrisGame): string =
+    ## Stringifies self
+    return $self.map
+
+
+proc place*(self: TrisGame, tile: TileKind, x, y: int) =
+    ## Places a tile onto the playing board
+    self.map[x, y] = int(tile)
+
+
+when isMainModule:
+    var game = newTrisGame()
+    game.place(Enemy, 0, 0)
+    game.place(Enemy, 0, 1)
+    assert game.get() == Playing
+    game.place(Enemy, 0, 2)
+    assert game.get() == Lose
+    game.place(Self, 0, 2)
+    assert game.get() == Playing
+    game.place(Enemy, 1, 1)
+    game.place(Enemy, 2, 2)
+    assert game.get() == Lose
+    game.place(Self, 2, 2)
+    assert game.get() == Playing
+    game.place(Self, 1, 2)
+    assert game.get() == Win