New Layers, aux. functions and built-in model Vision Transformer #11

Open · wants to merge 4 commits into master
1 change: 1 addition & 0 deletions .gitignore
@@ -189,3 +189,4 @@ dmypy.json

# End of https://www.toptal.com/developers/gitignore/api/python,emacs

+data/
8 changes: 8 additions & 0 deletions .idea/.gitignore
37 changes: 37 additions & 0 deletions .idea/inspectionProfiles/Project_Default.xml
6 changes: 6 additions & 0 deletions .idea/inspectionProfiles/profiles_settings.xml
15 changes: 15 additions & 0 deletions .idea/joey2.0.iml
4 changes: 4 additions & 0 deletions .idea/misc.xml
8 changes: 8 additions & 0 deletions .idea/modules.xml
6 changes: 6 additions & 0 deletions .idea/vcs.xml
16 changes: 15 additions & 1 deletion README.md
@@ -8,6 +8,7 @@ Joey is a machine learning framework running on top of [Devito](https://github.c
* A backward pass through a neural network with batch processing
* Producing backpropagation equations automatically based on the list of layers in a neural network (only a loss function must be defined manually by the user)
* Training a neural network with PyTorch optimizers
+* Instantiating a transformer neural network for image classification

Unlike other machine learning frameworks, Joey generates and compiles optimized low-level code on the spot (using Devito) for both standalone layers and full neural networks.

@@ -16,10 +17,23 @@ Unlike other machine learning frameworks, Joey generates and compiles an optimiz
* 2D max pooling (other types of 2D pooling can be implemented by the user by extending the `Pooling` abstract class)
* Full connection
* Flattening (an internal layer turning 2D data with channels into a 1D vector or 2D matrix, depending on the batch size)
+* 3D full connection
+* Einsum function
+* Dropout (1, 2, 3 and 4 dimensions)
+* 2D norm
+* 3D norm
+* 3D and 4D softmax functions

+## Supported modules
+* MultiHeadAttention
+* VisionEncoder
+
+## Built-in models
+* ViT (Vision Transformer)

## Supported activation functions
* ReLU
-* Softmax (only via the `FullyConnectedSoftmax` class)
+* Softmax (via the `FullyConnectedSoftmax` class or the `Softmax3d` / `Softmax4d` functions)
* Dummy (`f(x) = x`)

Other activation functions can be implemented by extending the `Activation` abstract class.
7 changes: 7 additions & 0 deletions examples/ViT_Running.py
@@ -0,0 +1,7 @@







Binary file added examples/resources/model_weights_ViT
Binary file not shown.
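The contents of `examples/ViT_Running.py` are not rendered above, so the following is only a hypothetical sketch of how the new built-in model and the checked-in weights might be exercised. The `ViT` import path, its constructor arguments, and the weights-file format are all assumptions, not confirmed by this diff.

# Hypothetical sketch -- every name below except the weights path is assumed.
import torch
from joey import ViT  # assumed export of the new built-in model

# Constructor arguments are illustrative; the real signature is not shown here.
model = ViT(image_size=32, patch_size=4, num_classes=10, generate_code=True)

# The PR checks in examples/resources/model_weights_ViT as a binary blob; if it
# is a torch-serialized object (an assumption), it could be loaded like this:
weights = torch.load('examples/resources/model_weights_ViT')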
98 changes: 77 additions & 21 deletions joey/base.py
@@ -1,5 +1,7 @@
from abc import ABC, abstractmethod
-from devito import Operator, Function, dimensions
+
+import numpy as np
+from devito import Operator, Function, dimensions, SpaceDimension
from joey import Activation
from joey import activation as activ
from numpy import array
@@ -8,21 +10,60 @@
dim_index = 0


-def default_name_allocator():
+def default_name_allocator(name=''):
     global index
-    name = 'f' + str(index)
+    _name = 'f' + name + str(index)
     index += 1
-    return name
+    return _name


def default_dim_allocator(count):
global dim_index
-    names = ''
+    names = []
     for i in range(count):
-        names += 'd' + str(dim_index) + ' '
+        names.append('d' + str(dim_index))
         dim_index += 1
-    names = names[:-1]
-    return dimensions(names)
+    return [SpaceDimension(n) for n in names]
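Since both helpers changed behavior, a quick illustration (assuming the module-level `index` and `dim_index` counters start at zero, as defined above):

# Behavior of the patched helpers defined above.
dims = default_dim_allocator(3)
print([d.name for d in dims])          # ['d0', 'd1', 'd2'], now SpaceDimension objects

# The optional tag is spliced in between the 'f' prefix and the counter:
print(default_name_allocator())        # 'f0'
print(default_name_allocator('bias'))  # 'fbias1'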


+class Module(ABC):
+    @property
+    def input(self):
+        """A Function object corresponding to an input data array."""
+        return self._I
+
+    @property
+    def result(self):
+        """A Function object corresponding to a result array."""
+        return self._R
+
+    @abstractmethod
+    def equations(self) -> (list, list):
+        pass
+
+    def init_params(self):
+        if self.kernel is not None:
+            self.kernel.data[:] = \
+                np.random.rand(*self.kernel.shape) - 0.5
+
+        if self.bias is not None:
+            self.bias.data[:] = np.random.rand(*self.bias.shape) - 0.5
+
+    @abstractmethod
+    def _allocate(self, **kwargs) -> (Function, Function, Function,
+                                      Function, Function, Function,
+                                      Function):
+        pass
+
+    def execute(self, kernel_data=None, input_data=None, bias=None) -> array:
+        self._op.apply(**self._arg_dict)
+        return self._R.data
+
+    @abstractmethod
+    def backprop_equations(self, prev_layer, next_layer) -> (list, list):
+        pass


class Layer(ABC):
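The new `Module` ABC mirrors the `Layer` interface without the kernel/bias bookkeeping. A minimal, hypothetical subclass sketch follows; the class, its shapes, and its identity equation are illustrative only, and code generation via `self._op` is omitted:

# Hypothetical Module subclass; relies on the allocators defined above.
from devito import Eq, Grid, Function

class IdentityModule(Module):
    def _allocate(self, **kwargs):
        grid = Grid(shape=(4, 4))
        self._I = Function(name=default_name_allocator('in'), grid=grid)
        self._R = Function(name=default_name_allocator('out'), grid=grid)

    def equations(self):
        # Copy the input straight through to the result array.
        return [Eq(self._R, self._I)], []

    def backprop_equations(self, prev_layer, next_layer):
        # The identity has no trainable state, so nothing to propagate.
        return [], []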
@@ -62,7 +103,7 @@ def __init__(self, kernel_size,
input_size, activation=activ.Dummy(),
name_allocator_func=default_name_allocator,
dim_allocator_func=default_dim_allocator,
-                 generate_code=False):
+                 generate_code=False, **kwargs):
if activation is None:
activation = activ.Dummy()

@@ -71,12 +112,14 @@ def __init__(self, kernel_size,
"its subclass")

self._activation = activation

-        self._K, self._I, self._R, self._bias, self._KG, self._RG, \
-            self._biasG = self._allocate(kernel_size,
-                                         input_size,
-                                         name_allocator_func,
-                                         dim_allocator_func)
+        self.propagate = True
+        self.back_propagate = True
+        self.name = kwargs.get('name', '')
+        self._K, self._I, self._R, self._bias, self._KG, self._RG, \
+            self._biasG = self._allocate(kernel_size,
+                                         input_size,
+                                         name_allocator_func,
+                                         dim_allocator_func,
+                                         **kwargs)

if generate_code:
eqs, args = self.equations()
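The new `**kwargs` plumbing lets a layer be labeled at construction time: the optional `name` is stored on the instance and forwarded to `_allocate`, presumably so subclasses can feed it into `default_name_allocator`. Hypothetical usage, where `Conv` stands in for any concrete `Layer` subclass and its other arguments are illustrative:

# Hypothetical: only the new keyword argument is the point here.
layer = Conv(kernel_size=(3, 3, 3), input_size=(1, 3, 32, 32),
             name='patch_embed', generate_code=False)
print(layer.name)        # 'patch_embed'
print(layer.propagate)   # True by default; see pytorch_parameters() below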
@@ -89,6 +132,11 @@ def kernel(self):
"""A Function object corresponding to a kernel/weight array."""
return self._K

+    @property
+    def weight(self):
+        """The kernel/weight values, i.e. the underlying Function's data array."""
+        return self._K.data

@property
def input(self):
"""A Function object corresponding to an input data array."""
@@ -135,27 +183,35 @@ def pytorch_parameters(self):
kernel_parameter = None
bias_parameter = None

-        if self._K is not None:
+        if self._K is not None and self.propagate:
kernel_tensor = from_numpy(self._K.data)
kernel_parameter = Parameter(kernel_tensor, requires_grad=False)

if self._KG is not None:
kernel_parameter.grad = from_numpy(self._KG.data)

-        if self._bias is not None:
+        if self._bias is not None and self.propagate:
bias_tensor = from_numpy(self._bias.data)
bias_parameter = Parameter(bias_tensor, requires_grad=False)

if self._biasG is not None:
bias_parameter.grad = from_numpy(self._biasG.data)

-        return (kernel_parameter, bias_parameter)
+        return kernel_parameter, bias_parameter

+    def init_params(self):
+        if self.kernel is not None:
+            self.kernel.data[:] = \
+                np.random.rand(*self.kernel.shape) - 0.5
+
+        if self.bias is not None:
+            self.bias.data[:] = np.random.rand(*self.bias.shape) - 0.5

@abstractmethod
def _allocate(self, kernel_size, input_size, name_allocator_func,
-                  dim_allocator_func) -> (Function, Function, Function,
-                                          Function, Function, Function,
-                                          Function):
+                  dim_allocator_func, **kwargs) -> (Function, Function, Function,
+                                                    Function, Function, Function,
+                                                    Function):
"""
This method should return a (Function, Function, Function, Function,
Function, Function, Function) object corresponding to a kernel,
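The practical effect of the new `propagate` guard in `pytorch_parameters` is that a layer with `propagate = False` reports no parameters, so it can be frozen out of a PyTorch optimizer. A sketch, assuming a network object that exposes its layers as a list (an attribute not shown in this diff):

import torch

# Freeze the first layer: its kernel and bias will come back as (None, None).
net.layers[0].propagate = False

params = []
for layer in net.layers:
    kernel, bias = layer.pytorch_parameters()
    params += [p for p in (kernel, bias) if p is not None]

optimizer = torch.optim.SGD(params, lr=0.01)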