Commit 6efd0e9: add bidir rnns

1 parent: 2be7797

5 files changed, +426 -46 lines

README.md (+27 -19)
````diff
@@ -69,19 +69,25 @@ Overview of Framework
   - Basic rnn kernel
   - LSTM kernel
   - GRU kernel
-  - BiLSTM kernel <mark>TODO</mark>
-  - BiGRU kernel <mark>TODO</mark>
+  - BiLSTM kernel
+  - BiGRU kernel
+  - Layer Norm <mark>TODO</mark>
 - FC
   - Dropout
   - Linear
 - Optimizer
-  - Raw GD
-  - Momentum
-  - Nesterov(NAG)
-  - AdaGrad
-  - RMSProp
-  - AdaDelta
-  - Adam[[6](#reference)]
+  - Algorithms
+    - Raw GD
+    - Momentum
+    - Nesterov(NAG)
+    - AdaGrad
+    - RMSProp
+    - AdaDelta
+    - Adam[[6](#reference)]
+  - Mechanisms
+    - Lr Decay. <mark>TODO</mark>
+    - Weight Decay. <mark>TODO</mark>
+    - Freeze. <mark>TODO</mark>
 - Utils
   - sigmoid
   - one hot
@@ -91,25 +97,27 @@ Overview of Framework
   - l1_regularization
   - l2_regularization
 
-#### 🗠 Number of Codes
+#### @ Number of Codes
 
 Last update: 2025.03.14.
 
 ```text
-68 text files.
-49 unique files.
-49 files ignored.
+236 text files.
+135 unique files.
+138 files ignored.
 
-github.com/AlDanial/cloc v 1.98 T=0.04 s (1365.4 files/s, 303229.6 lines/s)
+github.com/AlDanial/cloc v 1.98 T=0.05 s (2810.5 files/s, 307803.1 lines/s)
 -------------------------------------------------------------------------------
 Language                     files          blank        comment           code
 -------------------------------------------------------------------------------
-Jupyter Notebook                21              0           3954           2022
-Python                          21           1014           1805           1669
-Text                             6              1              0            295
-Markdown                         1             19              0            103
+Python                          33           1689           3297           3177
+Jupyter Notebook                21              0           3947           1913
+Text                             6              1              0            301
+CSV                             68              0              0            203
+Markdown                         5             40              0            198
+TOML                             2              3              0             16
 -------------------------------------------------------------------------------
-SUM:                            49           1034           5759           4089
+SUM:                           135           1733           7244           5808
 -------------------------------------------------------------------------------
 ```
 
````

gru_ucihar.ipynb (+23 -26)

Large diffs are not rendered by default.

plugins/lrkit

Submodule lrkit updated 35 files

plugins/minitorch/initer.py (+168)
````diff
@@ -10,7 +10,9 @@ class Initer:
     Supported layer types:
     - Basic Recurrent Neural Network (basic_rnn)
     - Long Short-Term Memory (lstm)
+    - Bidirectional Long Short-Term Memory (bilstm)
     - Gated Recurrent Unit (gru)
+    - Bidirectional Gated Recurrent Unit (bigru)
     - Fully Connected (fc) layers
     - 1D Convolutional layers (conv1d)
     - 2D Convolutional layers (conv2d)
@@ -19,7 +21,9 @@ class Initer:
     Their name should be like:
     - "basic_rnn:"
     - "lstm:"
+    - "bilstm:"
     - "gru:"
+    - "bigru:"
     - "fc:"
     - "conv1d:"
     - "conv2d:"
@@ -31,6 +35,7 @@ class Initer:
     '''
 
     SupportLayers = ('basic_rnn', 'lstm', 'gru',
+                     'bilstm', 'bigru',
                      'fc',
                      'conv1d', 'conv2d', 'conv3d')
 
@@ -81,6 +86,169 @@ def _init_param(self, name: str):
 
         return f(name)
 
+    def _bilstm(self, name):
+        '''
+        Initializes parameters for a bidirectional LSTM layer.
+
+        Config should be:
+        ```
+        name: {
+            'input_dim': int,   # Input dimension
+            'hidden_dim': int,  # Hidden state dimension
+            'strategy': str,    # Init strategy: 'None', 'Kaiming', or 'Xavier'
+        }
+        ```
+
+        Returns:
+            A dictionary containing:
+            - 'Ws': Weight matrices for input-to-hidden transformations (8, input_dim, hidden_dim).
+                - The first 4 matrices are for the forward direction.
+                - The last 4 matrices are for the backward direction.
+            - 'Us': Weight matrices for hidden-to-hidden transformations (8, hidden_dim, hidden_dim).
+                - The first 4 matrices are for the forward direction.
+                - The last 4 matrices are for the backward direction.
+            - 'Bs': Bias terms (8, hidden_dim).
+                - The first 4 biases are for the forward direction.
+                - The last 4 biases are for the backward direction.
+                - The forget gate biases (indices 0 and 4) are initialized to 1.
+        '''
+
+        match self.config[name]['strategy']:
+            case 'None':
+                return {
+                    'Ws': random.normal(self.key, (
+                        8,
+                        self.config[name]['input_dim'],
+                        self.config[name]['hidden_dim'],
+                    )),
+                    'Us': random.normal(self.key, (
+                        8,
+                        self.config[name]['hidden_dim'],
+                        self.config[name]['hidden_dim'],
+                    )),
+                    'Bs': jnp.zeros((
+                        8,
+                        self.config[name]['hidden_dim']
+                    )).at[0].set(1).at[4].set(1),  # Initialize forget gate biases to 1
+                }
+            case 'Kaiming':
+                return {
+                    'Ws': random.normal(self.key, (
+                        8,
+                        self.config[name]['input_dim'],
+                        self.config[name]['hidden_dim'],
+                    )) * jnp.sqrt(2 / (self.config[name]['input_dim'])),  # Kaiming
+                    'Us': random.normal(self.key, (
+                        8,
+                        self.config[name]['hidden_dim'],
+                        self.config[name]['hidden_dim'],
+                    )) * jnp.sqrt(2 / (self.config[name]['input_dim'])),
+                    'Bs': jnp.zeros((
+                        8,
+                        self.config[name]['hidden_dim']
+                    )).at[0].set(1).at[4].set(1),  # Initialize forget gate biases to 1
+                }
+            case 'Xavier':
+                return {
+                    'Ws': random.normal(self.key, (
+                        8,
+                        self.config[name]['input_dim'],
+                        self.config[name]['hidden_dim'],
+                    )) * jnp.sqrt(2 / (self.config[name]['input_dim'] + self.config[name]['hidden_dim'])),  # Xavier
+                    'Us': random.normal(self.key, (
+                        8,
+                        self.config[name]['hidden_dim'],
+                        self.config[name]['hidden_dim'],
+                    )) * jnp.sqrt(2 / (self.config[name]['input_dim'] + self.config[name]['hidden_dim'])),
+                    'Bs': jnp.zeros((
+                        8,
+                        self.config[name]['hidden_dim']
+                    )).at[0].set(1).at[4].set(1),  # Initialize forget gate biases to 1
+                }
+            case _:
+                raise ValueError(f'[x] Unsupported strategy: {self.config[name]["strategy"]} given by {name}.')
+
+    def _bigru(self, name):
+        '''
+        Initializes parameters for a bidirectional GRU layer.
+
+        Config should be:
+        ```
+        name: {
+            'input_dim': int,   # Input dimension
+            'hidden_dim': int,  # Hidden state dimension
+            'strategy': str,    # Init strategy: 'None', 'Kaiming', or 'Xavier'
+        }
+        ```
+
+        Returns:
+            A dictionary containing:
+            - 'Ws': Weight matrices for input-to-hidden transformations (6, input_dim, hidden_dim).
+                - The first 3 matrices are for the forward direction.
+                - The last 3 matrices are for the backward direction.
+            - 'Us': Weight matrices for hidden-to-hidden transformations (6, hidden_dim, hidden_dim).
+                - The first 3 matrices are for the forward direction.
+                - The last 3 matrices are for the backward direction.
+            - 'Bs': Bias terms (6, hidden_dim).
+                - The first 3 biases are for the forward direction.
+                - The last 3 biases are for the backward direction.
+        '''
+
+        match self.config[name]['strategy']:
+            case 'None':
+                return {
+                    'Ws': random.normal(self.key, (
+                        6,
+                        self.config[name]['input_dim'],
+                        self.config[name]['hidden_dim'],
+                    )),
+                    'Us': random.normal(self.key, (
+                        6,
+                        self.config[name]['hidden_dim'],
+                        self.config[name]['hidden_dim'],
+                    )),
+                    'Bs': jnp.zeros((
+                        6,
+                        self.config[name]['hidden_dim']
+                    )),
+                }
+            case 'Kaiming':
+                return {
+                    'Ws': random.normal(self.key, (
+                        6,
+                        self.config[name]['input_dim'],
+                        self.config[name]['hidden_dim'],
+                    )) * jnp.sqrt(2 / (self.config[name]['input_dim'])),  # Kaiming
+                    'Us': random.normal(self.key, (
+                        6,
+                        self.config[name]['hidden_dim'],
+                        self.config[name]['hidden_dim'],
+                    )) * jnp.sqrt(2 / (self.config[name]['input_dim'])),
+                    'Bs': jnp.zeros((
+                        6,
+                        self.config[name]['hidden_dim']
+                    )),
+                }
+            case 'Xavier':
+                return {
+                    'Ws': random.normal(self.key, (
+                        6,
+                        self.config[name]['input_dim'],
+                        self.config[name]['hidden_dim'],
+                    )) * jnp.sqrt(2 / (self.config[name]['input_dim'] + self.config[name]['hidden_dim'])),  # Xavier
+                    'Us': random.normal(self.key, (
+                        6,
+                        self.config[name]['hidden_dim'],
+                        self.config[name]['hidden_dim'],
+                    )) * jnp.sqrt(2 / (self.config[name]['input_dim'] + self.config[name]['hidden_dim'])),
+                    'Bs': jnp.zeros((
+                        6,
+                        self.config[name]['hidden_dim']
+                    )),
+                }
+            case _:
+                raise ValueError(f'[x] Unsupported strategy: {self.config[name]["strategy"]} given by {name}.')
+
     def _basic_rnn(self, name):
         '''
         Initializes parameters for a basic RNN layer.
````
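For readers of this commit, a minimal usage sketch follows. The config schema, the `"bilstm:"`/`"bigru:"` naming convention, and the returned shapes come from the docstrings above; the `Initer(config, key)` constructor signature and the direct `_init_param` call are assumptions for illustration.

```python
# Hypothetical usage sketch; Initer(config, key) is an assumed signature.
from jax import random

from plugins.minitorch.initer import Initer  # path as in this commit

config = {
    'bilstm:encoder': {        # "bilstm:" prefix selects the bidirectional LSTM initializer
        'input_dim': 9,        # per-timestep feature dimension (example value)
        'hidden_dim': 64,      # hidden state size per direction
        'strategy': 'Xavier',  # one of 'None', 'Kaiming', 'Xavier'
    },
    'bigru:head': {
        'input_dim': 128,      # 2 * 64: concatenated forward/backward BiLSTM outputs
        'hidden_dim': 32,
        'strategy': 'Kaiming',
    },
}

initer = Initer(config, random.PRNGKey(42))    # assumed constructor
params = initer._init_param('bilstm:encoder')

assert params['Ws'].shape == (8, 9, 64)    # 4 forward + 4 backward input weights
assert params['Us'].shape == (8, 64, 64)   # recurrent weights
assert params['Bs'].shape == (8, 64)       # biases; rows 0 and 4 start at 1 (forget gates)
```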

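The forward/backward split of the stacked parameters can also be illustrated with a scan-based pass. This is a sketch only: the diff pins the forget gate to indices 0 and 4, but the ordering of the remaining gates (input, output, candidate in slots 1-3 and 5-7 below) is an assumed convention, and the repo's actual BiLSTM kernel is not shown in this commit.

```python
# Sketch of a bidirectional pass over parameters shaped as in _bilstm.
# Gate order beyond the forget gate (indices 0/4) is an assumption.
import jax
import jax.numpy as jnp

def lstm_direction(x, Ws, Us, Bs):
    '''Run one direction over x of shape (T, input_dim) using 4 stacked gates.'''
    def step(carry, x_t):
        h, c = carry
        f = jax.nn.sigmoid(x_t @ Ws[0] + h @ Us[0] + Bs[0])  # forget gate (per docstring)
        i = jax.nn.sigmoid(x_t @ Ws[1] + h @ Us[1] + Bs[1])  # input gate (assumed slot)
        o = jax.nn.sigmoid(x_t @ Ws[2] + h @ Us[2] + Bs[2])  # output gate (assumed slot)
        g = jnp.tanh(x_t @ Ws[3] + h @ Us[3] + Bs[3])        # candidate (assumed slot)
        c = f * c + i * g
        h = o * jnp.tanh(c)
        return (h, c), h

    hidden = Us.shape[-1]
    init = (jnp.zeros(hidden), jnp.zeros(hidden))
    _, hs = jax.lax.scan(step, init, x)
    return hs  # (T, hidden_dim)

def bilstm_apply(params, x):
    '''Forward half uses slices [:4], backward half uses [4:]; outputs concatenate.'''
    fwd = lstm_direction(x, params['Ws'][:4], params['Us'][:4], params['Bs'][:4])
    bwd = lstm_direction(x[::-1], params['Ws'][4:], params['Us'][4:], params['Bs'][4:])
    return jnp.concatenate([fwd, bwd[::-1]], axis=-1)  # (T, 2 * hidden_dim)
```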