diff --git a/examples/structured_data/class_with_grn_and_vsn_with_hyperparameters_tuning.py b/examples/structured_data/class_with_grn_and_vsn_with_hyperparameters_tuning.py
new file mode 100644
index 0000000000..31fd374bbb
--- /dev/null
+++ b/examples/structured_data/class_with_grn_and_vsn_with_hyperparameters_tuning.py
@@ -0,0 +1,684 @@
+"""
+Title: Classification with Gated Residual and Variable Selection Networks with hyperparameter tuning
+Author: [Humbulani Ndou](https://github.com/Humbulani1234)
+Date created: 2025/03/17
+Last modified: 2025/03/17
+Description: Using Gated Residual and Variable Selection Networks for income level prediction, with hyperparameter tuning
+Accelerator: GPU
+"""
+
+"""
+## Introduction
+
+The following example extends the script `structured_data/classification_with_grn_and_vsn.py`
+by incorporating hyperparameter tuning using [AutoKeras](https://github.com/keras-team/autokeras)
+and [KerasTuner](https://github.com/keras-team/keras-tuner). The specific APIs used from
+these two packages are described in detail in the relevant code sections.
+
+This example demonstrates the use of Gated
+Residual Networks (GRN) and Variable Selection Networks (VSN), proposed by
+Bryan Lim et al. in
+[Temporal Fusion Transformers (TFT) for Interpretable Multi-horizon Time Series Forecasting](https://arxiv.org/abs/1912.09363),
+for structured data classification. GRNs give the model the flexibility to apply
+non-linear processing only where needed. VSNs allow the model to softly remove
+unnecessary noisy inputs that could negatively impact performance.
+Together, these techniques help improve the learning capacity of deep neural
+network models.
+
+Note that this example implements only the GRN and VSN components described
+in the paper, rather than the whole TFT model, as GRN and VSN can be useful on
+their own for structured data learning tasks.
+
+To run the code you need TensorFlow 2.3 or higher; TensorFlow is only used here
+for the `tf.data` input pipeline, while the model itself runs on the Keras
+backend of your choice.
+"""
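+
+"""
+For reference, here is a sketch of the GRN transform as defined in the paper
+(omitting the optional context vector that the full TFT model uses), where $a$
+is the layer input:
+
+$$\eta_2 = \mathrm{ELU}(W_2 a + b_2)$$
+
+$$\eta_1 = W_1 \eta_2 + b_1$$
+
+$$\mathrm{GRN}(a) = \mathrm{LayerNorm}(a + \mathrm{GLU}(\eta_1)),
+\quad \mathrm{GLU}(\eta_1) = \sigma(W_4 \eta_1 + b_4) \odot (W_5 \eta_1 + b_5)$$
+
+The `GatedLinearUnit` and `GatedResidualNetwork` layers defined later in this
+script follow this structure.
+"""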
+
+"""
+## The dataset
+
+This example uses the
+[United States Census Income Dataset](https://archive.ics.uci.edu/ml/datasets/Census-Income+%28KDD%29)
+provided by the
+[UC Irvine Machine Learning Repository](https://archive.ics.uci.edu/ml/index.php).
+The task is binary classification to determine whether a person makes over 50K a year.
+
+The dataset includes ~300K instances with 41 input features: 7 numerical features
+and 34 categorical features.
+"""
+
+"""
+## Setup
+"""
+
+
+import os
+import tarfile
+import numpy as np
+import pandas as pd
+import tree
+from typing import Optional, Union
+
+os.environ["KERAS_BACKEND"] = "torch"  # or jax, or tensorflow
+
+# Keras imports
+import keras
+from keras import layers
+
+# KerasTuner imports
+import keras_tuner
+from keras_tuner import HyperParameters
+
+# AutoKeras imports
+import autokeras as ak
+from autokeras.utils import utils, types
+
+
+"""
+## Prepare the data
+
+First we load the data from the UCI Machine Learning Repository into a Pandas DataFrame.
+"""
+
+# Column names.
+CSV_HEADER = [
+    "age",
+    "class_of_worker",
+    "detailed_industry_recode",
+    "detailed_occupation_recode",
+    "education",
+    "wage_per_hour",
+    "enroll_in_edu_inst_last_wk",
+    "marital_stat",
+    "major_industry_code",
+    "major_occupation_code",
+    "race",
+    "hispanic_origin",
+    "sex",
+    "member_of_a_labor_union",
+    "reason_for_unemployment",
+    "full_or_part_time_employment_stat",
+    "capital_gains",
+    "capital_losses",
+    "dividends_from_stocks",
+    "tax_filer_stat",
+    "region_of_previous_residence",
+    "state_of_previous_residence",
+    "detailed_household_and_family_stat",
+    "detailed_household_summary_in_household",
+    "instance_weight",
+    "migration_code-change_in_msa",
+    "migration_code-change_in_reg",
+    "migration_code-move_within_reg",
+    "live_in_this_house_1_year_ago",
+    "migration_prev_res_in_sunbelt",
+    "num_persons_worked_for_employer",
+    "family_members_under_18",
+    "country_of_birth_father",
+    "country_of_birth_mother",
+    "country_of_birth_self",
+    "citizenship",
+    "own_business_or_self_employed",
+    "fill_inc_questionnaire_for_veterans_admin",
+    "veterans_benefits",
+    "weeks_worked_in_year",
+    "year",
+    "income_level",
+]
+
+data_url = "https://archive.ics.uci.edu/static/public/117/census+income+kdd.zip"
+if not os.path.isdir(
+    os.path.join(os.path.expanduser("~"), ".keras", "datasets", "census+income+kdd.zip")
+):
+    keras.utils.get_file(origin=data_url, extract=True)
+
+
+"""
+Determine the path of the `.tar.gz` archive inside the extracted download, and
+unpack its contents if that has not been done already.
+"""
+
+extracted_path = os.path.join(
+    os.path.expanduser("~"), ".keras", "datasets", "census+income+kdd.zip"
+)
+if not os.path.exists(
+    os.path.join(
+        os.path.expanduser("~"),
+        ".keras",
+        "datasets",
+        "census+income+kdd.zip",
+        "census-income.test",
+    )
+):
+    for root, dirs, files in os.walk(extracted_path):
+        for file in files:
+            if file.endswith(".tar.gz"):
+                tar_gz_path = os.path.join(root, file)
+                with tarfile.open(tar_gz_path, "r:gz") as tar:
+                    tar.extractall(path=root)
+
+train_data_path = os.path.join(
+    os.path.expanduser("~"),
+    ".keras",
+    "datasets",
+    "census+income+kdd.zip",
+    "census-income.data",
+)
+test_data_path = os.path.join(
+    os.path.expanduser("~"),
+    ".keras",
+    "datasets",
+    "census+income+kdd.zip",
+    "census-income.test",
+)
+
+data = pd.read_csv(train_data_path, header=None, names=CSV_HEADER).iloc[0:10000]
+test_data = pd.read_csv(test_data_path, header=None, names=CSV_HEADER).iloc[0:5000]
+
+print(f"Data shape: {data.shape}")
+print(f"Test data shape: {test_data.shape}")
+
+
+"""
+We convert the target column from string to integer.
+"""
+
+data["income_level"] = data["income_level"].apply(
+    lambda x: 0 if x == " - 50000." else 1
+)
+test_data["income_level"] = test_data["income_level"].apply(
+    lambda x: 0 if x == " - 50000." else 1
+)
+
+
+"""
+Then, we split the dataset into train and validation sets.
+"""
+
+random_selection = np.random.rand(len(data.index)) <= 0.85
+train_data = data[random_selection]
+valid_data = data[~random_selection]
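+
+
+"""
+As a quick sanity check (a minimal, optional sketch; the exact counts vary from
+run to run because the split is random), we can inspect the split sizes and the
+class balance:
+"""
+
+# Roughly 85% of the rows should land in the train split.
+print(f"Train split: {len(train_data)}, validation split: {len(valid_data)}")
+# The dataset is heavily imbalanced towards the 0 (income below 50K) class.
+print(train_data["income_level"].value_counts(normalize=True))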
+""" + +train_data_file = "train_data.csv" +valid_data_file = "valid_data.csv" +test_data_file = "test_data.csv" + +train_data.to_csv(train_data_file, index=False, header=False) +valid_data.to_csv(valid_data_file, index=False, header=False) +test_data.to_csv(test_data_file, index=False, header=False) + +""" +## Define dataset metadata + +Here, we define the metadata of the dataset that will be useful for reading and +parsing the data into input features, and encoding the input features with respect +to their types. +""" + +# Target feature name. +TARGET_FEATURE_NAME = "income_level" +# Weight column name. +WEIGHT_COLUMN_NAME = "instance_weight" +# Numeric feature names. +NUMERIC_FEATURE_NAMES = [ + "age", + "wage_per_hour", + "capital_gains", + "capital_losses", + "dividends_from_stocks", + "num_persons_worked_for_employer", + "weeks_worked_in_year", +] +# Categorical features and their vocabulary lists. +# Note that we add 'v=' as a prefix to all categorical feature values to make +# sure that they are treated as strings. +CATEGORICAL_FEATURES_WITH_VOCABULARY = { + feature_name: sorted([str(value) for value in list(data[feature_name].unique())]) + for feature_name in CSV_HEADER + if feature_name + not in list(NUMERIC_FEATURE_NAMES + [WEIGHT_COLUMN_NAME, TARGET_FEATURE_NAME]) +} +# All features names. +FEATURE_NAMES = NUMERIC_FEATURE_NAMES + list( + CATEGORICAL_FEATURES_WITH_VOCABULARY.keys() +) +# Feature default values. +COLUMN_DEFAULTS = [ + ( + [0.0] + if feature_name + in NUMERIC_FEATURE_NAMES + [TARGET_FEATURE_NAME, WEIGHT_COLUMN_NAME] + else ["NA"] + ) + for feature_name in CSV_HEADER +] + +""" +## Create a `tf.data.Dataset` for training and evaluation + +We create an input function to read and parse the file, and convert features and +labels into a [`tf.data.Dataset`](https://www.tensorflow.org/guide/datasets) for +training and evaluation. +""" + +# Tensorflow required for tf.data.Datasets +import tensorflow as tf + + +# We process our datasets elements here (categorical) and convert them to indices to avoid this step +# during model training since only tensorflow support strings. +def process(features, target): + for feature_name in features: + if feature_name in CATEGORICAL_FEATURES_WITH_VOCABULARY: + # Cast categorical feature values to string. + features[feature_name] = tf.cast(features[feature_name], "string") + vocabulary = CATEGORICAL_FEATURES_WITH_VOCABULARY[feature_name] + # Create a lookup to convert a string values to an integer indices. + # Since we are not using a mask token we leave at default. + index = layers.StringLookup( + vocabulary=vocabulary, + mask_token=None, + num_oov_indices=1, + output_mode="int", + ) + # Convert the string input values into integer indices. + value_index = index(features[feature_name]) + features[feature_name] = value_index + else: + # Do nothing for numerical features + pass + + # Get the instance weight. + weight = features.pop(WEIGHT_COLUMN_NAME) + # Change features from OrderedDict to Dict to match Inputs as they are Dict. 
+
+
+"""
+## Subclassing the AutoKeras `Graph`
+
+Here we subclass the AutoKeras `Graph`:
+
+- `build`: we override this method so that it can handle model `Inputs` passed
+as dictionaries. In structured data analysis, inputs are usually passed as a
+dictionary with one entry per feature of interest.
+
+"""
+
+
+class Graph(ak.graph.Graph):
+
+    def build(self, hp):
+        """Build the HyperModel into a Keras Model."""
+        keras_nodes = {}
+        keras_input_nodes = []
+        for node in self.inputs:
+            node_id = self._node_to_id[node]
+            input_node = node.build_node(hp)
+            output_node = node.build(hp, input_node)
+            keras_input_nodes.append(input_node)
+            keras_nodes[node_id] = output_node
+        for block in self.blocks:
+            # This code block handles dict inputs.
+            temp_inputs = None
+            for input_node in block.inputs:
+                if isinstance(input_node, ak.Input):
+                    temp_inputs = temp_inputs if temp_inputs is not None else {}
+                    temp_inputs[input_node.name] = keras_nodes[
+                        self._node_to_id[input_node]
+                    ]
+                else:
+                    temp_inputs = temp_inputs if temp_inputs is not None else []
+                    temp_inputs.append(keras_nodes[self._node_to_id[input_node]])
+            outputs = block.build(hp, inputs=temp_inputs)
+            outputs = tree.flatten(outputs)
+            for output_node, real_output_node in zip(block.outputs, outputs):
+                keras_nodes[self._node_to_id[output_node]] = real_output_node
+        model = keras.models.Model(
+            keras_input_nodes,
+            [
+                keras_nodes[self._node_to_id[output_node]]
+                for output_node in self.outputs
+            ],
+        )
+        return self._compile_keras_model(hp, model)
+
+    def _compile_keras_model(self, hp, model):
+        # Specify the hyperparameters from compile(...).
+        optimizer_name = hp.Choice(
+            "optimizer",
+            ["adam", "sgd"],
+            default="adam",
+        )
+        learning_rate = hp.Choice(
+            "learning_rate", [1e-1, 1e-2, 1e-3, 1e-4, 2e-5, 1e-5], default=1e-3
+        )
+        if optimizer_name == "adam":
+            optimizer = keras.optimizers.Adam(learning_rate=learning_rate)
+        elif optimizer_name == "sgd":
+            optimizer = keras.optimizers.SGD(learning_rate=learning_rate)
+        model.compile(
+            optimizer=optimizer,
+            metrics=self._get_metrics(),
+            loss=self._get_loss(),
+        )
+        return model
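+
+
+"""
+A minimal sketch of how the hyperparameters registered in `_compile_keras_model`
+behave in isolation: on a fresh `HyperParameters` object (outside of any tuner),
+`hp.Choice` registers the hyperparameter and returns its default value. The
+`hp_demo` name is ours, purely for illustration.
+"""
+
+hp_demo = HyperParameters()
+print(hp_demo.Choice("optimizer", ["adam", "sgd"], default="adam"))  # adam
+print(
+    hp_demo.Choice("learning_rate", [1e-1, 1e-2, 1e-3, 1e-4, 2e-5, 1e-5], default=1e-3)
+)  # 0.001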
+""" + + +class ClassifierHead(ak.ClassificationHead): + + def __init__( + self, + num_classes: Optional[int] = None, + multi_label: bool = False, + loss: Optional[types.LossType] = None, + metrics: Optional[types.MetricsType] = None, + dropout: Optional[float] = None, + **kwargs, + ): + self.num_classes = num_classes + self.multi_label = multi_label + self.dropout = dropout + if metrics is None: + metrics = ["accuracy"] + if loss is None: + loss = self.infer_loss() + ak.Head.__init__(self, loss=loss, metrics=metrics, **kwargs) + self.shape = self.get_expected_shape() + + def get_expected_shape(self): + # Compute expected shape from num_classes. + if self.num_classes == 2 and not self.multi_label: + return [1] + return [self.num_classes] + + +""" +## GatedLinearUnit Layer + +This is a keras layer defined in the script `structured_data/classification_with_grn_vsn.py` +More details about this layer maybe found in the relevant script + +""" + + +class GatedLinearUnit(layers.Layer): + def __init__(self, num_units, activation, **kwargs): + super().__init__(**kwargs) + self.linear = layers.Dense(num_units) + self.sigmoid = layers.Dense(num_units, activation=activation) + + def call(self, inputs): + return self.linear(inputs) * self.sigmoid(inputs) + + def build(self): + self.built = True + + +""" +## GatedResidualNetwork Layer + +This is a keras layer defined in the script `structured_data/classification_with_grn_vsn.py` +More details about this layer maybe found in the relevant script + +""" + + +class GatedResidualNetwork(layers.Layer): + + def __init__( + self, num_units, dropout_rate, activation, use_layernorm=None, **kwargs + ): + super().__init__(**kwargs) + self.num_units = num_units + self.use_layernorm = use_layernorm + self.elu_dense = layers.Dense(num_units, activation=activation) + self.linear_dense = layers.Dense(num_units) + self.dropout = layers.Dropout(dropout_rate) + self.gated_linear_unit = GatedLinearUnit(num_units, activation) + self.layer_norm = layers.LayerNormalization() + self.project = layers.Dense(num_units) + + def call(self, inputs, hp): + x = self.elu_dense(inputs) + x = self.linear_dense(x) + x = self.dropout(x) + if inputs.shape[-1] != self.num_units: + inputs = self.project(inputs) + x = inputs + self.gated_linear_unit(x) + use_layernorm = self.use_layernorm + if use_layernorm is None: + use_layernorm = hp.Boolean("use_layernorm", default=True) + if use_layernorm: + x = self.layer_norm(x) + return x + + def build(self): + self.built = True + + +""" +## Building the Autokeras `VariableSelection Block` + +We have converted the following keras layer to an Autokeras Block to include +hyperapameters to tune. Refer to Autokeras blocks API for writing custom Blocks. 
+
+
+"""
+## Building the AutoKeras `VariableSelection` Block
+
+We have converted the original Keras layer into an AutoKeras `Block` so that its
+hyperparameters can be tuned. Refer to the AutoKeras blocks API for details on
+writing custom blocks.
+"""
+
+
+class VariableSelection(ak.Block):
+    def __init__(
+        self,
+        num_units: Optional[Union[int, HyperParameters.Choice]] = None,
+        dropout_rate: Optional[Union[float, HyperParameters.Choice]] = None,
+        activation: Optional[Union[str, HyperParameters.Choice]] = None,
+        **kwargs,
+    ):
+        super().__init__(**kwargs)
+        self.dropout = utils.get_hyperparameter(
+            dropout_rate,
+            HyperParameters().Choice("dropout", [0.0, 0.25, 0.5], default=0.0),
+            float,
+        )
+        self.num_units = utils.get_hyperparameter(
+            num_units,
+            HyperParameters().Choice(
+                "num_units", [16, 32, 64, 128, 256, 512, 1024], default=16
+            ),
+            int,
+        )
+        self.activation = utils.get_hyperparameter(
+            activation,
+            HyperParameters().Choice(
+                "vsn_activation", ["sigmoid", "elu"], default="sigmoid"
+            ),
+            str,
+        )
+
+    def build(self, hp, inputs):
+        num_units = utils.add_to_hp(self.num_units, hp, "num_units")
+        dropout_rate = utils.add_to_hp(self.dropout, hp, "dropout_rate")
+        activation = utils.add_to_hp(self.activation, hp, "activation")
+        concat_inputs = []
+        for input_ in inputs:
+            if input_ in CATEGORICAL_FEATURES_WITH_VOCABULARY:
+                vocabulary = CATEGORICAL_FEATURES_WITH_VOCABULARY[input_]
+                # Clamp the indices: the torch backend raised index errors during
+                # embedding lookups, hence the clip below.
+                max_index = len(vocabulary) - 1
+                embedded_feature = layers.Embedding(
+                    input_dim=len(vocabulary),
+                    output_dim=num_units,
+                )(keras.ops.clip(inputs[input_], 0, max_index))
+                concat_inputs.append(embedded_feature)
+            else:
+                # Project the numeric feature to num_units using a linear transformation.
+                proj_feature = keras.ops.expand_dims(inputs[input_], -1)
+                proj_feature = layers.Dense(units=num_units)(proj_feature)
+                concat_inputs.append(proj_feature)
+        v = layers.concatenate(concat_inputs)
+        v = GatedResidualNetwork(
+            num_units=num_units, dropout_rate=dropout_rate, activation=activation
+        )(v, hp=hp)
+        # Compute the per-feature selection weights.
+        v = keras.ops.expand_dims(
+            layers.Dense(units=len(inputs), activation=activation)(v), axis=-1
+        )
+        # Apply a GRN to each feature individually.
+        x = []
+        for feature in concat_inputs:
+            x.append(
+                GatedResidualNetwork(
+                    num_units=num_units,
+                    dropout_rate=dropout_rate,
+                    activation=activation,
+                )(feature, hp=hp)
+            )
+        x = keras.ops.stack(x, axis=1)
+        # Combine the per-feature GRN outputs, weighted by the selection weights.
+        return keras.ops.squeeze(
+            keras.ops.matmul(keras.ops.transpose(v, axes=[0, 2, 1]), x), axis=1
+        )
+
+
+"""
+## Create the model inputs
+
+We create the model inputs using the `Input` node subclassed above; they will be
+built into Keras `Input` layers.
+"""
+
+
+def create_model_inputs():
+    inputs = {}
+    for feature_name in FEATURE_NAMES:
+        if feature_name in CATEGORICAL_FEATURES_WITH_VOCABULARY:
+            # Make them int64, they are categorical (whole units).
+            inputs[feature_name] = Input(name=feature_name, shape=(), dtype="int64")
+        else:
+            # Make them float32, they are real numbers.
+            inputs[feature_name] = Input(name=feature_name, shape=(), dtype="float32")
+    return inputs
+
+
+"""
+## KerasTuner `HyperModel`
+
+Here we use the AutoKeras functional API to construct a network of blocks, which
+will be built into a KerasTuner `HyperModel` and, finally, into a Keras `Model`.
+"""
+
+
+class MyHyperModel(keras_tuner.HyperModel):
+
+    def build(self, hp):
+        inputs = create_model_inputs()
+        features = VariableSelection()(inputs)
+        outputs = ClassifierHead(num_classes=2, multi_label=False)(features)
+        model = Graph(inputs=inputs, outputs=outputs)
+        model = model.build(hp)
+        return model
+
+    def fit(self, hp, model, *args, **kwargs):
+        return model.fit(
+            *args,
+            # Tune whether to shuffle the data in each epoch.
+            shuffle=hp.Boolean("shuffle"),
+            **kwargs,
+        )
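+
+
+"""
+Before launching a search, it can help to check that the `HyperModel` builds at
+all. A minimal, optional sketch: building one model with a fresh
+`HyperParameters` object uses the default value of every registered
+hyperparameter.
+"""
+
+default_model = MyHyperModel().build(keras_tuner.HyperParameters())
+print(f"Default model built with {default_model.count_params()} parameters.")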
+
+
+"""
+## Using the `RandomSearch` tuner to find the best hyperparameters
+
+We use the `RandomSearch` tuner to search for the best hyperparameters in the
+search space. We also display a summary of the search space.
+"""
+
+print("Start training the model...")
+train_dataset = get_dataset_from_csv(train_data_file, shuffle=True, batch_size=256)
+valid_dataset = get_dataset_from_csv(valid_data_file, batch_size=256)
+
+tuner = keras_tuner.RandomSearch(
+    MyHyperModel(),
+    objective="val_accuracy",
+    max_trials=3,
+    overwrite=True,
+    directory="my_dir",
+    project_name="tune_hypermodel",
+)
+
+# Show the search space summary.
+print("Tuner search space summary:\n")
+tuner.search_space_summary()
+# Search for the best model.
+tuner.search(train_dataset, epochs=2, validation_data=valid_dataset)
+
+"""
+## Extracting the best model
+"""
+
+# Get the top model.
+models = tuner.get_best_models(num_models=1)
+best_model = models[0]
+best_model.summary()
+
+
+"""
+## Evaluating model performance
+"""
+
+print("Evaluating model performance...")
+test_dataset = get_dataset_from_csv(test_data_file, batch_size=128)
+_, accuracy = best_model.evaluate(test_dataset)
+print(f"Test accuracy: {round(accuracy * 100, 2)}%")
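+
+
+"""
+We can also retrieve the winning hyperparameter values themselves, e.g. to
+re-train a model from scratch with a larger budget (a minimal sketch using the
+standard KerasTuner API):
+"""
+
+best_hps = tuner.get_best_hyperparameters(num_trials=1)[0]
+print("Best hyperparameters:", best_hps.values)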