[Test only] BFloat16 test for SkipSimplifiedLayerNormalization #22941

jiafatom · 2024-11-25T18:35:52Z

Description

Motivation and Context

github-actions

You can commit the suggested changes from lintrunner.

github-actions · 2024-11-25T18:42:11Z

onnxruntime/contrib_ops/cuda/bert/skip_layer_norm.cc

+          skip_size);
+    } 
+    else
+    {
+      LaunchSkipLayerNormKernel<CudaT, Simplified>(


Suggested change

skip_size);

}

else

{

LaunchSkipLayerNormKernel<CudaT, Simplified>(

skip_size);

} else {

LaunchSkipLayerNormKernel<CudaT, Simplified>(

github-actions · 2024-11-25T18:42:12Z

onnxruntime/python/tools/transformers/float16.py

 import tempfile
 from typing import Dict
+from enum import Enum



Suggested change

import tempfile

from typing import Dict

from enum import Enum

import tempfile

from enum import Enum

from typing import Dict

github-actions · 2024-11-25T18:42:12Z

onnxruntime/python/tools/transformers/float16.py

 from onnx import AttributeProto, GraphProto, ModelProto, NodeProto, TensorProto, helper, numpy_helper
 from onnx.shape_inference import infer_shapes, infer_shapes_path
+from onnx.helper import float32_to_bfloat16
 from packaging import version


Suggested change

from onnx import AttributeProto, GraphProto, ModelProto, NodeProto, TensorProto, helper, numpy_helper

from onnx.shape_inference import infer_shapes, infer_shapes_path

from onnx.helper import float32_to_bfloat16

from packaging import version

from onnx import AttributeProto, GraphProto, ModelProto, NodeProto, TensorProto, helper, numpy_helper

from onnx.helper import float32_to_bfloat16

from onnx.shape_inference import infer_shapes, infer_shapes_path

from packaging import version

github-actions · 2024-11-25T18:42:12Z

onnxruntime/python/tools/transformers/float16.py


-
 def convert_np_to_float16(np_array, min_positive_val=5.96e-08, max_finite_val=65504.0):


Suggested change

def convert_np_to_float16(np_array, min_positive_val=5.96e-08, max_finite_val=65504.0):

def convert_np_to_float16(np_array, min_positive_val=5.96e-08, max_finite_val=65504.0):

github-actions · 2024-11-25T18:42:12Z

onnxruntime/python/tools/transformers/float16.py


+def convert_tensor_float_to_bfloat16(tensor):


Suggested change

def convert_tensor_float_to_bfloat16(tensor):

def convert_tensor_float_to_bfloat16(tensor):

github-actions · 2024-11-25T18:42:12Z

onnxruntime/python/tools/transformers/float16.py

+class NodeValueType(Enum):
+    FP32 = 1


Suggested change

class NodeValueType(Enum):

FP32 = 1

class NodeValueType(Enum):

github-actions · 2024-11-25T18:42:12Z

onnxruntime/python/tools/transformers/float16.py

 class InitializerTracker:
    """Class for keeping track of initializer."""


Suggested change

class InitializerTracker:

"""Class for keeping track of initializer."""

class InitializerTracker:

github-actions · 2024-11-25T18:42:12Z

onnxruntime/python/tools/transformers/float16.py

 def convert_float_to_float16(
    model,


Suggested change

def convert_float_to_float16(

model,

def convert_float_to_float16(

github-actions · 2024-11-25T18:42:12Z

onnxruntime/python/tools/transformers/float16.py


    # Some operators have data type fixed as float for some input. Add a float16 to float cast for those inputs.
    for node in mixed_float_type_node_list:


Suggested change

# Some operators have data type fixed as float for some input. Add a float16 to float cast for those inputs.

for node in mixed_float_type_node_list:

# Some operators have data type fixed as float for some input. Add a float16 to float cast for those inputs.

github-actions

You can commit the suggested changes from lintrunner.

github-actions · 2024-11-25T22:34:11Z

onnxruntime/python/tools/transformers/float16.py

 import tempfile
 from typing import Dict
+from enum import Enum
+import ml_dtypes

 import numpy as np


Suggested change

import tempfile

from typing import Dict

from enum import Enum

import ml_dtypes

import numpy as np

import tempfile

from enum import Enum

from typing import Dict

import ml_dtypes

import numpy as np

github-actions

You can commit the suggested changes from lintrunner.

github-actions · 2024-11-26T02:27:35Z

onnxruntime/contrib_ops/cuda/bert/skip_layer_norm.cc

+          skip_size);
+    }
+    else
+    {
+      LaunchSkipLayerNormKernel<CudaT, Simplified>(


Suggested change

skip_size);

}

else

{

LaunchSkipLayerNormKernel<CudaT, Simplified>(

skip_size);

} else {

LaunchSkipLayerNormKernel<CudaT, Simplified>(

…lic_shape bugfix (#23558) - Add symbolic shape inference dispatcher for `ReduceMean`. - `ReduceMean` is used in RMSNorm, so shape inference fails for torch-exported models such as Llama and Phi. - Reuse the dispatcher for `ReduceSum`, since `ReduceMean` 18+ and `ReduceSum` 13+ have the same specs other than the type of reduction performed. - Fix an issue with the `quant_pre_process` tool where the external data file is missing if `skip_symbolic_shape=True` and `skip_optimization=False`. - Add `"session.optimized_model_external_initializers_file_name"` to session options so that the external data gets saved in the same temp directory as the optimized model.

github-actions

You can commit the suggested changes from lintrunner.

github-actions · 2025-02-03T18:16:13Z

onnxruntime/python/tools/transformers/float16.py

 import tempfile
+from typing import Dict
+from enum import Enum
+import ml_dtypes

 import numpy as np


Suggested change

import tempfile

from typing import Dict

from enum import Enum

import ml_dtypes

import numpy as np

import tempfile

from enum import Enum

import ml_dtypes

import numpy as np

github-actions · 2025-02-03T18:16:13Z

onnxruntime/python/tools/transformers/float16.py


+import onnxscript
+from onnxscript import optimizer, ir
+import onnxconverter_common
+from onnxconverter_common.onnx_ex import make_model_ex
+import onnxruntime as rt
+



Suggested change

import onnxscript

from onnxscript import optimizer, ir

import onnxconverter_common

from onnxconverter_common.onnx_ex import make_model_ex

import onnxruntime as rt

github-actions · 2025-02-03T18:16:13Z

onnxruntime/python/tools/transformers/float16.py


-def convert_tensor_float_to_float16(tensor, min_positive_val=5.96e-08, max_finite_val=65504.0):
+def convert_tensor_float_to_float16(tensor, is_value_type_bfloat16=False, min_positive_val=5.96e-08, max_finite_val=65504.0):
    """Convert tensor float to float16.


Suggested change

def convert_tensor_float_to_float16(tensor, min_positive_val=5.96e-08, max_finite_val=65504.0):

def convert_tensor_float_to_float16(tensor, is_value_type_bfloat16=False, min_positive_val=5.96e-08, max_finite_val=65504.0):

"""Convert tensor float to float16.

def convert_tensor_float_to_float16(

tensor, is_value_type_bfloat16=False, min_positive_val=5.96e-08, max_finite_val=65504.0

):

"""Convert tensor float to float16.

github-actions · 2025-02-03T18:16:13Z

onnxruntime/python/tools/transformers/float16.py


+class NodeValueType(Enum):


Suggested change

class NodeValueType(Enum):

class NodeValueType(Enum):

github-actions · 2025-02-03T18:16:14Z

onnxruntime/python/tools/transformers/float16.py


 class InitializerTracker:


Suggested change

class InitializerTracker:

class InitializerTracker:

github-actions · 2025-02-03T18:16:14Z

onnxruntime/python/tools/transformers/float16.py

+

    # Some operators have data type fixed as float for some input. Add a float16 to float cast for those inputs.


Suggested change

# Some operators have data type fixed as float for some input. Add a float16 to float cast for those inputs.

# Some operators have data type fixed as float for some input. Add a float16 to float cast for those inputs.

github-actions · 2025-02-03T18:16:14Z

onnxruntime/python/tools/transformers/float16.py

                    node_name = node.name + "_input_cast" + str(i)
-                    new_node = [helper.make_node("Cast", [input_name], [output_name], to=1, name=node_name)]
+                    new_node = [helper.make_node("Cast", [input_name], [output_name], to=TensorProto.FLOAT, name=node_name)]
                    model.graph.node.extend(new_node)


Suggested change

node_name = node.name + "_input_cast" + str(i)

new_node = [helper.make_node("Cast", [input_name], [output_name], to=1, name=node_name)]

new_node = [helper.make_node("Cast", [input_name], [output_name], to=TensorProto.FLOAT, name=node_name)]

model.graph.node.extend(new_node)

node_name = node.name + "_input_cast" + str(i)

new_node = [

helper.make_node("Cast", [input_name], [output_name], to=TensorProto.FLOAT, name=node_name)

]

model.graph.node.extend(new_node)

github-actions · 2025-02-03T18:16:14Z

onnxruntime/python/tools/transformers/float16.py

+                    # new_node = [helper.make_node("Cast", [input_name], [output], to=final_value_type, name=node_name)]
+                    new_node = [helper.make_node("Cast", [input_name], [output], to=TensorProto.FLOAT16, name=node_name)]
                    model.graph.node.extend(new_node)


Suggested change

# new_node = [helper.make_node("Cast", [input_name], [output], to=final_value_type, name=node_name)]

new_node = [helper.make_node("Cast", [input_name], [output], to=TensorProto.FLOAT16, name=node_name)]

model.graph.node.extend(new_node)

# new_node = [helper.make_node("Cast", [input_name], [output], to=final_value_type, name=node_name)]

new_node = [

helper.make_node("Cast", [input_name], [output], to=TensorProto.FLOAT16, name=node_name)

]

model.graph.node.extend(new_node)

github-actions · 2025-02-03T18:16:15Z

onnxruntime/python/tools/transformers/float16.py

+    # model = ir.serde.serialize_model(ir_model)
+    '''
+


Suggested change

# model = ir.serde.serialize_model(ir_model)

'''

# model = ir.serde.serialize_model(ir_model)

"""

github-actions · 2025-02-03T18:16:15Z

onnxruntime/python/tools/transformers/float16.py

+                          domain=model.domain)
+    '''
+


Suggested change

domain=model.domain)

'''

domain=model.domain)

"""

onnxruntime/python/tools/transformers/float16.py

@@ -16,6 +16,9 @@
 import logging
 import os
 import tempfile
+from typing import Dict


onnxruntime/python/tools/transformers/float16.py

@@ -16,6 +16,9 @@
 import logging
 import os
 import tempfile
+from typing import Dict


onnxruntime/python/tools/transformers/float16.py

@@ -25,6 +28,12 @@

 logger = logging.getLogger(__name__)

+import onnxscript


onnxruntime/python/tools/transformers/float16.py

@@ -25,6 +28,12 @@

 logger = logging.getLogger(__name__)

+import onnxscript


onnxruntime/python/tools/transformers/float16.py

@@ -25,6 +28,12 @@

 logger = logging.getLogger(__name__)

+import onnxscript


onnxruntime/python/tools/transformers/float16.py

@@ -25,6 +28,12 @@

 logger = logging.getLogger(__name__)

+import onnxscript
+from onnxscript import optimizer, ir
+import onnxconverter_common


onnxruntime/python/tools/transformers/float16.py

+import onnxscript
+from onnxscript import optimizer, ir
+import onnxconverter_common
+from onnxconverter_common.onnx_ex import make_model_ex


onnxruntime/python/tools/transformers/float16.py

+import onnxscript
+from onnxscript import optimizer, ir
+import onnxconverter_common
+from onnxconverter_common.onnx_ex import make_model_ex


onnxruntime/python/tools/transformers/float16.py

+from onnxscript import optimizer, ir
+import onnxconverter_common
+from onnxconverter_common.onnx_ex import make_model_ex
+import onnxruntime as rt


onnxruntime/python/tools/transformers/float16.py

+from onnxscript import optimizer, ir
+import onnxconverter_common
+from onnxconverter_common.onnx_ex import make_model_ex
+import onnxruntime as rt


onnxruntime/python/tools/transformers/float16.py

@@ -16,6 +16,9 @@
 import logging
 import os
 import tempfile
+from typing import Dict


onnxruntime/python/tools/transformers/float16.py

@@ -25,6 +28,12 @@

 logger = logging.getLogger(__name__)

+import onnxscript


onnxruntime/python/tools/transformers/float16.py

@@ -25,6 +28,12 @@

 logger = logging.getLogger(__name__)

+import onnxscript
+from onnxscript import optimizer, ir


onnxruntime/python/tools/transformers/float16.py

@@ -25,6 +28,12 @@

 logger = logging.getLogger(__name__)

+import onnxscript
+from onnxscript import optimizer, ir
+import onnxconverter_common


onnxruntime/python/tools/transformers/float16.py

+import onnxscript
+from onnxscript import optimizer, ir
+import onnxconverter_common
+from onnxconverter_common.onnx_ex import make_model_ex


onnxruntime/python/tools/transformers/float16.py

+from onnxscript import optimizer, ir
+import onnxconverter_common
+from onnxconverter_common.onnx_ex import make_model_ex
+import onnxruntime as rt


onnxruntime/python/tools/transformers/float16.py

+    # if func_infer_shape is not None:
+    #    model = func_infer_shape(model)


jiafatom changed the title ~~BFloat16 test for SkipSimplifiedLayerNormalization~~ [Test only] BFloat16 test for SkipSimplifiedLayerNormalization Nov 25, 2024

github-actions bot reviewed Nov 25, 2024

View reviewed changes

jiafatom force-pushed the skip_bf_16 branch from e4ef17b to e5f20f2 Compare November 25, 2024 22:28

github-actions bot reviewed Nov 25, 2024

View reviewed changes

jiafatom force-pushed the skip_bf_16 branch 4 times, most recently from 03bf839 to 09e2cc1 Compare November 26, 2024 02:24

github-actions bot reviewed Nov 26, 2024

View reviewed changes

jiafatom force-pushed the skip_bf_16 branch from 09e2cc1 to a09b5da Compare February 3, 2025 18:11

github-actions bot reviewed Feb 3, 2025

View reviewed changes

github-advanced-security bot found potential problems Feb 3, 2025

View reviewed changes

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

[Test only] BFloat16 test for SkipSimplifiedLayerNormalization #22941

[Test only] BFloat16 test for SkipSimplifiedLayerNormalization #22941

jiafatom commented Nov 25, 2024

github-actions bot left a comment

github-actions bot Nov 25, 2024

github-actions bot Nov 25, 2024

github-actions bot Nov 25, 2024

github-actions bot Nov 25, 2024

github-actions bot Nov 25, 2024

github-actions bot Nov 25, 2024

github-actions bot Nov 25, 2024

github-actions bot Nov 25, 2024

github-actions bot Nov 25, 2024

github-actions bot left a comment

github-actions bot Nov 25, 2024

github-actions bot left a comment

github-actions bot Nov 26, 2024

github-actions bot left a comment

github-actions bot Feb 3, 2025

github-actions bot Feb 3, 2025

github-actions bot Feb 3, 2025

github-actions bot Feb 3, 2025

github-actions bot Feb 3, 2025

github-actions bot Feb 3, 2025

github-actions bot Feb 3, 2025

github-actions bot Feb 3, 2025

github-actions bot Feb 3, 2025

github-actions bot Feb 3, 2025



		def convert_np_to_float16(np_array, min_positive_val=5.96e-08, max_finite_val=65504.0):


	def convert_tensor_float_to_bfloat16(tensor):


	def convert_tensor_float_to_bfloat16(tensor):

		class InitializerTracker:
		"""Class for keeping track of initializer."""


		# Some operators have data type fixed as float for some input. Add a float16 to float cast for those inputs.
		for node in mixed_float_type_node_list:

		@@ -25,6 +28,12 @@

		logger = logging.getLogger(__name__)

		import onnxscript

		# if func_infer_shape is not None:
		# model = func_infer_shape(model)

[Test only] BFloat16 test for SkipSimplifiedLayerNormalization #22941

Are you sure you want to change the base?

[Test only] BFloat16 test for SkipSimplifiedLayerNormalization #22941

Conversation

jiafatom commented Nov 25, 2024

Description

Motivation and Context

github-actions bot left a comment

Choose a reason for hiding this comment

github-actions bot Nov 25, 2024

Choose a reason for hiding this comment

github-actions bot Nov 25, 2024

Choose a reason for hiding this comment

github-actions bot Nov 25, 2024

Choose a reason for hiding this comment

github-actions bot Nov 25, 2024

Choose a reason for hiding this comment

github-actions bot Nov 25, 2024

Choose a reason for hiding this comment

github-actions bot Nov 25, 2024

Choose a reason for hiding this comment

github-actions bot Nov 25, 2024

Choose a reason for hiding this comment

github-actions bot Nov 25, 2024

Choose a reason for hiding this comment

github-actions bot Nov 25, 2024

Choose a reason for hiding this comment

github-actions bot left a comment

Choose a reason for hiding this comment

github-actions bot Nov 25, 2024

Choose a reason for hiding this comment

github-actions bot left a comment

Choose a reason for hiding this comment

github-actions bot Nov 26, 2024

Choose a reason for hiding this comment

github-actions bot left a comment

Choose a reason for hiding this comment

github-actions bot Feb 3, 2025

Choose a reason for hiding this comment

github-actions bot Feb 3, 2025

Choose a reason for hiding this comment

github-actions bot Feb 3, 2025

Choose a reason for hiding this comment

github-actions bot Feb 3, 2025

Choose a reason for hiding this comment

github-actions bot Feb 3, 2025

Choose a reason for hiding this comment

github-actions bot Feb 3, 2025

Choose a reason for hiding this comment

github-actions bot Feb 3, 2025

Choose a reason for hiding this comment

github-actions bot Feb 3, 2025

Choose a reason for hiding this comment

github-actions bot Feb 3, 2025

Choose a reason for hiding this comment

github-actions bot Feb 3, 2025

Choose a reason for hiding this comment