@@ -65,29 +65,29 @@ static std::shared_ptr<ov::Model> buildROPE_Llama2(const int batch,
65
65
auto Constant585 = cos_sin_cache[1 ];
66
66
67
67
// concat KV length
68
- auto transpose_Transpose = makeOP<opset1 ::Transpose>({input, {0 , 2 , 1 , 3 }});
69
- auto slice_Unsqueeze_426 = makeOP<opset1 ::Unsqueeze>({pos_id_end, 0 });
70
- auto ScatterUpdate_152236 = makeOP<opset3 ::ScatterUpdate>({{0 , 0 , 0 }, {2 }, slice_Unsqueeze_426, {0 }});
71
- auto slice_Slice = makeOP<opset1 ::StridedSlice>({Constant582, {0 , 0 , 0 }, ScatterUpdate_152236, {1 , 1 , 1 }},
68
+ auto transpose_Transpose = makeOP<ov::op::v1 ::Transpose>({input, {0 , 2 , 1 , 3 }});
69
+ auto slice_Unsqueeze_426 = makeOP<ov::op::v0 ::Unsqueeze>({pos_id_end, 0 });
70
+ auto ScatterUpdate_152236 = makeOP<ov::op::v3 ::ScatterUpdate>({{0 , 0 , 0 }, {2 }, slice_Unsqueeze_426, {0 }});
71
+ auto slice_Slice = makeOP<ov::op::v1 ::StridedSlice>({Constant582, {0 , 0 , 0 }, ScatterUpdate_152236, {1 , 1 , 1 }},
72
72
{{" begin_mask" , {1 , 1 , 0 }},
73
73
{" end_mask" , {1 , 1 , 0 }},
74
74
{" new_axis_mask" , {}},
75
75
{" shrink_axis_mask" , {}},
76
76
{" ellipsis_mask" , {}}});
77
- auto squeeze_Squeeze = makeOP<opset1 ::Squeeze>({slice_Slice, 1 });
78
- auto squeeze_Squeeze_435 = makeOP<opset1 ::Squeeze>({squeeze_Squeeze, 0 });
79
- auto index_441_Gather = makeOP<opset8 ::Gather>({squeeze_Squeeze_435, pos_ids, 0 }, {{" batch_dims" , 0 }});
80
- auto unsqueeze_Unsqueeze = makeOP<opset1 ::Unsqueeze>({index_441_Gather, 1 });
77
+ auto squeeze_Squeeze = makeOP<ov::op::v0 ::Squeeze>({slice_Slice, 1 });
78
+ auto squeeze_Squeeze_435 = makeOP<ov::op::v0 ::Squeeze>({squeeze_Squeeze, 0 });
79
+ auto index_441_Gather = makeOP<ov::op::v8 ::Gather>({squeeze_Squeeze_435, pos_ids, 0 }, {{" batch_dims" , 0 }});
80
+ auto unsqueeze_Unsqueeze = makeOP<ov::op::v0 ::Unsqueeze>({index_441_Gather, 1 });
81
81
auto mul_Multiply =
82
- makeOP<opset1 ::Multiply>({transpose_Transpose, unsqueeze_Unsqueeze}, {{" auto_broadcast" , " numpy" }});
83
- auto size_ShapeOf_448 = makeOP<opset3 ::ShapeOf>({transpose_Transpose}, {{" output_type" , " i32" }});
84
- auto size_Gather_450 = makeOP<opset8 ::Gather>({size_ShapeOf_448, 3 , 0 }, {{" batch_dims" , 0 }});
82
+ makeOP<ov::op::v1 ::Multiply>({transpose_Transpose, unsqueeze_Unsqueeze}, {{" auto_broadcast" , " numpy" }});
83
+ auto size_ShapeOf_448 = makeOP<ov::op::v3 ::ShapeOf>({transpose_Transpose}, {{" output_type" , " i32" }});
84
+ auto size_Gather_450 = makeOP<ov::op::v8 ::Gather>({size_ShapeOf_448, 3 , 0 }, {{" batch_dims" , 0 }});
85
85
auto floor_divide_Divide =
86
- makeOP<opset1 ::Divide>({size_Gather_450, 2 }, {{" auto_broadcast" , " numpy" }, {" m_pythondiv" , true }});
87
- auto floor_divide_Floor = makeOP<opset1 ::Floor>({floor_divide_Divide});
88
- auto slice_Unsqueeze_452 = makeOP<opset1 ::Unsqueeze>({floor_divide_Floor, 0 });
89
- auto ScatterUpdate_152312 = makeOP<opset3 ::ScatterUpdate>({{0 , 0 , 0 , 0 }, {3 }, slice_Unsqueeze_452, {0 }});
90
- auto slice_Slice_459 = makeOP<opset1 ::StridedSlice>(
86
+ makeOP<ov::op::v1 ::Divide>({size_Gather_450, 2 }, {{" auto_broadcast" , " numpy" }, {" m_pythondiv" , true }});
87
+ auto floor_divide_Floor = makeOP<ov::op::v0 ::Floor>({floor_divide_Divide});
88
+ auto slice_Unsqueeze_452 = makeOP<ov::op::v0 ::Unsqueeze>({floor_divide_Floor, 0 });
89
+ auto ScatterUpdate_152312 = makeOP<ov::op::v3 ::ScatterUpdate>({{0 , 0 , 0 , 0 }, {3 }, slice_Unsqueeze_452, {0 }});
90
+ auto slice_Slice_459 = makeOP<ov::op::v1 ::StridedSlice>(
91
91
{transpose_Transpose, ScatterUpdate_152312, {0ll , 0ll , 0ll , LLONG_MAX}, {1 , 1 , 1 , 1 }},
92
92
{{" begin_mask" , {1 , 1 , 1 , 0 }},
93
93
{" end_mask" , {1 , 1 , 1 , 0 }},
@@ -102,30 +102,30 @@ static std::shared_ptr<ov::Model> buildROPE_Llama2(const int batch,
102
102
1 ,
103
103
}),
104
104
{-1 .000000f });
105
- auto neg_Multiply = makeOP<opset1 ::Multiply>({slice_Slice_459, Constant_182988}, {{" auto_broadcast" , " numpy" }});
106
- auto ScatterUpdate_152368 = makeOP<opset3 ::ScatterUpdate>({{0 , 0 , 0 , 0 }, {3 }, slice_Unsqueeze_452, {0 }});
105
+ auto neg_Multiply = makeOP<ov::op::v1 ::Multiply>({slice_Slice_459, Constant_182988}, {{" auto_broadcast" , " numpy" }});
106
+ auto ScatterUpdate_152368 = makeOP<ov::op::v3 ::ScatterUpdate>({{0 , 0 , 0 , 0 }, {3 }, slice_Unsqueeze_452, {0 }});
107
107
auto slice_Slice2 =
108
- makeOP<opset1 ::StridedSlice>({transpose_Transpose, {0 , 0 , 0 , 0 }, ScatterUpdate_152368, {1 , 1 , 1 , 1 }},
108
+ makeOP<ov::op::v1 ::StridedSlice>({transpose_Transpose, {0 , 0 , 0 , 0 }, ScatterUpdate_152368, {1 , 1 , 1 , 1 }},
109
109
{{" begin_mask" , {1 , 1 , 1 , 0 }},
110
110
{" end_mask" , {1 , 1 , 1 , 0 }},
111
111
{" new_axis_mask" , {}},
112
112
{" shrink_axis_mask" , {}},
113
113
{" ellipsis_mask" , {}}});
114
- auto cat_Concat = makeOP<opset1 ::Concat>({neg_Multiply, slice_Slice2}, {{" axis" , -1 }});
115
- auto ScatterUpdate_152421 = makeOP<opset3 ::ScatterUpdate>({{0 , 0 , 0 }, {2 }, slice_Unsqueeze_426, {0 }});
116
- auto slice_Slice_433 = makeOP<opset1 ::StridedSlice>({Constant585, {0 , 0 , 0 }, ScatterUpdate_152421, {1 , 1 , 1 }},
114
+ auto cat_Concat = makeOP<ov::op::v0 ::Concat>({neg_Multiply, slice_Slice2}, {{" axis" , -1 }});
115
+ auto ScatterUpdate_152421 = makeOP<ov::op::v3 ::ScatterUpdate>({{0 , 0 , 0 }, {2 }, slice_Unsqueeze_426, {0 }});
116
+ auto slice_Slice_433 = makeOP<ov::op::v1 ::StridedSlice>({Constant585, {0 , 0 , 0 }, ScatterUpdate_152421, {1 , 1 , 1 }},
117
117
{{" begin_mask" , {1 , 1 , 0 }},
118
118
{" end_mask" , {1 , 1 , 0 }},
119
119
{" new_axis_mask" , {}},
120
120
{" shrink_axis_mask" , {}},
121
121
{" ellipsis_mask" , {}}});
122
- auto squeeze_Squeeze_436 = makeOP<opset1 ::Squeeze>({slice_Slice_433, 1 });
123
- auto squeeze_Squeeze_437 = makeOP<opset1 ::Squeeze>({squeeze_Squeeze_436, 0 });
124
- auto index_446_Gather = makeOP<opset8 ::Gather>({squeeze_Squeeze_437, pos_ids, 0 }, {{" batch_dims" , 0 }});
125
- auto unsqueeze_Unsqueeze_447 = makeOP<opset1 ::Unsqueeze>({index_446_Gather, 1 });
122
+ auto squeeze_Squeeze_436 = makeOP<ov::op::v0 ::Squeeze>({slice_Slice_433, 1 });
123
+ auto squeeze_Squeeze_437 = makeOP<ov::op::v0 ::Squeeze>({squeeze_Squeeze_436, 0 });
124
+ auto index_446_Gather = makeOP<ov::op::v8 ::Gather>({squeeze_Squeeze_437, pos_ids, 0 }, {{" batch_dims" , 0 }});
125
+ auto unsqueeze_Unsqueeze_447 = makeOP<ov::op::v0 ::Unsqueeze>({index_446_Gather, 1 });
126
126
auto mul_Multiply_463 =
127
- makeOP<opset1 ::Multiply>({cat_Concat, unsqueeze_Unsqueeze_447}, {{" auto_broadcast" , " numpy" }});
128
- auto add_Add = makeOP<opset1 ::Add>({mul_Multiply, mul_Multiply_463}, {{" auto_broadcast" , " numpy" }});
127
+ makeOP<ov::op::v1 ::Multiply>({cat_Concat, unsqueeze_Unsqueeze_447}, {{" auto_broadcast" , " numpy" }});
128
+ auto add_Add = makeOP<ov::op::v1 ::Add>({mul_Multiply, mul_Multiply_463}, {{" auto_broadcast" , " numpy" }});
129
129
130
130
return std::make_shared<ov::Model>(ov::NodeVector{add_Add}, ov::ParameterVector{input, pos_id_end, pos_ids});
131
131
}
0 commit comments