|
7528 | 7528 | "lat": 4,
|
7529 | 7529 | "sizelat": 4,
|
7530 | 7530 | "size": 2,
|
7531 |
| - "gisize": -1, |
| 7531 | + "gisize": 22, |
7532 | 7532 | "extrasize": 0,
|
7533 | 7533 | "asm": "index z1.d, #7, #-1\nptrue p0.d, vl2\nudiv z0.d, p0/m, z0.d, z1.d\nret",
|
7534 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %178:_(s64), %179:_(s64), %180:_(s64), %181:_(s64) = G_UNMERGE_VALUES %103:_(<2 x s128>) (in function: test)", |
| 7534 | + "giasm": "mov x8, #9363 // =0x2493\nfmov x9, d0\nmov x10, #-6148914691236517206 // =0xaaaaaaaaaaaaaaaa\nmovk x8, #37449, lsl #16\nmovk x10, #43691\nmovk x8, #18724, lsl #32\nmovk x8, #9362, lsl #48\numulh x8, x9, x8\nmov x9, v0.d[1]\numulh x9, x9, x10\nmov v1.d[0], x8\nmov x8, #-9223372036854775808 // =0x8000000000000000\nmov v1.d[1], x9\nsub v0.2d, v0.2d, v1.2d\nfmov x9, d0\nmov x10, v0.d[1]\numulh x8, x9, x8\numulh x9, x10, xzr\nmov v0.d[0], x8\nmov v0.d[1], x9\nadd v0.2d, v0.2d, v1.2d\nushr v0.2d, v0.2d, #2\nret", |
7535 | 7535 | "ll": "define <2 x i64> @test(<2 x i64> %a) {\n %r = udiv <2 x i64> %a, <i64 7, i64 6>\n ret <2 x i64> %r\n}",
|
7536 | 7536 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 4 for instruction: %r = udiv <2 x i64> %a, <i64 7, i64 6>\nCost Model: Found an estimated cost of 1 for instruction: ret <2 x i64> %r"
|
7537 | 7537 | },
|
|
7560 | 7560 | "lat": 4,
|
7561 | 7561 | "sizelat": 4,
|
7562 | 7562 | "size": 3,
|
7563 |
| - "gisize": -1, |
| 7563 | + "gisize": 13, |
7564 | 7564 | "extrasize": 0,
|
7565 | 7565 | "asm": "mov w8, #7 // =0x7\nptrue p0.d, vl2\ndup v1.2d, x8\nudiv z0.d, p0/m, z0.d, z1.d\nret",
|
7566 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %110:_(s64), %111:_(s64), %112:_(s64), %113:_(s64) = G_UNMERGE_VALUES %33:_(<2 x s128>) (in function: test)", |
| 7566 | + "giasm": "mov x8, #9363 // =0x2493\nfmov x9, d0\nmov x10, v0.d[1]\nmovk x8, #37449, lsl #16\nmovk x8, #18724, lsl #32\nmovk x8, #9362, lsl #48\numulh x9, x9, x8\numulh x8, x10, x8\nmov v1.d[0], x9\nmov v1.d[1], x8\nsub v0.2d, v0.2d, v1.2d\nusra v1.2d, v0.2d, #1\nushr v0.2d, v1.2d, #2\nret", |
7567 | 7567 | "ll": "define <2 x i64> @test(<2 x i64> %a) {\n %r = udiv <2 x i64> %a, splat (i64 7)\n ret <2 x i64> %r\n}",
|
7568 | 7568 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 4 for instruction: %r = udiv <2 x i64> %a, splat (i64 7)\nCost Model: Found an estimated cost of 1 for instruction: ret <2 x i64> %r"
|
7569 | 7569 | },
|
|
7592 | 7592 | "lat": 4,
|
7593 | 7593 | "sizelat": 4,
|
7594 | 7594 | "size": 3,
|
7595 |
| - "gisize": -1, |
| 7595 | + "gisize": 37, |
7596 | 7596 | "extrasize": 0,
|
7597 | 7597 | "asm": "index z2.d, #7, #-1\nptrue p0.d, vl2\nudiv z0.d, p0/m, z0.d, z2.d\nudiv z1.d, p0/m, z1.d, z2.d\nret",
|
7598 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %0:_(<4 x s64>) = G_CONCAT_VECTORS %1:_(<2 x s64>), %2:_(<2 x s64>) (in function: test)", |
| 7598 | + "giasm": "mov x8, #9363 // =0x2493\nfmov x9, d0\nfmov x11, d1\nmovk x8, #37449, lsl #16\nmov x10, v0.d[1]\nmov x12, v1.d[1]\nmovk x8, #18724, lsl #32\nmovk x8, #9362, lsl #48\numulh x9, x9, x8\numulh x8, x11, x8\nmov x11, #-6148914691236517206 // =0xaaaaaaaaaaaaaaaa\nmovk x11, #43691\numulh x10, x10, x11\nmov v2.d[0], x9\numulh x9, x12, x11\nmov v3.d[0], x8\nmov x8, #-9223372036854775808 // =0x8000000000000000\nmov v2.d[1], x10\nmov v3.d[1], x9\nsub v0.2d, v0.2d, v2.2d\nsub v1.2d, v1.2d, v3.2d\nfmov x9, d0\nmov x10, v0.d[1]\nfmov x11, d1\nmov x12, v1.d[1]\numulh x9, x9, x8\numulh x8, x11, x8\numulh x10, x10, xzr\nmov v0.d[0], x9\numulh x11, x12, xzr\nmov v1.d[0], x8\nmov v0.d[1], x10\nmov v1.d[1], x11\nadd v0.2d, v0.2d, v2.2d\nadd v1.2d, v1.2d, v3.2d\nushr v0.2d, v0.2d, #2\nushr v1.2d, v1.2d, #2\nret", |
7599 | 7599 | "ll": "define <4 x i64> @test(<4 x i64> %a) {\n %r = udiv <4 x i64> %a, <i64 7, i64 6, i64 7, i64 6>\n ret <4 x i64> %r\n}",
|
7600 | 7600 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 4 for instruction: %r = udiv <4 x i64> %a, <i64 7, i64 6, i64 7, i64 6>\nCost Model: Found an estimated cost of 1 for instruction: ret <4 x i64> %r"
|
7601 | 7601 | },
|
|
7624 | 7624 | "lat": 4,
|
7625 | 7625 | "sizelat": 4,
|
7626 | 7626 | "size": 4,
|
7627 |
| - "gisize": -1, |
| 7627 | + "gisize": 22, |
7628 | 7628 | "extrasize": 0,
|
7629 | 7629 | "asm": "mov w8, #7 // =0x7\nptrue p0.d, vl2\ndup v2.2d, x8\nudiv z0.d, p0/m, z0.d, z2.d\nudiv z1.d, p0/m, z1.d, z2.d\nret",
|
7630 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %0:_(<4 x s64>) = G_CONCAT_VECTORS %1:_(<2 x s64>), %2:_(<2 x s64>) (in function: test)", |
| 7630 | + "giasm": "mov x8, #9363 // =0x2493\nfmov x9, d0\nfmov x11, d1\nmovk x8, #37449, lsl #16\nmov x10, v0.d[1]\nmov x12, v1.d[1]\nmovk x8, #18724, lsl #32\nmovk x8, #9362, lsl #48\numulh x9, x9, x8\numulh x11, x11, x8\numulh x10, x10, x8\nmov v2.d[0], x9\numulh x8, x12, x8\nmov v3.d[0], x11\nmov v2.d[1], x10\nmov v3.d[1], x8\nsub v0.2d, v0.2d, v2.2d\nsub v1.2d, v1.2d, v3.2d\nusra v2.2d, v0.2d, #1\nusra v3.2d, v1.2d, #1\nushr v0.2d, v2.2d, #2\nushr v1.2d, v3.2d, #2\nret", |
7631 | 7631 | "ll": "define <4 x i64> @test(<4 x i64> %a) {\n %r = udiv <4 x i64> %a, splat (i64 7)\n ret <4 x i64> %r\n}",
|
7632 | 7632 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 4 for instruction: %r = udiv <4 x i64> %a, splat (i64 7)\nCost Model: Found an estimated cost of 1 for instruction: ret <4 x i64> %r"
|
7633 | 7633 | },
|
@@ -32936,10 +32936,10 @@
|
32936 | 32936 | "lat": 160,
|
32937 | 32937 | "sizelat": 160,
|
32938 | 32938 | "size": 7,
|
32939 |
| - "gisize": -1, |
| 32939 | + "gisize": 7, |
32940 | 32940 | "extrasize": 0,
|
32941 | 32941 | "asm": "movi v2.16b, #1\nsub v3.16b, v0.16b, v2.16b\nsub v2.16b, v1.16b, v2.16b\nbic v0.16b, v3.16b, v0.16b\nbic v1.16b, v2.16b, v1.16b\ncnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nret",
|
32942 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %3:_(<32 x s8>) = G_CTPOP %10:_(<32 x s8>) (in function: test)", |
| 32942 | + "giasm": "movi v2.2d, #0xffffffffffffffff\nadd v3.16b, v0.16b, v2.16b\nadd v2.16b, v1.16b, v2.16b\nbic v0.16b, v3.16b, v0.16b\nbic v1.16b, v2.16b, v1.16b\ncnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nret", |
32943 | 32943 | "ll": "define <32 x i8> @test(<32 x i8> %a) {\n %r = call <32 x i8> @llvm.cttz(<32 x i8> %a, i1 0)\n ret <32 x i8> %r\n}",
|
32944 | 32944 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 160 for instruction: %r = call <32 x i8> @llvm.cttz.v32i8(<32 x i8> %a, i1 false)\nCost Model: Found an estimated cost of 1 for instruction: ret <32 x i8> %r"
|
32945 | 32945 | },
|
@@ -32984,10 +32984,10 @@
|
32984 | 32984 | "lat": 80,
|
32985 | 32985 | "sizelat": 80,
|
32986 | 32986 | "size": 10,
|
32987 |
| - "gisize": -1, |
| 32987 | + "gisize": 9, |
32988 | 32988 | "extrasize": 0,
|
32989 | 32989 | "asm": "movi v2.8h, #1\nsub v3.8h, v0.8h, v2.8h\nsub v2.8h, v1.8h, v2.8h\nbic v0.16b, v3.16b, v0.16b\nbic v1.16b, v2.16b, v1.16b\nmovi v2.8h, #16\nclz v0.8h, v0.8h\nclz v1.8h, v1.8h\nsub v0.8h, v2.8h, v0.8h\nsub v1.8h, v2.8h, v1.8h\nret",
|
32990 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %3:_(<16 x s16>) = G_CTPOP %10:_(<16 x s16>) (in function: test)", |
| 32990 | + "giasm": "movi v2.2d, #0xffffffffffffffff\nadd v3.8h, v0.8h, v2.8h\nadd v2.8h, v1.8h, v2.8h\nbic v0.16b, v3.16b, v0.16b\nbic v1.16b, v2.16b, v1.16b\ncnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nuaddlp v0.8h, v0.16b\nuaddlp v1.8h, v1.16b\nret", |
32991 | 32991 | "ll": "define <16 x i16> @test(<16 x i16> %a) {\n %r = call <16 x i16> @llvm.cttz(<16 x i16> %a, i1 0)\n ret <16 x i16> %r\n}",
|
32992 | 32992 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 80 for instruction: %r = call <16 x i16> @llvm.cttz.v16i16(<16 x i16> %a, i1 false)\nCost Model: Found an estimated cost of 1 for instruction: ret <16 x i16> %r"
|
32993 | 32993 | },
|
@@ -33032,10 +33032,10 @@
|
33032 | 33032 | "lat": 40,
|
33033 | 33033 | "sizelat": 40,
|
33034 | 33034 | "size": 10,
|
33035 |
| - "gisize": -1, |
| 33035 | + "gisize": 11, |
33036 | 33036 | "extrasize": 0,
|
33037 | 33037 | "asm": "movi v2.4s, #1\nsub v3.4s, v0.4s, v2.4s\nsub v2.4s, v1.4s, v2.4s\nbic v0.16b, v3.16b, v0.16b\nbic v1.16b, v2.16b, v1.16b\nmovi v2.4s, #32\nclz v0.4s, v0.4s\nclz v1.4s, v1.4s\nsub v0.4s, v2.4s, v0.4s\nsub v1.4s, v2.4s, v1.4s\nret",
|
33038 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %3:_(<8 x s32>) = G_CTPOP %10:_(<8 x s32>) (in function: test)", |
| 33038 | + "giasm": "movi v2.2d, #0xffffffffffffffff\nadd v3.4s, v0.4s, v2.4s\nadd v2.4s, v1.4s, v2.4s\nbic v0.16b, v3.16b, v0.16b\nbic v1.16b, v2.16b, v1.16b\ncnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nuaddlp v0.8h, v0.16b\nuaddlp v1.8h, v1.16b\nuaddlp v0.4s, v0.8h\nuaddlp v1.4s, v1.8h\nret", |
33039 | 33039 | "ll": "define <8 x i32> @test(<8 x i32> %a) {\n %r = call <8 x i32> @llvm.cttz(<8 x i32> %a, i1 0)\n ret <8 x i32> %r\n}",
|
33040 | 33040 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 40 for instruction: %r = call <8 x i32> @llvm.cttz.v8i32(<8 x i32> %a, i1 false)\nCost Model: Found an estimated cost of 1 for instruction: ret <8 x i32> %r"
|
33041 | 33041 | },
|
@@ -33064,10 +33064,10 @@
|
33064 | 33064 | "lat": 20,
|
33065 | 33065 | "sizelat": 20,
|
33066 | 33066 | "size": 14,
|
33067 |
| - "gisize": -1, |
| 33067 | + "gisize": 13, |
33068 | 33068 | "extrasize": 0,
|
33069 | 33069 | "asm": "mov w8, #1 // =0x1\ndup v2.2d, x8\nsub v3.2d, v0.2d, v2.2d\nsub v2.2d, v1.2d, v2.2d\nbic v0.16b, v3.16b, v0.16b\nbic v1.16b, v2.16b, v1.16b\ncnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nuaddlp v0.8h, v0.16b\nuaddlp v1.8h, v1.16b\nuaddlp v0.4s, v0.8h\nuaddlp v1.4s, v1.8h\nuaddlp v0.2d, v0.4s\nuaddlp v1.2d, v1.4s\nret",
|
33070 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %3:_(<4 x s64>) = G_CTPOP %10:_(<4 x s64>) (in function: test)", |
| 33070 | + "giasm": "movi v2.2d, #0xffffffffffffffff\nadd v3.2d, v0.2d, v2.2d\nadd v2.2d, v1.2d, v2.2d\nbic v0.16b, v3.16b, v0.16b\nbic v1.16b, v2.16b, v1.16b\ncnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nuaddlp v0.8h, v0.16b\nuaddlp v1.8h, v1.16b\nuaddlp v0.4s, v0.8h\nuaddlp v1.4s, v1.8h\nuaddlp v0.2d, v0.4s\nuaddlp v1.2d, v1.4s\nret", |
33071 | 33071 | "ll": "define <4 x i64> @test(<4 x i64> %a) {\n %r = call <4 x i64> @llvm.cttz(<4 x i64> %a, i1 0)\n ret <4 x i64> %r\n}",
|
33072 | 33072 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 20 for instruction: %r = call <4 x i64> @llvm.cttz.v4i64(<4 x i64> %a, i1 false)\nCost Model: Found an estimated cost of 1 for instruction: ret <4 x i64> %r"
|
33073 | 33073 | },
|
@@ -33352,10 +33352,10 @@
|
33352 | 33352 | "lat": 2,
|
33353 | 33353 | "sizelat": 2,
|
33354 | 33354 | "size": 2,
|
33355 |
| - "gisize": -1, |
| 33355 | + "gisize": 2, |
33356 | 33356 | "extrasize": 0,
|
33357 | 33357 | "asm": "cnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nret",
|
33358 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %3:_(<32 x s8>) = G_CTPOP %0:_(<32 x s8>) (in function: test)", |
| 33358 | + "giasm": "cnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nret", |
33359 | 33359 | "ll": "define <32 x i8> @test(<32 x i8> %a) {\n %r = call <32 x i8> @llvm.ctpop(<32 x i8> %a)\n ret <32 x i8> %r\n}",
|
33360 | 33360 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 2 for instruction: %r = call <32 x i8> @llvm.ctpop.v32i8(<32 x i8> %a)\nCost Model: Found an estimated cost of 1 for instruction: ret <32 x i8> %r"
|
33361 | 33361 | },
|
@@ -33400,10 +33400,10 @@
|
33400 | 33400 | "lat": 4,
|
33401 | 33401 | "sizelat": 4,
|
33402 | 33402 | "size": 4,
|
33403 |
| - "gisize": -1, |
| 33403 | + "gisize": 4, |
33404 | 33404 | "extrasize": 0,
|
33405 | 33405 | "asm": "cnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nuaddlp v0.8h, v0.16b\nuaddlp v1.8h, v1.16b\nret",
|
33406 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %3:_(<16 x s16>) = G_CTPOP %0:_(<16 x s16>) (in function: test)", |
| 33406 | + "giasm": "cnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nuaddlp v0.8h, v0.16b\nuaddlp v1.8h, v1.16b\nret", |
33407 | 33407 | "ll": "define <16 x i16> @test(<16 x i16> %a) {\n %r = call <16 x i16> @llvm.ctpop(<16 x i16> %a)\n ret <16 x i16> %r\n}",
|
33408 | 33408 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 4 for instruction: %r = call <16 x i16> @llvm.ctpop.v16i16(<16 x i16> %a)\nCost Model: Found an estimated cost of 1 for instruction: ret <16 x i16> %r"
|
33409 | 33409 | },
|
@@ -33448,10 +33448,10 @@
|
33448 | 33448 | "lat": 6,
|
33449 | 33449 | "sizelat": 6,
|
33450 | 33450 | "size": 6,
|
33451 |
| - "gisize": -1, |
| 33451 | + "gisize": 6, |
33452 | 33452 | "extrasize": 0,
|
33453 | 33453 | "asm": "cnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nuaddlp v0.8h, v0.16b\nuaddlp v1.8h, v1.16b\nuaddlp v0.4s, v0.8h\nuaddlp v1.4s, v1.8h\nret",
|
33454 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %3:_(<8 x s32>) = G_CTPOP %0:_(<8 x s32>) (in function: test)", |
| 33454 | + "giasm": "cnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nuaddlp v0.8h, v0.16b\nuaddlp v1.8h, v1.16b\nuaddlp v0.4s, v0.8h\nuaddlp v1.4s, v1.8h\nret", |
33455 | 33455 | "ll": "define <8 x i32> @test(<8 x i32> %a) {\n %r = call <8 x i32> @llvm.ctpop(<8 x i32> %a)\n ret <8 x i32> %r\n}",
|
33456 | 33456 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 6 for instruction: %r = call <8 x i32> @llvm.ctpop.v8i32(<8 x i32> %a)\nCost Model: Found an estimated cost of 1 for instruction: ret <8 x i32> %r"
|
33457 | 33457 | },
|
@@ -33480,10 +33480,10 @@
|
33480 | 33480 | "lat": 8,
|
33481 | 33481 | "sizelat": 8,
|
33482 | 33482 | "size": 8,
|
33483 |
| - "gisize": -1, |
| 33483 | + "gisize": 8, |
33484 | 33484 | "extrasize": 0,
|
33485 | 33485 | "asm": "cnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nuaddlp v0.8h, v0.16b\nuaddlp v1.8h, v1.16b\nuaddlp v0.4s, v0.8h\nuaddlp v1.4s, v1.8h\nuaddlp v0.2d, v0.4s\nuaddlp v1.2d, v1.4s\nret",
|
33486 |
| - "giasm": "LLVM ERROR: unable to legalize instruction: %3:_(<4 x s64>) = G_CTPOP %0:_(<4 x s64>) (in function: test)", |
| 33486 | + "giasm": "cnt v0.16b, v0.16b\ncnt v1.16b, v1.16b\nuaddlp v0.8h, v0.16b\nuaddlp v1.8h, v1.16b\nuaddlp v0.4s, v0.8h\nuaddlp v1.4s, v1.8h\nuaddlp v0.2d, v0.4s\nuaddlp v1.2d, v1.4s\nret", |
33487 | 33487 | "ll": "define <4 x i64> @test(<4 x i64> %a) {\n %r = call <4 x i64> @llvm.ctpop(<4 x i64> %a)\n ret <4 x i64> %r\n}",
|
33488 | 33488 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found an estimated cost of 8 for instruction: %r = call <4 x i64> @llvm.ctpop.v4i64(<4 x i64> %a)\nCost Model: Found an estimated cost of 1 for instruction: ret <4 x i64> %r"
|
33489 | 33489 | },
|
|
0 commit comments