|
2647 | 2647 | "thru": 1, |
2648 | 2648 | "lat": 1, |
2649 | 2649 | "sizelat": 1, |
2650 | | - "size": 3, |
| 2650 | + "size": 4, |
2651 | 2651 | "gisize": 3, |
2652 | 2652 | "extrasize": 0, |
2653 | | - "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nushl v0.8b, v0.8b, v1.8b\nret", |
| 2653 | + "asm": "mov x8, #434041037028460038 // =0x606060606060606\norr x8, x8, #0x7000700070007\nfmov d1, x8\nushl v0.8b, v0.8b, v1.8b\nret", |
2654 | 2654 | "giasm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nushl v0.8b, v0.8b, v1.8b\nret", |
2655 | 2655 | "ll": "define <8 x i8> @test(<8 x i8> %a) vscale_range(2, 2){\n %r = shl <8 x i8> %a, <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>\n ret <8 x i8> %r\n}", |
2656 | 2656 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of 1 for: %r = shl <8 x i8> %a, <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i8> %r" |
|
2839 | 2839 | "thru": 1, |
2840 | 2840 | "lat": 1, |
2841 | 2841 | "sizelat": 1, |
2842 | | - "size": 3, |
| 2842 | + "size": 4, |
2843 | 2843 | "gisize": 3, |
2844 | 2844 | "extrasize": 0, |
2845 | | - "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nushl v0.4h, v0.4h, v1.4h\nret", |
| 2845 | + "asm": "mov x8, #1688875630460934 // =0x6000600060006\norr x8, x8, #0x700000007\nfmov d1, x8\nushl v0.4h, v0.4h, v1.4h\nret", |
2846 | 2846 | "giasm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nushl v0.4h, v0.4h, v1.4h\nret", |
2847 | 2847 | "ll": "define <4 x i16> @test(<4 x i16> %a) vscale_range(2, 2){\n %r = shl <4 x i16> %a, <i16 7, i16 6, i16 7, i16 6>\n ret <4 x i16> %r\n}", |
2848 | 2848 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of 1 for: %r = shl <4 x i16> %a, <i16 7, i16 6, i16 7, i16 6>\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i16> %r" |
|
4007 | 4007 | "thru": 1, |
4008 | 4008 | "lat": 1, |
4009 | 4009 | "sizelat": 1, |
4010 | | - "size": 3, |
| 4010 | + "size": 4, |
4011 | 4011 | "gisize": 4, |
4012 | 4012 | "extrasize": 0, |
4013 | | - "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nsshl v0.8b, v0.8b, v1.8b\nret", |
| 4013 | + "asm": "mov x8, #-434041037028460039 // =0xf9f9f9f9f9f9f9f9\neor x8, x8, #0x300030003000300\nfmov d1, x8\nsshl v0.8b, v0.8b, v1.8b\nret", |
4014 | 4014 | "giasm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nneg v1.8b, v1.8b\nsshl v0.8b, v0.8b, v1.8b\nret", |
4015 | 4015 | "ll": "define <8 x i8> @test(<8 x i8> %a) vscale_range(2, 2){\n %r = ashr <8 x i8> %a, <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>\n ret <8 x i8> %r\n}", |
4016 | 4016 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of 1 for: %r = ashr <8 x i8> %a, <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i8> %r" |
|
4199 | 4199 | "thru": 1, |
4200 | 4200 | "lat": 1, |
4201 | 4201 | "sizelat": 1, |
4202 | | - "size": 3, |
| 4202 | + "size": 4, |
4203 | 4203 | "gisize": 4, |
4204 | 4204 | "extrasize": 0, |
4205 | | - "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nsshl v0.4h, v0.4h, v1.4h\nret", |
| 4205 | + "asm": "mov x8, #-1688875630460935 // =0xfff9fff9fff9fff9\neor x8, x8, #0x3000000030000\nfmov d1, x8\nsshl v0.4h, v0.4h, v1.4h\nret", |
4206 | 4206 | "giasm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nneg v1.4h, v1.4h\nsshl v0.4h, v0.4h, v1.4h\nret", |
4207 | 4207 | "ll": "define <4 x i16> @test(<4 x i16> %a) vscale_range(2, 2){\n %r = ashr <4 x i16> %a, <i16 7, i16 6, i16 7, i16 6>\n ret <4 x i16> %r\n}", |
4208 | 4208 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of 1 for: %r = ashr <4 x i16> %a, <i16 7, i16 6, i16 7, i16 6>\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i16> %r" |
|
5367 | 5367 | "thru": 1, |
5368 | 5368 | "lat": 1, |
5369 | 5369 | "sizelat": 1, |
5370 | | - "size": 3, |
| 5370 | + "size": 4, |
5371 | 5371 | "gisize": 4, |
5372 | 5372 | "extrasize": 0, |
5373 | | - "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nushl v0.8b, v0.8b, v1.8b\nret", |
| 5373 | + "asm": "mov x8, #-434041037028460039 // =0xf9f9f9f9f9f9f9f9\neor x8, x8, #0x300030003000300\nfmov d1, x8\nushl v0.8b, v0.8b, v1.8b\nret", |
5374 | 5374 | "giasm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nneg v1.8b, v1.8b\nushl v0.8b, v0.8b, v1.8b\nret", |
5375 | 5375 | "ll": "define <8 x i8> @test(<8 x i8> %a) vscale_range(2, 2){\n %r = lshr <8 x i8> %a, <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>\n ret <8 x i8> %r\n}", |
5376 | 5376 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of 1 for: %r = lshr <8 x i8> %a, <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i8> %r" |
|
5559 | 5559 | "thru": 1, |
5560 | 5560 | "lat": 1, |
5561 | 5561 | "sizelat": 1, |
5562 | | - "size": 3, |
| 5562 | + "size": 4, |
5563 | 5563 | "gisize": 4, |
5564 | 5564 | "extrasize": 0, |
5565 | | - "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nushl v0.4h, v0.4h, v1.4h\nret", |
| 5565 | + "asm": "mov x8, #-1688875630460935 // =0xfff9fff9fff9fff9\neor x8, x8, #0x3000000030000\nfmov d1, x8\nushl v0.4h, v0.4h, v1.4h\nret", |
5566 | 5566 | "giasm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nneg v1.4h, v1.4h\nushl v0.4h, v0.4h, v1.4h\nret", |
5567 | 5567 | "ll": "define <4 x i16> @test(<4 x i16> %a) vscale_range(2, 2){\n %r = lshr <4 x i16> %a, <i16 7, i16 6, i16 7, i16 6>\n ret <4 x i16> %r\n}", |
5568 | 5568 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of 1 for: %r = lshr <4 x i16> %a, <i16 7, i16 6, i16 7, i16 6>\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i16> %r" |
|
8087 | 8087 | "thru": 30, |
8088 | 8088 | "lat": 4, |
8089 | 8089 | "sizelat": 4, |
8090 | | - "size": 11, |
| 8090 | + "size": 12, |
8091 | 8091 | "gisize": 15, |
8092 | 8092 | "extrasize": 0, |
8093 | | - "asm": "adrp x8, .LCPI0_0\nfmov d2, d0\nmovi v3.4h, #254\nldr d1, [x8, :lo12:.LCPI0_0]\nadrp x8, .LCPI0_1\nsmulh z1.b, z0.b, z1.b\nbic v2.4h, #255, lsl #8\nadd v1.8b, v1.8b, v2.8b\nldr d2, [x8, :lo12:.LCPI0_1]\nsshl v1.8b, v1.8b, v3.8b\nusra v1.8b, v1.8b, #7\nmls v0.8b, v1.8b, v2.8b\nret", |
| 8093 | + "asm": "adrp x8, .LCPI0_0\nfmov d2, d0\nmovi v3.4h, #254\nldr d1, [x8, :lo12:.LCPI0_0]\nmov x8, #434041037028460038 // =0x606060606060606\norr x8, x8, #0x7000700070007\nsmulh z1.b, z0.b, z1.b\nbic v2.4h, #255, lsl #8\nadd v1.8b, v1.8b, v2.8b\nfmov d2, x8\nsshl v1.8b, v1.8b, v3.8b\nusra v1.8b, v1.8b, #7\nmls v0.8b, v1.8b, v2.8b\nret", |
8094 | 8094 | "giasm": "adrp x8, .LCPI0_2\nldr d1, [x8, :lo12:.LCPI0_2]\nadrp x8, .LCPI0_1\nldr d2, [x8, :lo12:.LCPI0_1]\nadrp x8, .LCPI0_0\nsmull v1.8h, v0.8b, v1.8b\nldr d3, [x8, :lo12:.LCPI0_0]\nadrp x8, .LCPI0_3\nshrn v1.8b, v1.8h, #8\nmla v1.8b, v0.8b, v2.8b\nneg v2.8b, v3.8b\nsshl v1.8b, v1.8b, v2.8b\nldr d2, [x8, :lo12:.LCPI0_3]\nusra v1.8b, v1.8b, #7\nmls v0.8b, v1.8b, v2.8b\nret", |
8095 | 8095 | "ll": "define <8 x i8> @test(<8 x i8> %a) vscale_range(2, 2){\n %r = srem <8 x i8> %a, <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>\n ret <8 x i8> %r\n}", |
8096 | 8096 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of RThru:30 CodeSize:4 Lat:4 SizeLat:4 for: %r = srem <8 x i8> %a, <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i8> %r" |
|
8279 | 8279 | "thru": 18, |
8280 | 8280 | "lat": 4, |
8281 | 8281 | "sizelat": 4, |
8282 | | - "size": 9, |
| 8282 | + "size": 10, |
8283 | 8283 | "gisize": 12, |
8284 | 8284 | "extrasize": 0, |
8285 | | - "asm": "adrp x8, .LCPI0_0\nmovi d2, #0x00ffff0000ffff\nldr d1, [x8, :lo12:.LCPI0_0]\nadrp x8, .LCPI0_1\nsmulh z1.h, z0.h, z1.h\nsshl v1.4h, v1.4h, v2.4h\nldr d2, [x8, :lo12:.LCPI0_1]\nusra v1.4h, v1.4h, #15\nmls v0.4h, v1.4h, v2.4h\nret", |
| 8285 | + "asm": "adrp x8, .LCPI0_0\nmovi d2, #0x00ffff0000ffff\nldr d1, [x8, :lo12:.LCPI0_0]\nmov x8, #1688875630460934 // =0x6000600060006\norr x8, x8, #0x700000007\nsmulh z1.h, z0.h, z1.h\nsshl v1.4h, v1.4h, v2.4h\nfmov d2, x8\nusra v1.4h, v1.4h, #15\nmls v0.4h, v1.4h, v2.4h\nret", |
8286 | 8286 | "giasm": "adrp x8, .LCPI0_1\nldr d1, [x8, :lo12:.LCPI0_1]\nadrp x8, .LCPI0_0\nldr d2, [x8, :lo12:.LCPI0_0]\nadrp x8, .LCPI0_2\nsmull v1.4s, v0.4h, v1.4h\nneg v2.4h, v2.4h\nshrn v1.4h, v1.4s, #16\nsshl v1.4h, v1.4h, v2.4h\nldr d2, [x8, :lo12:.LCPI0_2]\nusra v1.4h, v1.4h, #15\nmls v0.4h, v1.4h, v2.4h\nret", |
8287 | 8287 | "ll": "define <4 x i16> @test(<4 x i16> %a) vscale_range(2, 2){\n %r = srem <4 x i16> %a, <i16 7, i16 6, i16 7, i16 6>\n ret <4 x i16> %r\n}", |
8288 | 8288 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of RThru:18 CodeSize:4 Lat:4 SizeLat:4 for: %r = srem <4 x i16> %a, <i16 7, i16 6, i16 7, i16 6>\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i16> %r" |
@@ -10807,10 +10807,10 @@ |
10807 | 10807 | "thru": 7, |
10808 | 10808 | "lat": 4, |
10809 | 10809 | "sizelat": 4, |
10810 | | - "size": 13, |
| 10810 | + "size": 14, |
10811 | 10811 | "gisize": 14, |
10812 | 10812 | "extrasize": 0, |
10813 | | - "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nmov w8, #128 // =0x80\nindex z2.b, #0, w8\nadrp x8, .LCPI0_1\numulh z1.b, z0.b, z1.b\nadd z2.b, z2.b, #128 // =0x80\nsub v3.8b, v0.8b, v1.8b\numulh z2.b, z3.b, z2.b\nadd v1.8b, v2.8b, v1.8b\nldr d2, [x8, :lo12:.LCPI0_1]\nushr v1.8b, v1.8b, #2\nmls v0.8b, v1.8b, v2.8b\nret", |
| 10813 | + "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nmov w8, #128 // =0x80\nindex z2.b, #0, w8\nmov x8, #434041037028460038 // =0x606060606060606\numulh z1.b, z0.b, z1.b\norr x8, x8, #0x7000700070007\nadd z2.b, z2.b, #128 // =0x80\nsub v3.8b, v0.8b, v1.8b\numulh z2.b, z3.b, z2.b\nadd v1.8b, v2.8b, v1.8b\nfmov d2, x8\nushr v1.8b, v1.8b, #2\nmls v0.8b, v1.8b, v2.8b\nret", |
10814 | 10814 | "giasm": "adrp x8, .LCPI0_1\nldr d1, [x8, :lo12:.LCPI0_1]\nadrp x8, .LCPI0_0\nldr d3, [x8, :lo12:.LCPI0_0]\nadrp x8, .LCPI0_2\numull v1.8h, v0.8b, v1.8b\nshrn v1.8b, v1.8h, #8\nsub v2.8b, v0.8b, v1.8b\numull v2.8h, v2.8b, v3.8b\nshrn v2.8b, v2.8h, #8\nadd v1.8b, v2.8b, v1.8b\nldr d2, [x8, :lo12:.LCPI0_2]\nushr v1.8b, v1.8b, #2\nmls v0.8b, v1.8b, v2.8b\nret", |
10815 | 10815 | "ll": "define <8 x i8> @test(<8 x i8> %a) vscale_range(2, 2){\n %r = urem <8 x i8> %a, <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>\n ret <8 x i8> %r\n}", |
10816 | 10816 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of RThru:7 CodeSize:4 Lat:4 SizeLat:4 for: %r = urem <8 x i8> %a, <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i8> %r" |
@@ -10999,10 +10999,10 @@ |
10999 | 10999 | "thru": 7, |
11000 | 11000 | "lat": 4, |
11001 | 11001 | "sizelat": 4, |
11002 | | - "size": 13, |
| 11002 | + "size": 14, |
11003 | 11003 | "gisize": 14, |
11004 | 11004 | "extrasize": 0, |
11005 | | - "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nmov w8, #32768 // =0x8000\nindex z2.h, #0, w8\nadrp x8, .LCPI0_1\numulh z1.h, z0.h, z1.h\nadd z2.h, z2.h, #32768 // =0x8000\nsub v3.4h, v0.4h, v1.4h\numulh z2.h, z3.h, z2.h\nadd v1.4h, v2.4h, v1.4h\nldr d2, [x8, :lo12:.LCPI0_1]\nushr v1.4h, v1.4h, #2\nmls v0.4h, v1.4h, v2.4h\nret", |
| 11005 | + "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nmov w8, #32768 // =0x8000\nindex z2.h, #0, w8\nmov x8, #1688875630460934 // =0x6000600060006\numulh z1.h, z0.h, z1.h\norr x8, x8, #0x700000007\nadd z2.h, z2.h, #32768 // =0x8000\nsub v3.4h, v0.4h, v1.4h\numulh z2.h, z3.h, z2.h\nadd v1.4h, v2.4h, v1.4h\nfmov d2, x8\nushr v1.4h, v1.4h, #2\nmls v0.4h, v1.4h, v2.4h\nret", |
11006 | 11006 | "giasm": "adrp x8, .LCPI0_1\nldr d1, [x8, :lo12:.LCPI0_1]\nadrp x8, .LCPI0_0\nldr d3, [x8, :lo12:.LCPI0_0]\nadrp x8, .LCPI0_2\numull v1.4s, v0.4h, v1.4h\nshrn v1.4h, v1.4s, #16\nsub v2.4h, v0.4h, v1.4h\numull v2.4s, v2.4h, v3.4h\nshrn v2.4h, v2.4s, #16\nadd v1.4h, v2.4h, v1.4h\nldr d2, [x8, :lo12:.LCPI0_2]\nushr v1.4h, v1.4h, #2\nmls v0.4h, v1.4h, v2.4h\nret", |
11007 | 11007 | "ll": "define <4 x i16> @test(<4 x i16> %a) vscale_range(2, 2){\n %r = urem <4 x i16> %a, <i16 7, i16 6, i16 7, i16 6>\n ret <4 x i16> %r\n}", |
11008 | 11008 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of RThru:7 CodeSize:4 Lat:4 SizeLat:4 for: %r = urem <4 x i16> %a, <i16 7, i16 6, i16 7, i16 6>\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i16> %r" |
@@ -15495,10 +15495,10 @@ |
15495 | 15495 | "thru": 4, |
15496 | 15496 | "lat": 4, |
15497 | 15497 | "sizelat": 4, |
15498 | | - "size": 7, |
| 15498 | + "size": 9, |
15499 | 15499 | "gisize": 8, |
15500 | 15500 | "extrasize": 0, |
15501 | | - "asm": "adrp x8, .LCPI0_0\nadrp x9, .LCPI0_1\nldr d1, [x8, :lo12:.LCPI0_0]\nldr d2, [x9, :lo12:.LCPI0_1]\nushl v1.8b, v0.8b, v1.8b\nushl v0.8b, v0.8b, v2.8b\norr v0.8b, v0.8b, v1.8b\nret", |
| 15501 | + "asm": "mov x8, #144117387132666368 // =0x200020002000200\nmov x9, #-434041037028460039 // =0xf9f9f9f9f9f9f9f9\norr x8, x8, #0x1000100010001\neor x9, x9, #0x300030003000300\nfmov d1, x8\nfmov d2, x9\nushl v1.8b, v0.8b, v1.8b\nushl v0.8b, v0.8b, v2.8b\norr v0.8b, v0.8b, v1.8b\nret", |
15502 | 15502 | "giasm": "adrp x8, .LCPI0_1\nldr d1, [x8, :lo12:.LCPI0_1]\nadrp x8, .LCPI0_0\nldr d2, [x8, :lo12:.LCPI0_0]\nneg v1.8b, v1.8b\nushl v1.8b, v0.8b, v1.8b\nushl v0.8b, v0.8b, v2.8b\norr v0.8b, v1.8b, v0.8b\nret", |
15503 | 15503 | "ll": "define <8 x i8> @test(<8 x i8> %a) vscale_range(2, 2){\n %r = call <8 x i8> @llvm.fshr(<8 x i8> %a, <8 x i8> %a, <8 x i8> <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>)\n ret <8 x i8> %r\n}", |
15504 | 15504 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of 4 for: %r = call <8 x i8> @llvm.fshr.v8i8(<8 x i8> %a, <8 x i8> %a, <8 x i8> <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>)\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i8> %r" |
@@ -15687,10 +15687,10 @@ |
15687 | 15687 | "thru": 4, |
15688 | 15688 | "lat": 4, |
15689 | 15689 | "sizelat": 4, |
15690 | | - "size": 7, |
| 15690 | + "size": 8, |
15691 | 15691 | "gisize": 8, |
15692 | 15692 | "extrasize": 0, |
15693 | | - "asm": "adrp x8, .LCPI0_0\nadrp x9, .LCPI0_1\nldr d1, [x8, :lo12:.LCPI0_0]\nldr d2, [x9, :lo12:.LCPI0_1]\nushl v1.4h, v0.4h, v1.4h\nushl v0.4h, v0.4h, v2.4h\norr v0.8b, v0.8b, v1.8b\nret", |
| 15693 | + "asm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nmov x8, #-1688875630460935 // =0xfff9fff9fff9fff9\neor x8, x8, #0x3000000030000\nfmov d2, x8\nushl v1.4h, v0.4h, v1.4h\nushl v0.4h, v0.4h, v2.4h\norr v0.8b, v0.8b, v1.8b\nret", |
15694 | 15694 | "giasm": "adrp x8, .LCPI0_1\nldr d1, [x8, :lo12:.LCPI0_1]\nadrp x8, .LCPI0_0\nldr d2, [x8, :lo12:.LCPI0_0]\nneg v1.4h, v1.4h\nushl v1.4h, v0.4h, v1.4h\nushl v0.4h, v0.4h, v2.4h\norr v0.8b, v1.8b, v0.8b\nret", |
15695 | 15695 | "ll": "define <4 x i16> @test(<4 x i16> %a) vscale_range(2, 2){\n %r = call <4 x i16> @llvm.fshr(<4 x i16> %a, <4 x i16> %a, <4 x i16> <i16 7, i16 6, i16 7, i16 6>)\n ret <4 x i16> %r\n}", |
15696 | 15696 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of 4 for: %r = call <4 x i16> @llvm.fshr.v4i16(<4 x i16> %a, <4 x i16> %a, <4 x i16> <i16 7, i16 6, i16 7, i16 6>)\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i16> %r" |
@@ -16855,10 +16855,10 @@ |
16855 | 16855 | "thru": 4, |
16856 | 16856 | "lat": 4, |
16857 | 16857 | "sizelat": 4, |
16858 | | - "size": 6, |
| 16858 | + "size": 7, |
16859 | 16859 | "gisize": 8, |
16860 | 16860 | "extrasize": 0, |
16861 | | - "asm": "mvni v1.4h, #1, lsl #8\nadrp x8, .LCPI0_0\nldr d2, [x8, :lo12:.LCPI0_0]\nushl v1.8b, v0.8b, v1.8b\nushl v0.8b, v0.8b, v2.8b\norr v0.8b, v0.8b, v1.8b\nret", |
| 16861 | + "asm": "mov x8, #434041037028460038 // =0x606060606060606\nmvni v1.4h, #1, lsl #8\norr x8, x8, #0x7000700070007\nfmov d2, x8\nushl v1.8b, v0.8b, v1.8b\nushl v0.8b, v0.8b, v2.8b\norr v0.8b, v0.8b, v1.8b\nret", |
16862 | 16862 | "giasm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nadrp x8, .LCPI0_1\nldr d2, [x8, :lo12:.LCPI0_1]\nneg v1.8b, v1.8b\nushl v2.8b, v0.8b, v2.8b\nushl v0.8b, v0.8b, v1.8b\norr v0.8b, v2.8b, v0.8b\nret", |
16863 | 16863 | "ll": "define <8 x i8> @test(<8 x i8> %a) vscale_range(2, 2){\n %r = call <8 x i8> @llvm.fshl(<8 x i8> %a, <8 x i8> %a, <8 x i8> <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>)\n ret <8 x i8> %r\n}", |
16864 | 16864 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of 4 for: %r = call <8 x i8> @llvm.fshl.v8i8(<8 x i8> %a, <8 x i8> %a, <8 x i8> <i8 7, i8 6, i8 7, i8 6, i8 7, i8 6, i8 7, i8 6>)\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <8 x i8> %r" |
@@ -17047,10 +17047,10 @@ |
17047 | 17047 | "thru": 4, |
17048 | 17048 | "lat": 4, |
17049 | 17049 | "sizelat": 4, |
17050 | | - "size": 7, |
| 17050 | + "size": 9, |
17051 | 17051 | "gisize": 8, |
17052 | 17052 | "extrasize": 0, |
17053 | | - "asm": "adrp x8, .LCPI0_0\nadrp x9, .LCPI0_1\nldr d1, [x8, :lo12:.LCPI0_0]\nldr d2, [x9, :lo12:.LCPI0_1]\nushl v1.4h, v0.4h, v1.4h\nushl v0.4h, v0.4h, v2.4h\norr v0.8b, v0.8b, v1.8b\nret", |
| 17053 | + "asm": "mov x8, #-2251834173947913 // =0xfff7fff7fff7fff7\nmov x9, #1688875630460934 // =0x6000600060006\nand x8, x8, #0xfffefffffffeffff\norr x9, x9, #0x700000007\nfmov d1, x8\nfmov d2, x9\nushl v1.4h, v0.4h, v1.4h\nushl v0.4h, v0.4h, v2.4h\norr v0.8b, v0.8b, v1.8b\nret", |
17054 | 17054 | "giasm": "adrp x8, .LCPI0_0\nldr d1, [x8, :lo12:.LCPI0_0]\nadrp x8, .LCPI0_1\nldr d2, [x8, :lo12:.LCPI0_1]\nneg v1.4h, v1.4h\nushl v2.4h, v0.4h, v2.4h\nushl v0.4h, v0.4h, v1.4h\norr v0.8b, v2.8b, v0.8b\nret", |
17055 | 17055 | "ll": "define <4 x i16> @test(<4 x i16> %a) vscale_range(2, 2){\n %r = call <4 x i16> @llvm.fshl(<4 x i16> %a, <4 x i16> %a, <4 x i16> <i16 7, i16 6, i16 7, i16 6>)\n ret <4 x i16> %r\n}", |
17056 | 17056 | "costoutput": "Printing analysis 'Cost Model Analysis' for function 'test':\nCost Model: Found costs of 4 for: %r = call <4 x i16> @llvm.fshl.v4i16(<4 x i16> %a, <4 x i16> %a, <4 x i16> <i16 7, i16 6, i16 7, i16 6>)\nCost Model: Found costs of RThru:0 CodeSize:1 Lat:1 SizeLat:1 for: ret <4 x i16> %r" |
|
0 commit comments