@@ -18,8 +18,8 @@ define <2 x float> @test_ret_const() #0 {
18
18
; CHECK-NEXT: .reg .f32 %f<3>;
19
19
; CHECK-EMPTY:
20
20
; CHECK-NEXT: // %bb.0:
21
- ; CHECK-NEXT: mov.f32 %f1, 0f40000000;
22
- ; CHECK-NEXT: mov.f32 %f2, 0f3F800000;
21
+ ; CHECK-NEXT: mov.b32 %f1, 0f40000000;
22
+ ; CHECK-NEXT: mov.b32 %f2, 0f3F800000;
23
23
; CHECK-NEXT: st.param.v2.f32 [func_retval0], {%f2, %f1};
24
24
; CHECK-NEXT: ret;
25
25
ret <2 x float > <float 1 .0 , float 2 .0 >
@@ -86,8 +86,8 @@ define <2 x float> @test_fadd_imm_0(<2 x float> %a) #0 {
86
86
; CHECK-EMPTY:
87
87
; CHECK-NEXT: // %bb.0:
88
88
; CHECK-NEXT: ld.param.b64 %rd1, [test_fadd_imm_0_param_0];
89
- ; CHECK-NEXT: mov.f32 %f1, 0f40000000;
90
- ; CHECK-NEXT: mov.f32 %f2, 0f3F800000;
89
+ ; CHECK-NEXT: mov.b32 %f1, 0f40000000;
90
+ ; CHECK-NEXT: mov.b32 %f2, 0f3F800000;
91
91
; CHECK-NEXT: mov.b64 %rd2, {%f2, %f1};
92
92
; CHECK-NEXT: add.rn.f32x2 %rd3, %rd1, %rd2;
93
93
; CHECK-NEXT: st.param.b64 [func_retval0], %rd3;
@@ -104,8 +104,8 @@ define <2 x float> @test_fadd_imm_1(<2 x float> %a) #0 {
104
104
; CHECK-EMPTY:
105
105
; CHECK-NEXT: // %bb.0:
106
106
; CHECK-NEXT: ld.param.b64 %rd1, [test_fadd_imm_1_param_0];
107
- ; CHECK-NEXT: mov.f32 %f1, 0f40000000;
108
- ; CHECK-NEXT: mov.f32 %f2, 0f3F800000;
107
+ ; CHECK-NEXT: mov.b32 %f1, 0f40000000;
108
+ ; CHECK-NEXT: mov.b32 %f2, 0f3F800000;
109
109
; CHECK-NEXT: mov.b64 %rd2, {%f2, %f1};
110
110
; CHECK-NEXT: add.rn.f32x2 %rd3, %rd1, %rd2;
111
111
; CHECK-NEXT: st.param.b64 [func_retval0], %rd3;
@@ -138,12 +138,12 @@ define <4 x float> @test_fadd_imm_0_v4(<4 x float> %a) #0 {
138
138
; CHECK-EMPTY:
139
139
; CHECK-NEXT: // %bb.0:
140
140
; CHECK-NEXT: ld.param.v2.b64 {%rd1, %rd2}, [test_fadd_imm_0_v4_param_0];
141
- ; CHECK-NEXT: mov.f32 %f1, 0f40800000;
142
- ; CHECK-NEXT: mov.f32 %f2, 0f40400000;
141
+ ; CHECK-NEXT: mov.b32 %f1, 0f40800000;
142
+ ; CHECK-NEXT: mov.b32 %f2, 0f40400000;
143
143
; CHECK-NEXT: mov.b64 %rd3, {%f2, %f1};
144
144
; CHECK-NEXT: add.rn.f32x2 %rd4, %rd2, %rd3;
145
- ; CHECK-NEXT: mov.f32 %f3, 0f40000000;
146
- ; CHECK-NEXT: mov.f32 %f4, 0f3F800000;
145
+ ; CHECK-NEXT: mov.b32 %f3, 0f40000000;
146
+ ; CHECK-NEXT: mov.b32 %f4, 0f3F800000;
147
147
; CHECK-NEXT: mov.b64 %rd5, {%f4, %f3};
148
148
; CHECK-NEXT: add.rn.f32x2 %rd6, %rd1, %rd5;
149
149
; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd6, %rd4};
@@ -160,12 +160,12 @@ define <4 x float> @test_fadd_imm_1_v4(<4 x float> %a) #0 {
160
160
; CHECK-EMPTY:
161
161
; CHECK-NEXT: // %bb.0:
162
162
; CHECK-NEXT: ld.param.v2.b64 {%rd1, %rd2}, [test_fadd_imm_1_v4_param_0];
163
- ; CHECK-NEXT: mov.f32 %f1, 0f40800000;
164
- ; CHECK-NEXT: mov.f32 %f2, 0f40400000;
163
+ ; CHECK-NEXT: mov.b32 %f1, 0f40800000;
164
+ ; CHECK-NEXT: mov.b32 %f2, 0f40400000;
165
165
; CHECK-NEXT: mov.b64 %rd3, {%f2, %f1};
166
166
; CHECK-NEXT: add.rn.f32x2 %rd4, %rd2, %rd3;
167
- ; CHECK-NEXT: mov.f32 %f3, 0f40000000;
168
- ; CHECK-NEXT: mov.f32 %f4, 0f3F800000;
167
+ ; CHECK-NEXT: mov.b32 %f3, 0f40000000;
168
+ ; CHECK-NEXT: mov.b32 %f4, 0f3F800000;
169
169
; CHECK-NEXT: mov.b64 %rd5, {%f4, %f3};
170
170
; CHECK-NEXT: add.rn.f32x2 %rd6, %rd1, %rd5;
171
171
; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd6, %rd4};
@@ -197,7 +197,7 @@ define <2 x float> @test_fneg(<2 x float> %a) #0 {
197
197
; CHECK-EMPTY:
198
198
; CHECK-NEXT: // %bb.0:
199
199
; CHECK-NEXT: ld.param.b64 %rd1, [test_fneg_param_0];
200
- ; CHECK-NEXT: mov.f32 %f1, 0f00000000;
200
+ ; CHECK-NEXT: mov.b32 %f1, 0f00000000;
201
201
; CHECK-NEXT: mov.b64 %rd2, {%f1, %f1};
202
202
; CHECK-NEXT: sub.rn.f32x2 %rd3, %rd2, %rd1;
203
203
; CHECK-NEXT: st.param.b64 [func_retval0], %rd3;
@@ -270,14 +270,14 @@ define <2 x float> @test_frem(<2 x float> %a, <2 x float> %b) #0 {
270
270
; CHECK-NEXT: mov.b64 {%f3, %f4}, %rd1;
271
271
; CHECK-NEXT: div.rn.f32 %f5, %f4, %f2;
272
272
; CHECK-NEXT: cvt.rzi.f32.f32 %f6, %f5;
273
- ; CHECK-NEXT: mul .f32 %f7, %f6, %f2 ;
274
- ; CHECK-NEXT: sub. f32 %f8, %f4 , %f7 ;
273
+ ; CHECK-NEXT: neg .f32 %f7, %f6;
274
+ ; CHECK-NEXT: fma.rn. f32 %f8, %f7 , %f2, %f4 ;
275
275
; CHECK-NEXT: testp.infinite.f32 %p1, %f2;
276
276
; CHECK-NEXT: selp.f32 %f9, %f4, %f8, %p1;
277
277
; CHECK-NEXT: div.rn.f32 %f10, %f3, %f1;
278
278
; CHECK-NEXT: cvt.rzi.f32.f32 %f11, %f10;
279
- ; CHECK-NEXT: mul .f32 %f12, %f11, %f1 ;
280
- ; CHECK-NEXT: sub. f32 %f13, %f3 , %f12 ;
279
+ ; CHECK-NEXT: neg .f32 %f12, %f11;
280
+ ; CHECK-NEXT: fma.rn. f32 %f13, %f12 , %f1, %f3 ;
281
281
; CHECK-NEXT: testp.infinite.f32 %p2, %f1;
282
282
; CHECK-NEXT: selp.f32 %f14, %f3, %f13, %p2;
283
283
; CHECK-NEXT: st.param.v2.f32 [func_retval0], {%f14, %f9};
@@ -309,8 +309,8 @@ define <2 x float> @test_fadd_imm_0_ftz(<2 x float> %a) #2 {
309
309
; CHECK-EMPTY:
310
310
; CHECK-NEXT: // %bb.0:
311
311
; CHECK-NEXT: ld.param.b64 %rd1, [test_fadd_imm_0_ftz_param_0];
312
- ; CHECK-NEXT: mov.f32 %f1, 0f40000000;
313
- ; CHECK-NEXT: mov.f32 %f2, 0f3F800000;
312
+ ; CHECK-NEXT: mov.b32 %f1, 0f40000000;
313
+ ; CHECK-NEXT: mov.b32 %f2, 0f3F800000;
314
314
; CHECK-NEXT: mov.b64 %rd2, {%f2, %f1};
315
315
; CHECK-NEXT: add.rn.ftz.f32x2 %rd3, %rd1, %rd2;
316
316
; CHECK-NEXT: st.param.b64 [func_retval0], %rd3;
@@ -327,8 +327,8 @@ define <2 x float> @test_fadd_imm_1_ftz(<2 x float> %a) #2 {
327
327
; CHECK-EMPTY:
328
328
; CHECK-NEXT: // %bb.0:
329
329
; CHECK-NEXT: ld.param.b64 %rd1, [test_fadd_imm_1_ftz_param_0];
330
- ; CHECK-NEXT: mov.f32 %f1, 0f40000000;
331
- ; CHECK-NEXT: mov.f32 %f2, 0f3F800000;
330
+ ; CHECK-NEXT: mov.b32 %f1, 0f40000000;
331
+ ; CHECK-NEXT: mov.b32 %f2, 0f3F800000;
332
332
; CHECK-NEXT: mov.b64 %rd2, {%f2, %f1};
333
333
; CHECK-NEXT: add.rn.ftz.f32x2 %rd3, %rd1, %rd2;
334
334
; CHECK-NEXT: st.param.b64 [func_retval0], %rd3;
@@ -361,12 +361,12 @@ define <4 x float> @test_fadd_imm_0_v4_ftz(<4 x float> %a) #2 {
361
361
; CHECK-EMPTY:
362
362
; CHECK-NEXT: // %bb.0:
363
363
; CHECK-NEXT: ld.param.v2.b64 {%rd1, %rd2}, [test_fadd_imm_0_v4_ftz_param_0];
364
- ; CHECK-NEXT: mov.f32 %f1, 0f40800000;
365
- ; CHECK-NEXT: mov.f32 %f2, 0f40400000;
364
+ ; CHECK-NEXT: mov.b32 %f1, 0f40800000;
365
+ ; CHECK-NEXT: mov.b32 %f2, 0f40400000;
366
366
; CHECK-NEXT: mov.b64 %rd3, {%f2, %f1};
367
367
; CHECK-NEXT: add.rn.ftz.f32x2 %rd4, %rd2, %rd3;
368
- ; CHECK-NEXT: mov.f32 %f3, 0f40000000;
369
- ; CHECK-NEXT: mov.f32 %f4, 0f3F800000;
368
+ ; CHECK-NEXT: mov.b32 %f3, 0f40000000;
369
+ ; CHECK-NEXT: mov.b32 %f4, 0f3F800000;
370
370
; CHECK-NEXT: mov.b64 %rd5, {%f4, %f3};
371
371
; CHECK-NEXT: add.rn.ftz.f32x2 %rd6, %rd1, %rd5;
372
372
; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd6, %rd4};
@@ -383,12 +383,12 @@ define <4 x float> @test_fadd_imm_1_v4_ftz(<4 x float> %a) #2 {
383
383
; CHECK-EMPTY:
384
384
; CHECK-NEXT: // %bb.0:
385
385
; CHECK-NEXT: ld.param.v2.b64 {%rd1, %rd2}, [test_fadd_imm_1_v4_ftz_param_0];
386
- ; CHECK-NEXT: mov.f32 %f1, 0f40800000;
387
- ; CHECK-NEXT: mov.f32 %f2, 0f40400000;
386
+ ; CHECK-NEXT: mov.b32 %f1, 0f40800000;
387
+ ; CHECK-NEXT: mov.b32 %f2, 0f40400000;
388
388
; CHECK-NEXT: mov.b64 %rd3, {%f2, %f1};
389
389
; CHECK-NEXT: add.rn.ftz.f32x2 %rd4, %rd2, %rd3;
390
- ; CHECK-NEXT: mov.f32 %f3, 0f40000000;
391
- ; CHECK-NEXT: mov.f32 %f4, 0f3F800000;
390
+ ; CHECK-NEXT: mov.b32 %f3, 0f40000000;
391
+ ; CHECK-NEXT: mov.b32 %f4, 0f3F800000;
392
392
; CHECK-NEXT: mov.b64 %rd5, {%f4, %f3};
393
393
; CHECK-NEXT: add.rn.ftz.f32x2 %rd6, %rd1, %rd5;
394
394
; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd6, %rd4};
@@ -420,7 +420,7 @@ define <2 x float> @test_fneg_ftz(<2 x float> %a) #2 {
420
420
; CHECK-EMPTY:
421
421
; CHECK-NEXT: // %bb.0:
422
422
; CHECK-NEXT: ld.param.b64 %rd1, [test_fneg_ftz_param_0];
423
- ; CHECK-NEXT: mov.f32 %f1, 0f00000000;
423
+ ; CHECK-NEXT: mov.b32 %f1, 0f00000000;
424
424
; CHECK-NEXT: mov.b64 %rd2, {%f1, %f1};
425
425
; CHECK-NEXT: sub.rn.ftz.f32x2 %rd3, %rd2, %rd1;
426
426
; CHECK-NEXT: st.param.b64 [func_retval0], %rd3;
@@ -493,14 +493,14 @@ define <2 x float> @test_frem_ftz(<2 x float> %a, <2 x float> %b) #2 {
493
493
; CHECK-NEXT: mov.b64 {%f3, %f4}, %rd1;
494
494
; CHECK-NEXT: div.rn.ftz.f32 %f5, %f4, %f2;
495
495
; CHECK-NEXT: cvt.rzi.ftz.f32.f32 %f6, %f5;
496
- ; CHECK-NEXT: mul .ftz.f32 %f7, %f6, %f2 ;
497
- ; CHECK-NEXT: sub. ftz.f32 %f8, %f4 , %f7 ;
496
+ ; CHECK-NEXT: neg .ftz.f32 %f7, %f6;
497
+ ; CHECK-NEXT: fma.rn. ftz.f32 %f8, %f7 , %f2, %f4 ;
498
498
; CHECK-NEXT: testp.infinite.f32 %p1, %f2;
499
499
; CHECK-NEXT: selp.f32 %f9, %f4, %f8, %p1;
500
500
; CHECK-NEXT: div.rn.ftz.f32 %f10, %f3, %f1;
501
501
; CHECK-NEXT: cvt.rzi.ftz.f32.f32 %f11, %f10;
502
- ; CHECK-NEXT: mul .ftz.f32 %f12, %f11, %f1 ;
503
- ; CHECK-NEXT: sub. ftz.f32 %f13, %f3 , %f12 ;
502
+ ; CHECK-NEXT: neg .ftz.f32 %f12, %f11;
503
+ ; CHECK-NEXT: fma.rn. ftz.f32 %f13, %f12 , %f1, %f3 ;
504
504
; CHECK-NEXT: testp.infinite.f32 %p2, %f1;
505
505
; CHECK-NEXT: selp.f32 %f14, %f3, %f13, %p2;
506
506
; CHECK-NEXT: st.param.v2.f32 [func_retval0], {%f14, %f9};
0 commit comments