@@ -117,14 +117,14 @@ define <2 x float> @test_fadd_imm_1(<2 x float> %a) #0 {
117
117
define <4 x float > @test_fadd_v4 (<4 x float > %a , <4 x float > %b ) #0 {
118
118
; CHECK-LABEL: test_fadd_v4(
119
119
; CHECK: {
120
- ; CHECK-NEXT: .reg .b64 %rd<11 >;
120
+ ; CHECK-NEXT: .reg .b64 %rd<7 >;
121
121
; CHECK-EMPTY:
122
122
; CHECK-NEXT: // %bb.0:
123
- ; CHECK-NEXT: ld.param.v2.u64 {%rd5 , %rd6 }, [test_fadd_v4_param_1];
124
- ; CHECK-NEXT: ld.param.v2.u64 {%rd7 , %rd8 }, [test_fadd_v4_param_0];
125
- ; CHECK-NEXT: add.rn.f32x2 %rd9 , %rd8 , %rd6 ;
126
- ; CHECK-NEXT: add.rn.f32x2 %rd10 , %rd7 , %rd5 ;
127
- ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd10 , %rd9 };
123
+ ; CHECK-NEXT: ld.param.v2.b64 {%rd3 , %rd4 }, [test_fadd_v4_param_1];
124
+ ; CHECK-NEXT: ld.param.v2.b64 {%rd1 , %rd2 }, [test_fadd_v4_param_0];
125
+ ; CHECK-NEXT: add.rn.f32x2 %rd5 , %rd2 , %rd4 ;
126
+ ; CHECK-NEXT: add.rn.f32x2 %rd6 , %rd1 , %rd3 ;
127
+ ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd6 , %rd5 };
128
128
; CHECK-NEXT: ret;
129
129
%r = fadd <4 x float > %a , %b
130
130
ret <4 x float > %r
@@ -134,19 +134,19 @@ define <4 x float> @test_fadd_imm_0_v4(<4 x float> %a) #0 {
134
134
; CHECK-LABEL: test_fadd_imm_0_v4(
135
135
; CHECK: {
136
136
; CHECK-NEXT: .reg .f32 %f<5>;
137
- ; CHECK-NEXT: .reg .b64 %rd<9 >;
137
+ ; CHECK-NEXT: .reg .b64 %rd<7 >;
138
138
; CHECK-EMPTY:
139
139
; CHECK-NEXT: // %bb.0:
140
- ; CHECK-NEXT: ld.param.v2.u64 {%rd3 , %rd4 }, [test_fadd_imm_0_v4_param_0];
140
+ ; CHECK-NEXT: ld.param.v2.b64 {%rd1 , %rd2 }, [test_fadd_imm_0_v4_param_0];
141
141
; CHECK-NEXT: mov.f32 %f1, 0f40800000;
142
142
; CHECK-NEXT: mov.f32 %f2, 0f40400000;
143
- ; CHECK-NEXT: mov.b64 %rd5 , {%f2, %f1};
144
- ; CHECK-NEXT: add.rn.f32x2 %rd6 , %rd4 , %rd5 ;
143
+ ; CHECK-NEXT: mov.b64 %rd3 , {%f2, %f1};
144
+ ; CHECK-NEXT: add.rn.f32x2 %rd4 , %rd2 , %rd3 ;
145
145
; CHECK-NEXT: mov.f32 %f3, 0f40000000;
146
146
; CHECK-NEXT: mov.f32 %f4, 0f3F800000;
147
- ; CHECK-NEXT: mov.b64 %rd7 , {%f4, %f3};
148
- ; CHECK-NEXT: add.rn.f32x2 %rd8 , %rd3 , %rd7 ;
149
- ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd8 , %rd6 };
147
+ ; CHECK-NEXT: mov.b64 %rd5 , {%f4, %f3};
148
+ ; CHECK-NEXT: add.rn.f32x2 %rd6 , %rd1 , %rd5 ;
149
+ ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd6 , %rd4 };
150
150
; CHECK-NEXT: ret;
151
151
%r = fadd <4 x float > <float 1 .0 , float 2 .0 , float 3 .0 , float 4 .0 >, %a
152
152
ret <4 x float > %r
@@ -156,19 +156,19 @@ define <4 x float> @test_fadd_imm_1_v4(<4 x float> %a) #0 {
156
156
; CHECK-LABEL: test_fadd_imm_1_v4(
157
157
; CHECK: {
158
158
; CHECK-NEXT: .reg .f32 %f<5>;
159
- ; CHECK-NEXT: .reg .b64 %rd<9 >;
159
+ ; CHECK-NEXT: .reg .b64 %rd<7 >;
160
160
; CHECK-EMPTY:
161
161
; CHECK-NEXT: // %bb.0:
162
- ; CHECK-NEXT: ld.param.v2.u64 {%rd3 , %rd4 }, [test_fadd_imm_1_v4_param_0];
162
+ ; CHECK-NEXT: ld.param.v2.b64 {%rd1 , %rd2 }, [test_fadd_imm_1_v4_param_0];
163
163
; CHECK-NEXT: mov.f32 %f1, 0f40800000;
164
164
; CHECK-NEXT: mov.f32 %f2, 0f40400000;
165
- ; CHECK-NEXT: mov.b64 %rd5 , {%f2, %f1};
166
- ; CHECK-NEXT: add.rn.f32x2 %rd6 , %rd4 , %rd5 ;
165
+ ; CHECK-NEXT: mov.b64 %rd3 , {%f2, %f1};
166
+ ; CHECK-NEXT: add.rn.f32x2 %rd4 , %rd2 , %rd3 ;
167
167
; CHECK-NEXT: mov.f32 %f3, 0f40000000;
168
168
; CHECK-NEXT: mov.f32 %f4, 0f3F800000;
169
- ; CHECK-NEXT: mov.b64 %rd7 , {%f4, %f3};
170
- ; CHECK-NEXT: add.rn.f32x2 %rd8 , %rd3 , %rd7 ;
171
- ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd8 , %rd6 };
169
+ ; CHECK-NEXT: mov.b64 %rd5 , {%f4, %f3};
170
+ ; CHECK-NEXT: add.rn.f32x2 %rd6 , %rd1 , %rd5 ;
171
+ ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd6 , %rd4 };
172
172
; CHECK-NEXT: ret;
173
173
%r = fadd <4 x float > %a , <float 1 .0 , float 2 .0 , float 3 .0 , float 4 .0 >
174
174
ret <4 x float > %r
@@ -340,14 +340,14 @@ define <2 x float> @test_fadd_imm_1_ftz(<2 x float> %a) #2 {
340
340
define <4 x float > @test_fadd_v4_ftz (<4 x float > %a , <4 x float > %b ) #2 {
341
341
; CHECK-LABEL: test_fadd_v4_ftz(
342
342
; CHECK: {
343
- ; CHECK-NEXT: .reg .b64 %rd<11 >;
343
+ ; CHECK-NEXT: .reg .b64 %rd<7 >;
344
344
; CHECK-EMPTY:
345
345
; CHECK-NEXT: // %bb.0:
346
- ; CHECK-NEXT: ld.param.v2.u64 {%rd5 , %rd6 }, [test_fadd_v4_ftz_param_1];
347
- ; CHECK-NEXT: ld.param.v2.u64 {%rd7 , %rd8 }, [test_fadd_v4_ftz_param_0];
348
- ; CHECK-NEXT: add.rn.ftz.f32x2 %rd9 , %rd8 , %rd6 ;
349
- ; CHECK-NEXT: add.rn.ftz.f32x2 %rd10 , %rd7 , %rd5 ;
350
- ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd10 , %rd9 };
346
+ ; CHECK-NEXT: ld.param.v2.b64 {%rd3 , %rd4 }, [test_fadd_v4_ftz_param_1];
347
+ ; CHECK-NEXT: ld.param.v2.b64 {%rd1 , %rd2 }, [test_fadd_v4_ftz_param_0];
348
+ ; CHECK-NEXT: add.rn.ftz.f32x2 %rd5 , %rd2 , %rd4 ;
349
+ ; CHECK-NEXT: add.rn.ftz.f32x2 %rd6 , %rd1 , %rd3 ;
350
+ ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd6 , %rd5 };
351
351
; CHECK-NEXT: ret;
352
352
%r = fadd <4 x float > %a , %b
353
353
ret <4 x float > %r
@@ -357,19 +357,19 @@ define <4 x float> @test_fadd_imm_0_v4_ftz(<4 x float> %a) #2 {
357
357
; CHECK-LABEL: test_fadd_imm_0_v4_ftz(
358
358
; CHECK: {
359
359
; CHECK-NEXT: .reg .f32 %f<5>;
360
- ; CHECK-NEXT: .reg .b64 %rd<9 >;
360
+ ; CHECK-NEXT: .reg .b64 %rd<7 >;
361
361
; CHECK-EMPTY:
362
362
; CHECK-NEXT: // %bb.0:
363
- ; CHECK-NEXT: ld.param.v2.u64 {%rd3 , %rd4 }, [test_fadd_imm_0_v4_ftz_param_0];
363
+ ; CHECK-NEXT: ld.param.v2.b64 {%rd1 , %rd2 }, [test_fadd_imm_0_v4_ftz_param_0];
364
364
; CHECK-NEXT: mov.f32 %f1, 0f40800000;
365
365
; CHECK-NEXT: mov.f32 %f2, 0f40400000;
366
- ; CHECK-NEXT: mov.b64 %rd5 , {%f2, %f1};
367
- ; CHECK-NEXT: add.rn.ftz.f32x2 %rd6 , %rd4 , %rd5 ;
366
+ ; CHECK-NEXT: mov.b64 %rd3 , {%f2, %f1};
367
+ ; CHECK-NEXT: add.rn.ftz.f32x2 %rd4 , %rd2 , %rd3 ;
368
368
; CHECK-NEXT: mov.f32 %f3, 0f40000000;
369
369
; CHECK-NEXT: mov.f32 %f4, 0f3F800000;
370
- ; CHECK-NEXT: mov.b64 %rd7 , {%f4, %f3};
371
- ; CHECK-NEXT: add.rn.ftz.f32x2 %rd8 , %rd3 , %rd7 ;
372
- ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd8 , %rd6 };
370
+ ; CHECK-NEXT: mov.b64 %rd5 , {%f4, %f3};
371
+ ; CHECK-NEXT: add.rn.ftz.f32x2 %rd6 , %rd1 , %rd5 ;
372
+ ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd6 , %rd4 };
373
373
; CHECK-NEXT: ret;
374
374
%r = fadd <4 x float > <float 1 .0 , float 2 .0 , float 3 .0 , float 4 .0 >, %a
375
375
ret <4 x float > %r
@@ -379,19 +379,19 @@ define <4 x float> @test_fadd_imm_1_v4_ftz(<4 x float> %a) #2 {
379
379
; CHECK-LABEL: test_fadd_imm_1_v4_ftz(
380
380
; CHECK: {
381
381
; CHECK-NEXT: .reg .f32 %f<5>;
382
- ; CHECK-NEXT: .reg .b64 %rd<9 >;
382
+ ; CHECK-NEXT: .reg .b64 %rd<7 >;
383
383
; CHECK-EMPTY:
384
384
; CHECK-NEXT: // %bb.0:
385
- ; CHECK-NEXT: ld.param.v2.u64 {%rd3 , %rd4 }, [test_fadd_imm_1_v4_ftz_param_0];
385
+ ; CHECK-NEXT: ld.param.v2.b64 {%rd1 , %rd2 }, [test_fadd_imm_1_v4_ftz_param_0];
386
386
; CHECK-NEXT: mov.f32 %f1, 0f40800000;
387
387
; CHECK-NEXT: mov.f32 %f2, 0f40400000;
388
- ; CHECK-NEXT: mov.b64 %rd5 , {%f2, %f1};
389
- ; CHECK-NEXT: add.rn.ftz.f32x2 %rd6 , %rd4 , %rd5 ;
388
+ ; CHECK-NEXT: mov.b64 %rd3 , {%f2, %f1};
389
+ ; CHECK-NEXT: add.rn.ftz.f32x2 %rd4 , %rd2 , %rd3 ;
390
390
; CHECK-NEXT: mov.f32 %f3, 0f40000000;
391
391
; CHECK-NEXT: mov.f32 %f4, 0f3F800000;
392
- ; CHECK-NEXT: mov.b64 %rd7 , {%f4, %f3};
393
- ; CHECK-NEXT: add.rn.ftz.f32x2 %rd8 , %rd3 , %rd7 ;
394
- ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd8 , %rd6 };
392
+ ; CHECK-NEXT: mov.b64 %rd5 , {%f4, %f3};
393
+ ; CHECK-NEXT: add.rn.ftz.f32x2 %rd6 , %rd1 , %rd5 ;
394
+ ; CHECK-NEXT: st.param.v2.b64 [func_retval0], {%rd6 , %rd4 };
395
395
; CHECK-NEXT: ret;
396
396
%r = fadd <4 x float > %a , <float 1 .0 , float 2 .0 , float 3 .0 , float 4 .0 >
397
397
ret <4 x float > %r
0 commit comments