1 | //===------- LegalizeVectorTypes.cpp - Legalization of vector types -------===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // This file performs vector type splitting and scalarization for LegalizeTypes. |
10 | // Scalarization is the act of changing a computation in an illegal one-element |
11 | // vector type to be a computation in its scalar element type. For example, |
12 | // implementing <1 x f32> arithmetic in a scalar f32 register. This is needed |
13 | // as a base case when scalarizing vector arithmetic like <4 x f32>, which |
14 | // eventually decomposes to scalars if the target doesn't support v4f32 or v2f32 |
15 | // types. |
16 | // Splitting is the act of changing a computation in an invalid vector type to |
17 | // be a computation in two vectors of half the size. For example, implementing |
18 | // <128 x f32> operations in terms of two <64 x f32> operations. |
19 | // |
20 | //===----------------------------------------------------------------------===// |
21 | |
22 | #include "LegalizeTypes.h" |
23 | #include "llvm/ADT/SmallBitVector.h" |
24 | #include "llvm/Analysis/MemoryLocation.h" |
25 | #include "llvm/Analysis/VectorUtils.h" |
26 | #include "llvm/IR/DataLayout.h" |
27 | #include "llvm/Support/ErrorHandling.h" |
28 | #include "llvm/Support/TypeSize.h" |
29 | #include "llvm/Support/raw_ostream.h" |
30 | #include <numeric> |
31 | |
32 | using namespace llvm; |
33 | |
34 | #define DEBUG_TYPE "legalize-types" |
35 | |
36 | //===----------------------------------------------------------------------===// |
37 | // Result Vector Scalarization: <1 x ty> -> ty. |
38 | //===----------------------------------------------------------------------===// |
39 | |
40 | void DAGTypeLegalizer::ScalarizeVectorResult(SDNode *N, unsigned ResNo) { |
41 | LLVM_DEBUG(dbgs() << "Scalarize node result " << ResNo << ": " ; |
42 | N->dump(&DAG)); |
43 | SDValue R = SDValue(); |
44 | |
45 | switch (N->getOpcode()) { |
46 | default: |
47 | #ifndef NDEBUG |
48 | dbgs() << "ScalarizeVectorResult #" << ResNo << ": " ; |
49 | N->dump(G: &DAG); |
50 | dbgs() << "\n" ; |
51 | #endif |
52 | report_fatal_error(reason: "Do not know how to scalarize the result of this " |
53 | "operator!\n" ); |
54 | |
55 | case ISD::MERGE_VALUES: R = ScalarizeVecRes_MERGE_VALUES(N, ResNo);break; |
56 | case ISD::BITCAST: R = ScalarizeVecRes_BITCAST(N); break; |
57 | case ISD::BUILD_VECTOR: R = ScalarizeVecRes_BUILD_VECTOR(N); break; |
58 | case ISD::EXTRACT_SUBVECTOR: R = ScalarizeVecRes_EXTRACT_SUBVECTOR(N); break; |
59 | case ISD::FP_ROUND: R = ScalarizeVecRes_FP_ROUND(N); break; |
60 | case ISD::FPOWI: R = ScalarizeVecRes_ExpOp(N); break; |
61 | case ISD::INSERT_VECTOR_ELT: R = ScalarizeVecRes_INSERT_VECTOR_ELT(N); break; |
62 | case ISD::LOAD: R = ScalarizeVecRes_LOAD(N: cast<LoadSDNode>(Val: N));break; |
63 | case ISD::SCALAR_TO_VECTOR: R = ScalarizeVecRes_SCALAR_TO_VECTOR(N); break; |
64 | case ISD::SIGN_EXTEND_INREG: R = ScalarizeVecRes_InregOp(N); break; |
65 | case ISD::VSELECT: R = ScalarizeVecRes_VSELECT(N); break; |
66 | case ISD::SELECT: R = ScalarizeVecRes_SELECT(N); break; |
67 | case ISD::SELECT_CC: R = ScalarizeVecRes_SELECT_CC(N); break; |
68 | case ISD::SETCC: R = ScalarizeVecRes_SETCC(N); break; |
69 | case ISD::UNDEF: R = ScalarizeVecRes_UNDEF(N); break; |
70 | case ISD::VECTOR_SHUFFLE: R = ScalarizeVecRes_VECTOR_SHUFFLE(N); break; |
71 | case ISD::IS_FPCLASS: R = ScalarizeVecRes_IS_FPCLASS(N); break; |
72 | case ISD::ANY_EXTEND_VECTOR_INREG: |
73 | case ISD::SIGN_EXTEND_VECTOR_INREG: |
74 | case ISD::ZERO_EXTEND_VECTOR_INREG: |
75 | R = ScalarizeVecRes_VecInregOp(N); |
76 | break; |
77 | case ISD::ABS: |
78 | case ISD::ANY_EXTEND: |
79 | case ISD::BITREVERSE: |
80 | case ISD::BSWAP: |
81 | case ISD::CTLZ: |
82 | case ISD::CTLZ_ZERO_UNDEF: |
83 | case ISD::CTPOP: |
84 | case ISD::CTTZ: |
85 | case ISD::CTTZ_ZERO_UNDEF: |
86 | case ISD::FABS: |
87 | case ISD::FCEIL: |
88 | case ISD::FCOS: |
89 | case ISD::FEXP: |
90 | case ISD::FEXP2: |
91 | case ISD::FEXP10: |
92 | case ISD::FFLOOR: |
93 | case ISD::FLOG: |
94 | case ISD::FLOG10: |
95 | case ISD::FLOG2: |
96 | case ISD::FNEARBYINT: |
97 | case ISD::FNEG: |
98 | case ISD::FREEZE: |
99 | case ISD::ARITH_FENCE: |
100 | case ISD::FP_EXTEND: |
101 | case ISD::FP_TO_SINT: |
102 | case ISD::FP_TO_UINT: |
103 | case ISD::FRINT: |
104 | case ISD::LRINT: |
105 | case ISD::LLRINT: |
106 | case ISD::FROUND: |
107 | case ISD::FROUNDEVEN: |
108 | case ISD::FSIN: |
109 | case ISD::FSQRT: |
110 | case ISD::FTRUNC: |
111 | case ISD::SIGN_EXTEND: |
112 | case ISD::SINT_TO_FP: |
113 | case ISD::TRUNCATE: |
114 | case ISD::UINT_TO_FP: |
115 | case ISD::ZERO_EXTEND: |
116 | case ISD::FCANONICALIZE: |
117 | R = ScalarizeVecRes_UnaryOp(N); |
118 | break; |
119 | case ISD::FFREXP: |
120 | R = ScalarizeVecRes_FFREXP(N, ResNo); |
121 | break; |
122 | case ISD::ADD: |
123 | case ISD::AND: |
124 | case ISD::FADD: |
125 | case ISD::FCOPYSIGN: |
126 | case ISD::FDIV: |
127 | case ISD::FMUL: |
128 | case ISD::FMINNUM: |
129 | case ISD::FMAXNUM: |
130 | case ISD::FMINNUM_IEEE: |
131 | case ISD::FMAXNUM_IEEE: |
132 | case ISD::FMINIMUM: |
133 | case ISD::FMAXIMUM: |
134 | case ISD::FLDEXP: |
135 | case ISD::SMIN: |
136 | case ISD::SMAX: |
137 | case ISD::UMIN: |
138 | case ISD::UMAX: |
139 | |
140 | case ISD::SADDSAT: |
141 | case ISD::UADDSAT: |
142 | case ISD::SSUBSAT: |
143 | case ISD::USUBSAT: |
144 | case ISD::SSHLSAT: |
145 | case ISD::USHLSAT: |
146 | |
147 | case ISD::FPOW: |
148 | case ISD::FREM: |
149 | case ISD::FSUB: |
150 | case ISD::MUL: |
151 | case ISD::MULHS: |
152 | case ISD::MULHU: |
153 | case ISD::OR: |
154 | case ISD::SDIV: |
155 | case ISD::SREM: |
156 | case ISD::SUB: |
157 | case ISD::UDIV: |
158 | case ISD::UREM: |
159 | case ISD::XOR: |
160 | case ISD::SHL: |
161 | case ISD::SRA: |
162 | case ISD::SRL: |
163 | case ISD::ROTL: |
164 | case ISD::ROTR: |
165 | R = ScalarizeVecRes_BinOp(N); |
166 | break; |
167 | case ISD::FMA: |
168 | case ISD::FSHL: |
169 | case ISD::FSHR: |
170 | R = ScalarizeVecRes_TernaryOp(N); |
171 | break; |
172 | |
173 | #define DAG_INSTRUCTION(NAME, NARG, ROUND_MODE, INTRINSIC, DAGN) \ |
174 | case ISD::STRICT_##DAGN: |
175 | #include "llvm/IR/ConstrainedOps.def" |
176 | R = ScalarizeVecRes_StrictFPOp(N); |
177 | break; |
178 | |
179 | case ISD::FP_TO_UINT_SAT: |
180 | case ISD::FP_TO_SINT_SAT: |
181 | R = ScalarizeVecRes_FP_TO_XINT_SAT(N); |
182 | break; |
183 | |
184 | case ISD::UADDO: |
185 | case ISD::SADDO: |
186 | case ISD::USUBO: |
187 | case ISD::SSUBO: |
188 | case ISD::UMULO: |
189 | case ISD::SMULO: |
190 | R = ScalarizeVecRes_OverflowOp(N, ResNo); |
191 | break; |
192 | case ISD::SMULFIX: |
193 | case ISD::SMULFIXSAT: |
194 | case ISD::UMULFIX: |
195 | case ISD::UMULFIXSAT: |
196 | case ISD::SDIVFIX: |
197 | case ISD::SDIVFIXSAT: |
198 | case ISD::UDIVFIX: |
199 | case ISD::UDIVFIXSAT: |
200 | R = ScalarizeVecRes_FIX(N); |
201 | break; |
202 | } |
203 | |
204 | // If R is null, the sub-method took care of registering the result. |
205 | if (R.getNode()) |
206 | SetScalarizedVector(Op: SDValue(N, ResNo), Result: R); |
207 | } |
208 | |
209 | SDValue DAGTypeLegalizer::ScalarizeVecRes_BinOp(SDNode *N) { |
210 | SDValue LHS = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
211 | SDValue RHS = GetScalarizedVector(Op: N->getOperand(Num: 1)); |
212 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), |
213 | VT: LHS.getValueType(), N1: LHS, N2: RHS, Flags: N->getFlags()); |
214 | } |
215 | |
216 | SDValue DAGTypeLegalizer::ScalarizeVecRes_TernaryOp(SDNode *N) { |
217 | SDValue Op0 = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
218 | SDValue Op1 = GetScalarizedVector(Op: N->getOperand(Num: 1)); |
219 | SDValue Op2 = GetScalarizedVector(Op: N->getOperand(Num: 2)); |
220 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: Op0.getValueType(), N1: Op0, N2: Op1, |
221 | N3: Op2, Flags: N->getFlags()); |
222 | } |
223 | |
224 | SDValue DAGTypeLegalizer::ScalarizeVecRes_FIX(SDNode *N) { |
225 | SDValue Op0 = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
226 | SDValue Op1 = GetScalarizedVector(Op: N->getOperand(Num: 1)); |
227 | SDValue Op2 = N->getOperand(Num: 2); |
228 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: Op0.getValueType(), N1: Op0, N2: Op1, |
229 | N3: Op2, Flags: N->getFlags()); |
230 | } |
231 | |
232 | SDValue DAGTypeLegalizer::ScalarizeVecRes_FFREXP(SDNode *N, unsigned ResNo) { |
233 | assert(N->getValueType(0).getVectorNumElements() == 1 && |
234 | "Unexpected vector type!" ); |
235 | SDValue Elt = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
236 | |
237 | EVT VT0 = N->getValueType(ResNo: 0); |
238 | EVT VT1 = N->getValueType(ResNo: 1); |
239 | SDLoc dl(N); |
240 | |
241 | SDNode *ScalarNode = |
242 | DAG.getNode(Opcode: N->getOpcode(), DL: dl, |
243 | ResultTys: {VT0.getScalarType(), VT1.getScalarType()}, Ops: Elt) |
244 | .getNode(); |
245 | |
246 | // Replace the other vector result not being explicitly scalarized here. |
247 | unsigned OtherNo = 1 - ResNo; |
248 | EVT OtherVT = N->getValueType(ResNo: OtherNo); |
249 | if (getTypeAction(VT: OtherVT) == TargetLowering::TypeScalarizeVector) { |
250 | SetScalarizedVector(Op: SDValue(N, OtherNo), Result: SDValue(ScalarNode, OtherNo)); |
251 | } else { |
252 | SDValue OtherVal = DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL: dl, VT: OtherVT, |
253 | Operand: SDValue(ScalarNode, OtherNo)); |
254 | ReplaceValueWith(From: SDValue(N, OtherNo), To: OtherVal); |
255 | } |
256 | |
257 | return SDValue(ScalarNode, ResNo); |
258 | } |
259 | |
260 | SDValue DAGTypeLegalizer::ScalarizeVecRes_StrictFPOp(SDNode *N) { |
261 | EVT VT = N->getValueType(ResNo: 0).getVectorElementType(); |
262 | unsigned NumOpers = N->getNumOperands(); |
263 | SDValue Chain = N->getOperand(Num: 0); |
264 | EVT ValueVTs[] = {VT, MVT::Other}; |
265 | SDLoc dl(N); |
266 | |
267 | SmallVector<SDValue, 4> Opers(NumOpers); |
268 | |
269 | // The Chain is the first operand. |
270 | Opers[0] = Chain; |
271 | |
272 | // Now process the remaining operands. |
273 | for (unsigned i = 1; i < NumOpers; ++i) { |
274 | SDValue Oper = N->getOperand(Num: i); |
275 | EVT OperVT = Oper.getValueType(); |
276 | |
277 | if (OperVT.isVector()) { |
278 | if (getTypeAction(VT: OperVT) == TargetLowering::TypeScalarizeVector) |
279 | Oper = GetScalarizedVector(Op: Oper); |
280 | else |
281 | Oper = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, |
282 | VT: OperVT.getVectorElementType(), N1: Oper, |
283 | N2: DAG.getVectorIdxConstant(Val: 0, DL: dl)); |
284 | } |
285 | |
286 | Opers[i] = Oper; |
287 | } |
288 | |
289 | SDValue Result = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VTList: DAG.getVTList(ValueVTs), |
290 | Ops: Opers, Flags: N->getFlags()); |
291 | |
292 | // Legalize the chain result - switch anything that used the old chain to |
293 | // use the new one. |
294 | ReplaceValueWith(From: SDValue(N, 1), To: Result.getValue(R: 1)); |
295 | return Result; |
296 | } |
297 | |
298 | SDValue DAGTypeLegalizer::ScalarizeVecRes_OverflowOp(SDNode *N, |
299 | unsigned ResNo) { |
300 | SDLoc DL(N); |
301 | EVT ResVT = N->getValueType(ResNo: 0); |
302 | EVT OvVT = N->getValueType(ResNo: 1); |
303 | |
304 | SDValue ScalarLHS, ScalarRHS; |
305 | if (getTypeAction(VT: ResVT) == TargetLowering::TypeScalarizeVector) { |
306 | ScalarLHS = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
307 | ScalarRHS = GetScalarizedVector(Op: N->getOperand(Num: 1)); |
308 | } else { |
309 | SmallVector<SDValue, 1> ElemsLHS, ElemsRHS; |
310 | DAG.ExtractVectorElements(Op: N->getOperand(Num: 0), Args&: ElemsLHS); |
311 | DAG.ExtractVectorElements(Op: N->getOperand(Num: 1), Args&: ElemsRHS); |
312 | ScalarLHS = ElemsLHS[0]; |
313 | ScalarRHS = ElemsRHS[0]; |
314 | } |
315 | |
316 | SDVTList ScalarVTs = DAG.getVTList( |
317 | VT1: ResVT.getVectorElementType(), VT2: OvVT.getVectorElementType()); |
318 | SDNode *ScalarNode = DAG.getNode( |
319 | Opcode: N->getOpcode(), DL, VTList: ScalarVTs, N1: ScalarLHS, N2: ScalarRHS).getNode(); |
320 | ScalarNode->setFlags(N->getFlags()); |
321 | |
322 | // Replace the other vector result not being explicitly scalarized here. |
323 | unsigned OtherNo = 1 - ResNo; |
324 | EVT OtherVT = N->getValueType(ResNo: OtherNo); |
325 | if (getTypeAction(VT: OtherVT) == TargetLowering::TypeScalarizeVector) { |
326 | SetScalarizedVector(Op: SDValue(N, OtherNo), Result: SDValue(ScalarNode, OtherNo)); |
327 | } else { |
328 | SDValue OtherVal = DAG.getNode( |
329 | Opcode: ISD::SCALAR_TO_VECTOR, DL, VT: OtherVT, Operand: SDValue(ScalarNode, OtherNo)); |
330 | ReplaceValueWith(From: SDValue(N, OtherNo), To: OtherVal); |
331 | } |
332 | |
333 | return SDValue(ScalarNode, ResNo); |
334 | } |
335 | |
336 | SDValue DAGTypeLegalizer::ScalarizeVecRes_MERGE_VALUES(SDNode *N, |
337 | unsigned ResNo) { |
338 | SDValue Op = DisintegrateMERGE_VALUES(N, ResNo); |
339 | return GetScalarizedVector(Op); |
340 | } |
341 | |
342 | SDValue DAGTypeLegalizer::ScalarizeVecRes_BITCAST(SDNode *N) { |
343 | SDValue Op = N->getOperand(Num: 0); |
344 | if (Op.getValueType().isVector() |
345 | && Op.getValueType().getVectorNumElements() == 1 |
346 | && !isSimpleLegalType(VT: Op.getValueType())) |
347 | Op = GetScalarizedVector(Op); |
348 | EVT NewVT = N->getValueType(ResNo: 0).getVectorElementType(); |
349 | return DAG.getNode(Opcode: ISD::BITCAST, DL: SDLoc(N), |
350 | VT: NewVT, Operand: Op); |
351 | } |
352 | |
353 | SDValue DAGTypeLegalizer::ScalarizeVecRes_BUILD_VECTOR(SDNode *N) { |
354 | EVT EltVT = N->getValueType(ResNo: 0).getVectorElementType(); |
355 | SDValue InOp = N->getOperand(Num: 0); |
356 | // The BUILD_VECTOR operands may be of wider element types and |
357 | // we may need to truncate them back to the requested return type. |
358 | if (EltVT.isInteger()) |
359 | return DAG.getNode(Opcode: ISD::TRUNCATE, DL: SDLoc(N), VT: EltVT, Operand: InOp); |
360 | return InOp; |
361 | } |
362 | |
363 | SDValue DAGTypeLegalizer::(SDNode *N) { |
364 | return DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: SDLoc(N), |
365 | VT: N->getValueType(ResNo: 0).getVectorElementType(), |
366 | N1: N->getOperand(Num: 0), N2: N->getOperand(Num: 1)); |
367 | } |
368 | |
369 | SDValue DAGTypeLegalizer::ScalarizeVecRes_FP_ROUND(SDNode *N) { |
370 | SDLoc DL(N); |
371 | SDValue Op = N->getOperand(Num: 0); |
372 | EVT OpVT = Op.getValueType(); |
373 | // The result needs scalarizing, but it's not a given that the source does. |
374 | // See similar logic in ScalarizeVecRes_UnaryOp. |
375 | if (getTypeAction(VT: OpVT) == TargetLowering::TypeScalarizeVector) { |
376 | Op = GetScalarizedVector(Op); |
377 | } else { |
378 | EVT VT = OpVT.getVectorElementType(); |
379 | Op = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT, N1: Op, |
380 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
381 | } |
382 | return DAG.getNode(Opcode: ISD::FP_ROUND, DL, |
383 | VT: N->getValueType(ResNo: 0).getVectorElementType(), N1: Op, |
384 | N2: N->getOperand(Num: 1)); |
385 | } |
386 | |
387 | SDValue DAGTypeLegalizer::ScalarizeVecRes_ExpOp(SDNode *N) { |
388 | SDValue Op = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
389 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: Op.getValueType(), N1: Op, |
390 | N2: N->getOperand(Num: 1)); |
391 | } |
392 | |
393 | SDValue DAGTypeLegalizer::ScalarizeVecRes_INSERT_VECTOR_ELT(SDNode *N) { |
394 | // The value to insert may have a wider type than the vector element type, |
395 | // so be sure to truncate it to the element type if necessary. |
396 | SDValue Op = N->getOperand(Num: 1); |
397 | EVT EltVT = N->getValueType(ResNo: 0).getVectorElementType(); |
398 | if (Op.getValueType() != EltVT) |
399 | // FIXME: Can this happen for floating point types? |
400 | Op = DAG.getNode(Opcode: ISD::TRUNCATE, DL: SDLoc(N), VT: EltVT, Operand: Op); |
401 | return Op; |
402 | } |
403 | |
404 | SDValue DAGTypeLegalizer::ScalarizeVecRes_LOAD(LoadSDNode *N) { |
405 | assert(N->isUnindexed() && "Indexed vector load?" ); |
406 | |
407 | SDValue Result = DAG.getLoad( |
408 | AM: ISD::UNINDEXED, ExtType: N->getExtensionType(), |
409 | VT: N->getValueType(ResNo: 0).getVectorElementType(), dl: SDLoc(N), Chain: N->getChain(), |
410 | Ptr: N->getBasePtr(), Offset: DAG.getUNDEF(VT: N->getBasePtr().getValueType()), |
411 | PtrInfo: N->getPointerInfo(), MemVT: N->getMemoryVT().getVectorElementType(), |
412 | Alignment: N->getOriginalAlign(), MMOFlags: N->getMemOperand()->getFlags(), AAInfo: N->getAAInfo()); |
413 | |
414 | // Legalize the chain result - switch anything that used the old chain to |
415 | // use the new one. |
416 | ReplaceValueWith(From: SDValue(N, 1), To: Result.getValue(R: 1)); |
417 | return Result; |
418 | } |
419 | |
420 | SDValue DAGTypeLegalizer::ScalarizeVecRes_UnaryOp(SDNode *N) { |
421 | // Get the dest type - it doesn't always match the input type, e.g. int_to_fp. |
422 | EVT DestVT = N->getValueType(ResNo: 0).getVectorElementType(); |
423 | SDValue Op = N->getOperand(Num: 0); |
424 | EVT OpVT = Op.getValueType(); |
425 | SDLoc DL(N); |
426 | // The result needs scalarizing, but it's not a given that the source does. |
427 | // This is a workaround for targets where it's impossible to scalarize the |
428 | // result of a conversion, because the source type is legal. |
429 | // For instance, this happens on AArch64: v1i1 is illegal but v1i{8,16,32} |
430 | // are widened to v8i8, v4i16, and v2i32, which is legal, because v1i64 is |
431 | // legal and was not scalarized. |
432 | // See the similar logic in ScalarizeVecRes_SETCC |
433 | if (getTypeAction(VT: OpVT) == TargetLowering::TypeScalarizeVector) { |
434 | Op = GetScalarizedVector(Op); |
435 | } else { |
436 | EVT VT = OpVT.getVectorElementType(); |
437 | Op = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT, N1: Op, |
438 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
439 | } |
440 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: DestVT, Operand: Op, Flags: N->getFlags()); |
441 | } |
442 | |
443 | SDValue DAGTypeLegalizer::ScalarizeVecRes_InregOp(SDNode *N) { |
444 | EVT EltVT = N->getValueType(ResNo: 0).getVectorElementType(); |
445 | EVT ExtVT = cast<VTSDNode>(Val: N->getOperand(Num: 1))->getVT().getVectorElementType(); |
446 | SDValue LHS = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
447 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: EltVT, |
448 | N1: LHS, N2: DAG.getValueType(ExtVT)); |
449 | } |
450 | |
451 | SDValue DAGTypeLegalizer::ScalarizeVecRes_VecInregOp(SDNode *N) { |
452 | SDLoc DL(N); |
453 | SDValue Op = N->getOperand(Num: 0); |
454 | |
455 | EVT OpVT = Op.getValueType(); |
456 | EVT OpEltVT = OpVT.getVectorElementType(); |
457 | EVT EltVT = N->getValueType(ResNo: 0).getVectorElementType(); |
458 | |
459 | if (getTypeAction(VT: OpVT) == TargetLowering::TypeScalarizeVector) { |
460 | Op = GetScalarizedVector(Op); |
461 | } else { |
462 | Op = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT: OpEltVT, N1: Op, |
463 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
464 | } |
465 | |
466 | switch (N->getOpcode()) { |
467 | case ISD::ANY_EXTEND_VECTOR_INREG: |
468 | return DAG.getNode(Opcode: ISD::ANY_EXTEND, DL, VT: EltVT, Operand: Op); |
469 | case ISD::SIGN_EXTEND_VECTOR_INREG: |
470 | return DAG.getNode(Opcode: ISD::SIGN_EXTEND, DL, VT: EltVT, Operand: Op); |
471 | case ISD::ZERO_EXTEND_VECTOR_INREG: |
472 | return DAG.getNode(Opcode: ISD::ZERO_EXTEND, DL, VT: EltVT, Operand: Op); |
473 | } |
474 | |
475 | llvm_unreachable("Illegal extend_vector_inreg opcode" ); |
476 | } |
477 | |
478 | SDValue DAGTypeLegalizer::ScalarizeVecRes_SCALAR_TO_VECTOR(SDNode *N) { |
479 | // If the operand is wider than the vector element type then it is implicitly |
480 | // truncated. Make that explicit here. |
481 | EVT EltVT = N->getValueType(ResNo: 0).getVectorElementType(); |
482 | SDValue InOp = N->getOperand(Num: 0); |
483 | if (InOp.getValueType() != EltVT) |
484 | return DAG.getNode(Opcode: ISD::TRUNCATE, DL: SDLoc(N), VT: EltVT, Operand: InOp); |
485 | return InOp; |
486 | } |
487 | |
488 | SDValue DAGTypeLegalizer::ScalarizeVecRes_VSELECT(SDNode *N) { |
489 | SDValue Cond = N->getOperand(Num: 0); |
490 | EVT OpVT = Cond.getValueType(); |
491 | SDLoc DL(N); |
492 | // The vselect result and true/value operands needs scalarizing, but it's |
493 | // not a given that the Cond does. For instance, in AVX512 v1i1 is legal. |
494 | // See the similar logic in ScalarizeVecRes_SETCC |
495 | if (getTypeAction(VT: OpVT) == TargetLowering::TypeScalarizeVector) { |
496 | Cond = GetScalarizedVector(Op: Cond); |
497 | } else { |
498 | EVT VT = OpVT.getVectorElementType(); |
499 | Cond = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT, N1: Cond, |
500 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
501 | } |
502 | |
503 | SDValue LHS = GetScalarizedVector(Op: N->getOperand(Num: 1)); |
504 | TargetLowering::BooleanContent ScalarBool = |
505 | TLI.getBooleanContents(isVec: false, isFloat: false); |
506 | TargetLowering::BooleanContent VecBool = TLI.getBooleanContents(isVec: true, isFloat: false); |
507 | |
508 | // If integer and float booleans have different contents then we can't |
509 | // reliably optimize in all cases. There is a full explanation for this in |
510 | // DAGCombiner::visitSELECT() where the same issue affects folding |
511 | // (select C, 0, 1) to (xor C, 1). |
512 | if (TLI.getBooleanContents(isVec: false, isFloat: false) != |
513 | TLI.getBooleanContents(isVec: false, isFloat: true)) { |
514 | // At least try the common case where the boolean is generated by a |
515 | // comparison. |
516 | if (Cond->getOpcode() == ISD::SETCC) { |
517 | EVT OpVT = Cond->getOperand(Num: 0).getValueType(); |
518 | ScalarBool = TLI.getBooleanContents(Type: OpVT.getScalarType()); |
519 | VecBool = TLI.getBooleanContents(Type: OpVT); |
520 | } else |
521 | ScalarBool = TargetLowering::UndefinedBooleanContent; |
522 | } |
523 | |
524 | EVT CondVT = Cond.getValueType(); |
525 | if (ScalarBool != VecBool) { |
526 | switch (ScalarBool) { |
527 | case TargetLowering::UndefinedBooleanContent: |
528 | break; |
529 | case TargetLowering::ZeroOrOneBooleanContent: |
530 | assert(VecBool == TargetLowering::UndefinedBooleanContent || |
531 | VecBool == TargetLowering::ZeroOrNegativeOneBooleanContent); |
532 | // Vector read from all ones, scalar expects a single 1 so mask. |
533 | Cond = DAG.getNode(Opcode: ISD::AND, DL: SDLoc(N), VT: CondVT, |
534 | N1: Cond, N2: DAG.getConstant(Val: 1, DL: SDLoc(N), VT: CondVT)); |
535 | break; |
536 | case TargetLowering::ZeroOrNegativeOneBooleanContent: |
537 | assert(VecBool == TargetLowering::UndefinedBooleanContent || |
538 | VecBool == TargetLowering::ZeroOrOneBooleanContent); |
539 | // Vector reads from a one, scalar from all ones so sign extend. |
540 | Cond = DAG.getNode(ISD::SIGN_EXTEND_INREG, SDLoc(N), CondVT, |
541 | Cond, DAG.getValueType(MVT::i1)); |
542 | break; |
543 | } |
544 | } |
545 | |
546 | // Truncate the condition if needed |
547 | auto BoolVT = getSetCCResultType(VT: CondVT); |
548 | if (BoolVT.bitsLT(VT: CondVT)) |
549 | Cond = DAG.getNode(Opcode: ISD::TRUNCATE, DL: SDLoc(N), VT: BoolVT, Operand: Cond); |
550 | |
551 | return DAG.getSelect(DL: SDLoc(N), |
552 | VT: LHS.getValueType(), Cond, LHS, |
553 | RHS: GetScalarizedVector(Op: N->getOperand(Num: 2))); |
554 | } |
555 | |
556 | SDValue DAGTypeLegalizer::ScalarizeVecRes_SELECT(SDNode *N) { |
557 | SDValue LHS = GetScalarizedVector(Op: N->getOperand(Num: 1)); |
558 | return DAG.getSelect(DL: SDLoc(N), |
559 | VT: LHS.getValueType(), Cond: N->getOperand(Num: 0), LHS, |
560 | RHS: GetScalarizedVector(Op: N->getOperand(Num: 2))); |
561 | } |
562 | |
563 | SDValue DAGTypeLegalizer::ScalarizeVecRes_SELECT_CC(SDNode *N) { |
564 | SDValue LHS = GetScalarizedVector(Op: N->getOperand(Num: 2)); |
565 | return DAG.getNode(Opcode: ISD::SELECT_CC, DL: SDLoc(N), VT: LHS.getValueType(), |
566 | N1: N->getOperand(Num: 0), N2: N->getOperand(Num: 1), |
567 | N3: LHS, N4: GetScalarizedVector(Op: N->getOperand(Num: 3)), |
568 | N5: N->getOperand(Num: 4)); |
569 | } |
570 | |
571 | SDValue DAGTypeLegalizer::ScalarizeVecRes_UNDEF(SDNode *N) { |
572 | return DAG.getUNDEF(VT: N->getValueType(ResNo: 0).getVectorElementType()); |
573 | } |
574 | |
575 | SDValue DAGTypeLegalizer::ScalarizeVecRes_VECTOR_SHUFFLE(SDNode *N) { |
576 | // Figure out if the scalar is the LHS or RHS and return it. |
577 | SDValue Arg = N->getOperand(Num: 2).getOperand(i: 0); |
578 | if (Arg.isUndef()) |
579 | return DAG.getUNDEF(VT: N->getValueType(ResNo: 0).getVectorElementType()); |
580 | unsigned Op = !cast<ConstantSDNode>(Val&: Arg)->isZero(); |
581 | return GetScalarizedVector(Op: N->getOperand(Num: Op)); |
582 | } |
583 | |
584 | SDValue DAGTypeLegalizer::ScalarizeVecRes_FP_TO_XINT_SAT(SDNode *N) { |
585 | SDValue Src = N->getOperand(Num: 0); |
586 | EVT SrcVT = Src.getValueType(); |
587 | SDLoc dl(N); |
588 | |
589 | // Handle case where result is scalarized but operand is not |
590 | if (getTypeAction(VT: SrcVT) == TargetLowering::TypeScalarizeVector) |
591 | Src = GetScalarizedVector(Op: Src); |
592 | else |
593 | Src = DAG.getNode( |
594 | Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: SrcVT.getVectorElementType(), N1: Src, |
595 | N2: DAG.getConstant(Val: 0, DL: dl, VT: TLI.getVectorIdxTy(DL: DAG.getDataLayout()))); |
596 | |
597 | EVT DstVT = N->getValueType(ResNo: 0).getVectorElementType(); |
598 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: DstVT, N1: Src, N2: N->getOperand(Num: 1)); |
599 | } |
600 | |
601 | SDValue DAGTypeLegalizer::ScalarizeVecRes_SETCC(SDNode *N) { |
602 | assert(N->getValueType(0).isVector() && |
603 | N->getOperand(0).getValueType().isVector() && |
604 | "Operand types must be vectors" ); |
605 | SDValue LHS = N->getOperand(Num: 0); |
606 | SDValue RHS = N->getOperand(Num: 1); |
607 | EVT OpVT = LHS.getValueType(); |
608 | EVT NVT = N->getValueType(ResNo: 0).getVectorElementType(); |
609 | SDLoc DL(N); |
610 | |
611 | // The result needs scalarizing, but it's not a given that the source does. |
612 | if (getTypeAction(VT: OpVT) == TargetLowering::TypeScalarizeVector) { |
613 | LHS = GetScalarizedVector(Op: LHS); |
614 | RHS = GetScalarizedVector(Op: RHS); |
615 | } else { |
616 | EVT VT = OpVT.getVectorElementType(); |
617 | LHS = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT, N1: LHS, |
618 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
619 | RHS = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT, N1: RHS, |
620 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
621 | } |
622 | |
623 | // Turn it into a scalar SETCC. |
624 | SDValue Res = DAG.getNode(ISD::SETCC, DL, MVT::i1, LHS, RHS, |
625 | N->getOperand(Num: 2)); |
626 | // Vectors may have a different boolean contents to scalars. Promote the |
627 | // value appropriately. |
628 | ISD::NodeType ExtendCode = |
629 | TargetLowering::getExtendForContent(Content: TLI.getBooleanContents(Type: OpVT)); |
630 | return DAG.getNode(Opcode: ExtendCode, DL, VT: NVT, Operand: Res); |
631 | } |
632 | |
633 | SDValue DAGTypeLegalizer::ScalarizeVecRes_IS_FPCLASS(SDNode *N) { |
634 | SDLoc DL(N); |
635 | SDValue Arg = N->getOperand(Num: 0); |
636 | SDValue Test = N->getOperand(Num: 1); |
637 | EVT ArgVT = Arg.getValueType(); |
638 | EVT ResultVT = N->getValueType(ResNo: 0).getVectorElementType(); |
639 | |
640 | if (getTypeAction(VT: ArgVT) == TargetLowering::TypeScalarizeVector) { |
641 | Arg = GetScalarizedVector(Op: Arg); |
642 | } else { |
643 | EVT VT = ArgVT.getVectorElementType(); |
644 | Arg = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT, N1: Arg, |
645 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
646 | } |
647 | |
648 | SDValue Res = |
649 | DAG.getNode(ISD::IS_FPCLASS, DL, MVT::i1, {Arg, Test}, N->getFlags()); |
650 | // Vectors may have a different boolean contents to scalars. Promote the |
651 | // value appropriately. |
652 | ISD::NodeType ExtendCode = |
653 | TargetLowering::getExtendForContent(Content: TLI.getBooleanContents(Type: ArgVT)); |
654 | return DAG.getNode(Opcode: ExtendCode, DL, VT: ResultVT, Operand: Res); |
655 | } |
656 | |
657 | //===----------------------------------------------------------------------===// |
658 | // Operand Vector Scalarization <1 x ty> -> ty. |
659 | //===----------------------------------------------------------------------===// |
660 | |
661 | bool DAGTypeLegalizer::ScalarizeVectorOperand(SDNode *N, unsigned OpNo) { |
662 | LLVM_DEBUG(dbgs() << "Scalarize node operand " << OpNo << ": " ; |
663 | N->dump(&DAG)); |
664 | SDValue Res = SDValue(); |
665 | |
666 | switch (N->getOpcode()) { |
667 | default: |
668 | #ifndef NDEBUG |
669 | dbgs() << "ScalarizeVectorOperand Op #" << OpNo << ": " ; |
670 | N->dump(G: &DAG); |
671 | dbgs() << "\n" ; |
672 | #endif |
673 | report_fatal_error(reason: "Do not know how to scalarize this operator's " |
674 | "operand!\n" ); |
675 | case ISD::BITCAST: |
676 | Res = ScalarizeVecOp_BITCAST(N); |
677 | break; |
678 | case ISD::ANY_EXTEND: |
679 | case ISD::ZERO_EXTEND: |
680 | case ISD::SIGN_EXTEND: |
681 | case ISD::TRUNCATE: |
682 | case ISD::FP_TO_SINT: |
683 | case ISD::FP_TO_UINT: |
684 | case ISD::SINT_TO_FP: |
685 | case ISD::UINT_TO_FP: |
686 | case ISD::LRINT: |
687 | case ISD::LLRINT: |
688 | Res = ScalarizeVecOp_UnaryOp(N); |
689 | break; |
690 | case ISD::STRICT_SINT_TO_FP: |
691 | case ISD::STRICT_UINT_TO_FP: |
692 | case ISD::STRICT_FP_TO_SINT: |
693 | case ISD::STRICT_FP_TO_UINT: |
694 | Res = ScalarizeVecOp_UnaryOp_StrictFP(N); |
695 | break; |
696 | case ISD::CONCAT_VECTORS: |
697 | Res = ScalarizeVecOp_CONCAT_VECTORS(N); |
698 | break; |
699 | case ISD::EXTRACT_VECTOR_ELT: |
700 | Res = ScalarizeVecOp_EXTRACT_VECTOR_ELT(N); |
701 | break; |
702 | case ISD::VSELECT: |
703 | Res = ScalarizeVecOp_VSELECT(N); |
704 | break; |
705 | case ISD::SETCC: |
706 | Res = ScalarizeVecOp_VSETCC(N); |
707 | break; |
708 | case ISD::STORE: |
709 | Res = ScalarizeVecOp_STORE(N: cast<StoreSDNode>(Val: N), OpNo); |
710 | break; |
711 | case ISD::STRICT_FP_ROUND: |
712 | Res = ScalarizeVecOp_STRICT_FP_ROUND(N, OpNo); |
713 | break; |
714 | case ISD::FP_ROUND: |
715 | Res = ScalarizeVecOp_FP_ROUND(N, OpNo); |
716 | break; |
717 | case ISD::STRICT_FP_EXTEND: |
718 | Res = ScalarizeVecOp_STRICT_FP_EXTEND(N); |
719 | break; |
720 | case ISD::FP_EXTEND: |
721 | Res = ScalarizeVecOp_FP_EXTEND(N); |
722 | break; |
723 | case ISD::VECREDUCE_FADD: |
724 | case ISD::VECREDUCE_FMUL: |
725 | case ISD::VECREDUCE_ADD: |
726 | case ISD::VECREDUCE_MUL: |
727 | case ISD::VECREDUCE_AND: |
728 | case ISD::VECREDUCE_OR: |
729 | case ISD::VECREDUCE_XOR: |
730 | case ISD::VECREDUCE_SMAX: |
731 | case ISD::VECREDUCE_SMIN: |
732 | case ISD::VECREDUCE_UMAX: |
733 | case ISD::VECREDUCE_UMIN: |
734 | case ISD::VECREDUCE_FMAX: |
735 | case ISD::VECREDUCE_FMIN: |
736 | case ISD::VECREDUCE_FMAXIMUM: |
737 | case ISD::VECREDUCE_FMINIMUM: |
738 | Res = ScalarizeVecOp_VECREDUCE(N); |
739 | break; |
740 | case ISD::VECREDUCE_SEQ_FADD: |
741 | case ISD::VECREDUCE_SEQ_FMUL: |
742 | Res = ScalarizeVecOp_VECREDUCE_SEQ(N); |
743 | break; |
744 | } |
745 | |
746 | // If the result is null, the sub-method took care of registering results etc. |
747 | if (!Res.getNode()) return false; |
748 | |
749 | // If the result is N, the sub-method updated N in place. Tell the legalizer |
750 | // core about this. |
751 | if (Res.getNode() == N) |
752 | return true; |
753 | |
754 | assert(Res.getValueType() == N->getValueType(0) && N->getNumValues() == 1 && |
755 | "Invalid operand expansion" ); |
756 | |
757 | ReplaceValueWith(From: SDValue(N, 0), To: Res); |
758 | return false; |
759 | } |
760 | |
761 | /// If the value to convert is a vector that needs to be scalarized, it must be |
762 | /// <1 x ty>. Convert the element instead. |
763 | SDValue DAGTypeLegalizer::ScalarizeVecOp_BITCAST(SDNode *N) { |
764 | SDValue Elt = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
765 | return DAG.getNode(Opcode: ISD::BITCAST, DL: SDLoc(N), |
766 | VT: N->getValueType(ResNo: 0), Operand: Elt); |
767 | } |
768 | |
769 | /// If the input is a vector that needs to be scalarized, it must be <1 x ty>. |
770 | /// Do the operation on the element instead. |
771 | SDValue DAGTypeLegalizer::ScalarizeVecOp_UnaryOp(SDNode *N) { |
772 | assert(N->getValueType(0).getVectorNumElements() == 1 && |
773 | "Unexpected vector type!" ); |
774 | SDValue Elt = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
775 | SDValue Op = DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), |
776 | VT: N->getValueType(ResNo: 0).getScalarType(), Operand: Elt); |
777 | // Revectorize the result so the types line up with what the uses of this |
778 | // expression expect. |
779 | return DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL: SDLoc(N), VT: N->getValueType(ResNo: 0), Operand: Op); |
780 | } |
781 | |
782 | /// If the input is a vector that needs to be scalarized, it must be <1 x ty>. |
783 | /// Do the strict FP operation on the element instead. |
784 | SDValue DAGTypeLegalizer::ScalarizeVecOp_UnaryOp_StrictFP(SDNode *N) { |
785 | assert(N->getValueType(0).getVectorNumElements() == 1 && |
786 | "Unexpected vector type!" ); |
787 | SDValue Elt = GetScalarizedVector(Op: N->getOperand(Num: 1)); |
788 | SDValue Res = DAG.getNode(N->getOpcode(), SDLoc(N), |
789 | { N->getValueType(0).getScalarType(), MVT::Other }, |
790 | { N->getOperand(0), Elt }); |
791 | // Legalize the chain result - switch anything that used the old chain to |
792 | // use the new one. |
793 | ReplaceValueWith(From: SDValue(N, 1), To: Res.getValue(R: 1)); |
794 | // Revectorize the result so the types line up with what the uses of this |
795 | // expression expect. |
796 | Res = DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL: SDLoc(N), VT: N->getValueType(ResNo: 0), Operand: Res); |
797 | |
798 | // Do our own replacement and return SDValue() to tell the caller that we |
799 | // handled all replacements since caller can only handle a single result. |
800 | ReplaceValueWith(From: SDValue(N, 0), To: Res); |
801 | return SDValue(); |
802 | } |
803 | |
804 | /// The vectors to concatenate have length one - use a BUILD_VECTOR instead. |
805 | SDValue DAGTypeLegalizer::ScalarizeVecOp_CONCAT_VECTORS(SDNode *N) { |
806 | SmallVector<SDValue, 8> Ops(N->getNumOperands()); |
807 | for (unsigned i = 0, e = N->getNumOperands(); i < e; ++i) |
808 | Ops[i] = GetScalarizedVector(Op: N->getOperand(Num: i)); |
809 | return DAG.getBuildVector(VT: N->getValueType(ResNo: 0), DL: SDLoc(N), Ops); |
810 | } |
811 | |
812 | /// If the input is a vector that needs to be scalarized, it must be <1 x ty>, |
813 | /// so just return the element, ignoring the index. |
814 | SDValue DAGTypeLegalizer::(SDNode *N) { |
815 | EVT VT = N->getValueType(ResNo: 0); |
816 | SDValue Res = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
817 | if (Res.getValueType() != VT) |
818 | Res = VT.isFloatingPoint() |
819 | ? DAG.getNode(Opcode: ISD::FP_EXTEND, DL: SDLoc(N), VT, Operand: Res) |
820 | : DAG.getNode(Opcode: ISD::ANY_EXTEND, DL: SDLoc(N), VT, Operand: Res); |
821 | return Res; |
822 | } |
823 | |
824 | /// If the input condition is a vector that needs to be scalarized, it must be |
825 | /// <1 x i1>, so just convert to a normal ISD::SELECT |
826 | /// (still with vector output type since that was acceptable if we got here). |
827 | SDValue DAGTypeLegalizer::ScalarizeVecOp_VSELECT(SDNode *N) { |
828 | SDValue ScalarCond = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
829 | EVT VT = N->getValueType(ResNo: 0); |
830 | |
831 | return DAG.getNode(Opcode: ISD::SELECT, DL: SDLoc(N), VT, N1: ScalarCond, N2: N->getOperand(Num: 1), |
832 | N3: N->getOperand(Num: 2)); |
833 | } |
834 | |
835 | /// If the operand is a vector that needs to be scalarized then the |
836 | /// result must be v1i1, so just convert to a scalar SETCC and wrap |
837 | /// with a scalar_to_vector since the res type is legal if we got here |
838 | SDValue DAGTypeLegalizer::ScalarizeVecOp_VSETCC(SDNode *N) { |
839 | assert(N->getValueType(0).isVector() && |
840 | N->getOperand(0).getValueType().isVector() && |
841 | "Operand types must be vectors" ); |
842 | assert(N->getValueType(0) == MVT::v1i1 && "Expected v1i1 type" ); |
843 | |
844 | EVT VT = N->getValueType(ResNo: 0); |
845 | SDValue LHS = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
846 | SDValue RHS = GetScalarizedVector(Op: N->getOperand(Num: 1)); |
847 | |
848 | EVT OpVT = N->getOperand(Num: 0).getValueType(); |
849 | EVT NVT = VT.getVectorElementType(); |
850 | SDLoc DL(N); |
851 | // Turn it into a scalar SETCC. |
852 | SDValue Res = DAG.getNode(ISD::SETCC, DL, MVT::i1, LHS, RHS, |
853 | N->getOperand(Num: 2)); |
854 | |
855 | // Vectors may have a different boolean contents to scalars. Promote the |
856 | // value appropriately. |
857 | ISD::NodeType ExtendCode = |
858 | TargetLowering::getExtendForContent(Content: TLI.getBooleanContents(Type: OpVT)); |
859 | |
860 | Res = DAG.getNode(Opcode: ExtendCode, DL, VT: NVT, Operand: Res); |
861 | |
862 | return DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL, VT, Operand: Res); |
863 | } |
864 | |
865 | /// If the value to store is a vector that needs to be scalarized, it must be |
866 | /// <1 x ty>. Just store the element. |
867 | SDValue DAGTypeLegalizer::ScalarizeVecOp_STORE(StoreSDNode *N, unsigned OpNo){ |
868 | assert(N->isUnindexed() && "Indexed store of one-element vector?" ); |
869 | assert(OpNo == 1 && "Do not know how to scalarize this operand!" ); |
870 | SDLoc dl(N); |
871 | |
872 | if (N->isTruncatingStore()) |
873 | return DAG.getTruncStore( |
874 | Chain: N->getChain(), dl, Val: GetScalarizedVector(Op: N->getOperand(Num: 1)), |
875 | Ptr: N->getBasePtr(), PtrInfo: N->getPointerInfo(), |
876 | SVT: N->getMemoryVT().getVectorElementType(), Alignment: N->getOriginalAlign(), |
877 | MMOFlags: N->getMemOperand()->getFlags(), AAInfo: N->getAAInfo()); |
878 | |
879 | return DAG.getStore(Chain: N->getChain(), dl, Val: GetScalarizedVector(Op: N->getOperand(Num: 1)), |
880 | Ptr: N->getBasePtr(), PtrInfo: N->getPointerInfo(), |
881 | Alignment: N->getOriginalAlign(), MMOFlags: N->getMemOperand()->getFlags(), |
882 | AAInfo: N->getAAInfo()); |
883 | } |
884 | |
885 | /// If the value to round is a vector that needs to be scalarized, it must be |
886 | /// <1 x ty>. Convert the element instead. |
887 | SDValue DAGTypeLegalizer::ScalarizeVecOp_FP_ROUND(SDNode *N, unsigned OpNo) { |
888 | assert(OpNo == 0 && "Wrong operand for scalarization!" ); |
889 | SDValue Elt = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
890 | SDValue Res = DAG.getNode(Opcode: ISD::FP_ROUND, DL: SDLoc(N), |
891 | VT: N->getValueType(ResNo: 0).getVectorElementType(), N1: Elt, |
892 | N2: N->getOperand(Num: 1)); |
893 | return DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL: SDLoc(N), VT: N->getValueType(ResNo: 0), Operand: Res); |
894 | } |
895 | |
896 | SDValue DAGTypeLegalizer::ScalarizeVecOp_STRICT_FP_ROUND(SDNode *N, |
897 | unsigned OpNo) { |
898 | assert(OpNo == 1 && "Wrong operand for scalarization!" ); |
899 | SDValue Elt = GetScalarizedVector(Op: N->getOperand(Num: 1)); |
900 | SDValue Res = DAG.getNode(ISD::STRICT_FP_ROUND, SDLoc(N), |
901 | { N->getValueType(0).getVectorElementType(), |
902 | MVT::Other }, |
903 | { N->getOperand(0), Elt, N->getOperand(2) }); |
904 | // Legalize the chain result - switch anything that used the old chain to |
905 | // use the new one. |
906 | ReplaceValueWith(From: SDValue(N, 1), To: Res.getValue(R: 1)); |
907 | |
908 | Res = DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL: SDLoc(N), VT: N->getValueType(ResNo: 0), Operand: Res); |
909 | |
910 | // Do our own replacement and return SDValue() to tell the caller that we |
911 | // handled all replacements since caller can only handle a single result. |
912 | ReplaceValueWith(From: SDValue(N, 0), To: Res); |
913 | return SDValue(); |
914 | } |
915 | |
916 | /// If the value to extend is a vector that needs to be scalarized, it must be |
917 | /// <1 x ty>. Convert the element instead. |
918 | SDValue DAGTypeLegalizer::ScalarizeVecOp_FP_EXTEND(SDNode *N) { |
919 | SDValue Elt = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
920 | SDValue Res = DAG.getNode(Opcode: ISD::FP_EXTEND, DL: SDLoc(N), |
921 | VT: N->getValueType(ResNo: 0).getVectorElementType(), Operand: Elt); |
922 | return DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL: SDLoc(N), VT: N->getValueType(ResNo: 0), Operand: Res); |
923 | } |
924 | |
925 | /// If the value to extend is a vector that needs to be scalarized, it must be |
926 | /// <1 x ty>. Convert the element instead. |
927 | SDValue DAGTypeLegalizer::ScalarizeVecOp_STRICT_FP_EXTEND(SDNode *N) { |
928 | SDValue Elt = GetScalarizedVector(Op: N->getOperand(Num: 1)); |
929 | SDValue Res = |
930 | DAG.getNode(ISD::STRICT_FP_EXTEND, SDLoc(N), |
931 | {N->getValueType(0).getVectorElementType(), MVT::Other}, |
932 | {N->getOperand(0), Elt}); |
933 | // Legalize the chain result - switch anything that used the old chain to |
934 | // use the new one. |
935 | ReplaceValueWith(From: SDValue(N, 1), To: Res.getValue(R: 1)); |
936 | |
937 | Res = DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL: SDLoc(N), VT: N->getValueType(ResNo: 0), Operand: Res); |
938 | |
939 | // Do our own replacement and return SDValue() to tell the caller that we |
940 | // handled all replacements since caller can only handle a single result. |
941 | ReplaceValueWith(From: SDValue(N, 0), To: Res); |
942 | return SDValue(); |
943 | } |
944 | |
945 | SDValue DAGTypeLegalizer::ScalarizeVecOp_VECREDUCE(SDNode *N) { |
946 | SDValue Res = GetScalarizedVector(Op: N->getOperand(Num: 0)); |
947 | // Result type may be wider than element type. |
948 | if (Res.getValueType() != N->getValueType(ResNo: 0)) |
949 | Res = DAG.getNode(Opcode: ISD::ANY_EXTEND, DL: SDLoc(N), VT: N->getValueType(ResNo: 0), Operand: Res); |
950 | return Res; |
951 | } |
952 | |
953 | SDValue DAGTypeLegalizer::ScalarizeVecOp_VECREDUCE_SEQ(SDNode *N) { |
954 | SDValue AccOp = N->getOperand(Num: 0); |
955 | SDValue VecOp = N->getOperand(Num: 1); |
956 | |
957 | unsigned BaseOpc = ISD::getVecReduceBaseOpcode(VecReduceOpcode: N->getOpcode()); |
958 | |
959 | SDValue Op = GetScalarizedVector(Op: VecOp); |
960 | return DAG.getNode(Opcode: BaseOpc, DL: SDLoc(N), VT: N->getValueType(ResNo: 0), |
961 | N1: AccOp, N2: Op, Flags: N->getFlags()); |
962 | } |
963 | |
964 | //===----------------------------------------------------------------------===// |
965 | // Result Vector Splitting |
966 | //===----------------------------------------------------------------------===// |
967 | |
968 | /// This method is called when the specified result of the specified node is |
969 | /// found to need vector splitting. At this point, the node may also have |
970 | /// invalid operands or may have other results that need legalization, we just |
971 | /// know that (at least) one result needs vector splitting. |
972 | void DAGTypeLegalizer::SplitVectorResult(SDNode *N, unsigned ResNo) { |
973 | LLVM_DEBUG(dbgs() << "Split node result: " ; N->dump(&DAG)); |
974 | SDValue Lo, Hi; |
975 | |
976 | // See if the target wants to custom expand this node. |
977 | if (CustomLowerNode(N, VT: N->getValueType(ResNo), LegalizeResult: true)) |
978 | return; |
979 | |
980 | switch (N->getOpcode()) { |
981 | default: |
982 | #ifndef NDEBUG |
983 | dbgs() << "SplitVectorResult #" << ResNo << ": " ; |
984 | N->dump(G: &DAG); |
985 | dbgs() << "\n" ; |
986 | #endif |
987 | report_fatal_error(reason: "Do not know how to split the result of this " |
988 | "operator!\n" ); |
989 | |
990 | case ISD::MERGE_VALUES: SplitRes_MERGE_VALUES(N, ResNo, Lo, Hi); break; |
991 | case ISD::AssertZext: SplitVecRes_AssertZext(N, Lo, Hi); break; |
992 | case ISD::VSELECT: |
993 | case ISD::SELECT: |
994 | case ISD::VP_MERGE: |
995 | case ISD::VP_SELECT: SplitRes_Select(N, Lo, Hi); break; |
996 | case ISD::SELECT_CC: SplitRes_SELECT_CC(N, Lo, Hi); break; |
997 | case ISD::UNDEF: SplitRes_UNDEF(N, Lo, Hi); break; |
998 | case ISD::BITCAST: SplitVecRes_BITCAST(N, Lo, Hi); break; |
999 | case ISD::BUILD_VECTOR: SplitVecRes_BUILD_VECTOR(N, Lo, Hi); break; |
1000 | case ISD::CONCAT_VECTORS: SplitVecRes_CONCAT_VECTORS(N, Lo, Hi); break; |
1001 | case ISD::EXTRACT_SUBVECTOR: SplitVecRes_EXTRACT_SUBVECTOR(N, Lo, Hi); break; |
1002 | case ISD::INSERT_SUBVECTOR: SplitVecRes_INSERT_SUBVECTOR(N, Lo, Hi); break; |
1003 | case ISD::FPOWI: |
1004 | case ISD::FLDEXP: |
1005 | case ISD::FCOPYSIGN: SplitVecRes_FPOp_MultiType(N, Lo, Hi); break; |
1006 | case ISD::IS_FPCLASS: SplitVecRes_IS_FPCLASS(N, Lo, Hi); break; |
1007 | case ISD::INSERT_VECTOR_ELT: SplitVecRes_INSERT_VECTOR_ELT(N, Lo, Hi); break; |
1008 | case ISD::SPLAT_VECTOR: |
1009 | case ISD::SCALAR_TO_VECTOR: |
1010 | SplitVecRes_ScalarOp(N, Lo, Hi); |
1011 | break; |
1012 | case ISD::STEP_VECTOR: |
1013 | SplitVecRes_STEP_VECTOR(N, Lo, Hi); |
1014 | break; |
1015 | case ISD::SIGN_EXTEND_INREG: SplitVecRes_InregOp(N, Lo, Hi); break; |
1016 | case ISD::LOAD: |
1017 | SplitVecRes_LOAD(LD: cast<LoadSDNode>(Val: N), Lo, Hi); |
1018 | break; |
1019 | case ISD::VP_LOAD: |
1020 | SplitVecRes_VP_LOAD(LD: cast<VPLoadSDNode>(Val: N), Lo, Hi); |
1021 | break; |
1022 | case ISD::EXPERIMENTAL_VP_STRIDED_LOAD: |
1023 | SplitVecRes_VP_STRIDED_LOAD(SLD: cast<VPStridedLoadSDNode>(Val: N), Lo, Hi); |
1024 | break; |
1025 | case ISD::MLOAD: |
1026 | SplitVecRes_MLOAD(MLD: cast<MaskedLoadSDNode>(Val: N), Lo, Hi); |
1027 | break; |
1028 | case ISD::MGATHER: |
1029 | case ISD::VP_GATHER: |
1030 | SplitVecRes_Gather(VPGT: cast<MemSDNode>(Val: N), Lo, Hi, /*SplitSETCC*/ true); |
1031 | break; |
1032 | case ISD::SETCC: |
1033 | case ISD::VP_SETCC: |
1034 | SplitVecRes_SETCC(N, Lo, Hi); |
1035 | break; |
1036 | case ISD::VECTOR_REVERSE: |
1037 | SplitVecRes_VECTOR_REVERSE(N, Lo, Hi); |
1038 | break; |
1039 | case ISD::VECTOR_SHUFFLE: |
1040 | SplitVecRes_VECTOR_SHUFFLE(N: cast<ShuffleVectorSDNode>(Val: N), Lo, Hi); |
1041 | break; |
1042 | case ISD::VECTOR_SPLICE: |
1043 | SplitVecRes_VECTOR_SPLICE(N, Lo, Hi); |
1044 | break; |
1045 | case ISD::VECTOR_DEINTERLEAVE: |
1046 | SplitVecRes_VECTOR_DEINTERLEAVE(N); |
1047 | return; |
1048 | case ISD::VECTOR_INTERLEAVE: |
1049 | SplitVecRes_VECTOR_INTERLEAVE(N); |
1050 | return; |
1051 | case ISD::VAARG: |
1052 | SplitVecRes_VAARG(N, Lo, Hi); |
1053 | break; |
1054 | |
1055 | case ISD::ANY_EXTEND_VECTOR_INREG: |
1056 | case ISD::SIGN_EXTEND_VECTOR_INREG: |
1057 | case ISD::ZERO_EXTEND_VECTOR_INREG: |
1058 | SplitVecRes_ExtVecInRegOp(N, Lo, Hi); |
1059 | break; |
1060 | |
1061 | case ISD::ABS: |
1062 | case ISD::VP_ABS: |
1063 | case ISD::BITREVERSE: |
1064 | case ISD::VP_BITREVERSE: |
1065 | case ISD::BSWAP: |
1066 | case ISD::VP_BSWAP: |
1067 | case ISD::CTLZ: |
1068 | case ISD::VP_CTLZ: |
1069 | case ISD::CTTZ: |
1070 | case ISD::VP_CTTZ: |
1071 | case ISD::CTLZ_ZERO_UNDEF: |
1072 | case ISD::VP_CTLZ_ZERO_UNDEF: |
1073 | case ISD::CTTZ_ZERO_UNDEF: |
1074 | case ISD::VP_CTTZ_ZERO_UNDEF: |
1075 | case ISD::CTPOP: |
1076 | case ISD::VP_CTPOP: |
1077 | case ISD::FABS: case ISD::VP_FABS: |
1078 | case ISD::FCEIL: |
1079 | case ISD::VP_FCEIL: |
1080 | case ISD::FCOS: |
1081 | case ISD::FEXP: |
1082 | case ISD::FEXP2: |
1083 | case ISD::FEXP10: |
1084 | case ISD::FFLOOR: |
1085 | case ISD::VP_FFLOOR: |
1086 | case ISD::FLOG: |
1087 | case ISD::FLOG10: |
1088 | case ISD::FLOG2: |
1089 | case ISD::FNEARBYINT: |
1090 | case ISD::VP_FNEARBYINT: |
1091 | case ISD::FNEG: case ISD::VP_FNEG: |
1092 | case ISD::FREEZE: |
1093 | case ISD::ARITH_FENCE: |
1094 | case ISD::FP_EXTEND: |
1095 | case ISD::VP_FP_EXTEND: |
1096 | case ISD::FP_ROUND: |
1097 | case ISD::VP_FP_ROUND: |
1098 | case ISD::FP_TO_SINT: |
1099 | case ISD::VP_FP_TO_SINT: |
1100 | case ISD::FP_TO_UINT: |
1101 | case ISD::VP_FP_TO_UINT: |
1102 | case ISD::FRINT: |
1103 | case ISD::VP_FRINT: |
1104 | case ISD::LRINT: |
1105 | case ISD::LLRINT: |
1106 | case ISD::FROUND: |
1107 | case ISD::VP_FROUND: |
1108 | case ISD::FROUNDEVEN: |
1109 | case ISD::VP_FROUNDEVEN: |
1110 | case ISD::FSIN: |
1111 | case ISD::FSQRT: case ISD::VP_SQRT: |
1112 | case ISD::FTRUNC: |
1113 | case ISD::VP_FROUNDTOZERO: |
1114 | case ISD::SINT_TO_FP: |
1115 | case ISD::VP_SINT_TO_FP: |
1116 | case ISD::TRUNCATE: |
1117 | case ISD::VP_TRUNCATE: |
1118 | case ISD::UINT_TO_FP: |
1119 | case ISD::VP_UINT_TO_FP: |
1120 | case ISD::FCANONICALIZE: |
1121 | SplitVecRes_UnaryOp(N, Lo, Hi); |
1122 | break; |
1123 | case ISD::FFREXP: |
1124 | SplitVecRes_FFREXP(N, ResNo, Lo, Hi); |
1125 | break; |
1126 | |
1127 | case ISD::ANY_EXTEND: |
1128 | case ISD::SIGN_EXTEND: |
1129 | case ISD::ZERO_EXTEND: |
1130 | case ISD::VP_SIGN_EXTEND: |
1131 | case ISD::VP_ZERO_EXTEND: |
1132 | SplitVecRes_ExtendOp(N, Lo, Hi); |
1133 | break; |
1134 | |
1135 | case ISD::ADD: case ISD::VP_ADD: |
1136 | case ISD::SUB: case ISD::VP_SUB: |
1137 | case ISD::MUL: case ISD::VP_MUL: |
1138 | case ISD::MULHS: |
1139 | case ISD::MULHU: |
1140 | case ISD::FADD: case ISD::VP_FADD: |
1141 | case ISD::FSUB: case ISD::VP_FSUB: |
1142 | case ISD::FMUL: case ISD::VP_FMUL: |
1143 | case ISD::FMINNUM: case ISD::VP_FMINNUM: |
1144 | case ISD::FMAXNUM: case ISD::VP_FMAXNUM: |
1145 | case ISD::FMINIMUM: |
1146 | case ISD::VP_FMINIMUM: |
1147 | case ISD::FMAXIMUM: |
1148 | case ISD::VP_FMAXIMUM: |
1149 | case ISD::SDIV: case ISD::VP_SDIV: |
1150 | case ISD::UDIV: case ISD::VP_UDIV: |
1151 | case ISD::FDIV: case ISD::VP_FDIV: |
1152 | case ISD::FPOW: |
1153 | case ISD::AND: case ISD::VP_AND: |
1154 | case ISD::OR: case ISD::VP_OR: |
1155 | case ISD::XOR: case ISD::VP_XOR: |
1156 | case ISD::SHL: case ISD::VP_SHL: |
1157 | case ISD::SRA: case ISD::VP_ASHR: |
1158 | case ISD::SRL: case ISD::VP_LSHR: |
1159 | case ISD::UREM: case ISD::VP_UREM: |
1160 | case ISD::SREM: case ISD::VP_SREM: |
1161 | case ISD::FREM: case ISD::VP_FREM: |
1162 | case ISD::SMIN: case ISD::VP_SMIN: |
1163 | case ISD::SMAX: case ISD::VP_SMAX: |
1164 | case ISD::UMIN: case ISD::VP_UMIN: |
1165 | case ISD::UMAX: case ISD::VP_UMAX: |
1166 | case ISD::SADDSAT: |
1167 | case ISD::UADDSAT: |
1168 | case ISD::SSUBSAT: |
1169 | case ISD::USUBSAT: |
1170 | case ISD::SSHLSAT: |
1171 | case ISD::USHLSAT: |
1172 | case ISD::ROTL: |
1173 | case ISD::ROTR: |
1174 | case ISD::VP_FCOPYSIGN: |
1175 | SplitVecRes_BinOp(N, Lo, Hi); |
1176 | break; |
1177 | case ISD::FMA: case ISD::VP_FMA: |
1178 | case ISD::FSHL: |
1179 | case ISD::VP_FSHL: |
1180 | case ISD::FSHR: |
1181 | case ISD::VP_FSHR: |
1182 | SplitVecRes_TernaryOp(N, Lo, Hi); |
1183 | break; |
1184 | |
1185 | #define DAG_INSTRUCTION(NAME, NARG, ROUND_MODE, INTRINSIC, DAGN) \ |
1186 | case ISD::STRICT_##DAGN: |
1187 | #include "llvm/IR/ConstrainedOps.def" |
1188 | SplitVecRes_StrictFPOp(N, Lo, Hi); |
1189 | break; |
1190 | |
1191 | case ISD::FP_TO_UINT_SAT: |
1192 | case ISD::FP_TO_SINT_SAT: |
1193 | SplitVecRes_FP_TO_XINT_SAT(N, Lo, Hi); |
1194 | break; |
1195 | |
1196 | case ISD::UADDO: |
1197 | case ISD::SADDO: |
1198 | case ISD::USUBO: |
1199 | case ISD::SSUBO: |
1200 | case ISD::UMULO: |
1201 | case ISD::SMULO: |
1202 | SplitVecRes_OverflowOp(N, ResNo, Lo, Hi); |
1203 | break; |
1204 | case ISD::SMULFIX: |
1205 | case ISD::SMULFIXSAT: |
1206 | case ISD::UMULFIX: |
1207 | case ISD::UMULFIXSAT: |
1208 | case ISD::SDIVFIX: |
1209 | case ISD::SDIVFIXSAT: |
1210 | case ISD::UDIVFIX: |
1211 | case ISD::UDIVFIXSAT: |
1212 | SplitVecRes_FIX(N, Lo, Hi); |
1213 | break; |
1214 | case ISD::EXPERIMENTAL_VP_REVERSE: |
1215 | SplitVecRes_VP_REVERSE(N, Lo, Hi); |
1216 | break; |
1217 | } |
1218 | |
1219 | // If Lo/Hi is null, the sub-method took care of registering results etc. |
1220 | if (Lo.getNode()) |
1221 | SetSplitVector(Op: SDValue(N, ResNo), Lo, Hi); |
1222 | } |
1223 | |
1224 | void DAGTypeLegalizer::IncrementPointer(MemSDNode *N, EVT MemVT, |
1225 | MachinePointerInfo &MPI, SDValue &Ptr, |
1226 | uint64_t *ScaledOffset) { |
1227 | SDLoc DL(N); |
1228 | unsigned IncrementSize = MemVT.getSizeInBits().getKnownMinValue() / 8; |
1229 | |
1230 | if (MemVT.isScalableVector()) { |
1231 | SDNodeFlags Flags; |
1232 | SDValue BytesIncrement = DAG.getVScale( |
1233 | DL, VT: Ptr.getValueType(), |
1234 | MulImm: APInt(Ptr.getValueSizeInBits().getFixedValue(), IncrementSize)); |
1235 | MPI = MachinePointerInfo(N->getPointerInfo().getAddrSpace()); |
1236 | Flags.setNoUnsignedWrap(true); |
1237 | if (ScaledOffset) |
1238 | *ScaledOffset += IncrementSize; |
1239 | Ptr = DAG.getNode(Opcode: ISD::ADD, DL, VT: Ptr.getValueType(), N1: Ptr, N2: BytesIncrement, |
1240 | Flags); |
1241 | } else { |
1242 | MPI = N->getPointerInfo().getWithOffset(O: IncrementSize); |
1243 | // Increment the pointer to the other half. |
1244 | Ptr = DAG.getObjectPtrOffset(SL: DL, Ptr, Offset: TypeSize::getFixed(ExactSize: IncrementSize)); |
1245 | } |
1246 | } |
1247 | |
1248 | std::pair<SDValue, SDValue> DAGTypeLegalizer::SplitMask(SDValue Mask) { |
1249 | return SplitMask(Mask, DL: SDLoc(Mask)); |
1250 | } |
1251 | |
1252 | std::pair<SDValue, SDValue> DAGTypeLegalizer::SplitMask(SDValue Mask, |
1253 | const SDLoc &DL) { |
1254 | SDValue MaskLo, MaskHi; |
1255 | EVT MaskVT = Mask.getValueType(); |
1256 | if (getTypeAction(VT: MaskVT) == TargetLowering::TypeSplitVector) |
1257 | GetSplitVector(Op: Mask, Lo&: MaskLo, Hi&: MaskHi); |
1258 | else |
1259 | std::tie(args&: MaskLo, args&: MaskHi) = DAG.SplitVector(N: Mask, DL); |
1260 | return std::make_pair(x&: MaskLo, y&: MaskHi); |
1261 | } |
1262 | |
1263 | void DAGTypeLegalizer::SplitVecRes_BinOp(SDNode *N, SDValue &Lo, SDValue &Hi) { |
1264 | SDValue LHSLo, LHSHi; |
1265 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: LHSLo, Hi&: LHSHi); |
1266 | SDValue RHSLo, RHSHi; |
1267 | GetSplitVector(Op: N->getOperand(Num: 1), Lo&: RHSLo, Hi&: RHSHi); |
1268 | SDLoc dl(N); |
1269 | |
1270 | const SDNodeFlags Flags = N->getFlags(); |
1271 | unsigned Opcode = N->getOpcode(); |
1272 | if (N->getNumOperands() == 2) { |
1273 | Lo = DAG.getNode(Opcode, DL: dl, VT: LHSLo.getValueType(), N1: LHSLo, N2: RHSLo, Flags); |
1274 | Hi = DAG.getNode(Opcode, DL: dl, VT: LHSHi.getValueType(), N1: LHSHi, N2: RHSHi, Flags); |
1275 | return; |
1276 | } |
1277 | |
1278 | assert(N->getNumOperands() == 4 && "Unexpected number of operands!" ); |
1279 | assert(N->isVPOpcode() && "Expected VP opcode" ); |
1280 | |
1281 | SDValue MaskLo, MaskHi; |
1282 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: N->getOperand(Num: 2)); |
1283 | |
1284 | SDValue EVLLo, EVLHi; |
1285 | std::tie(args&: EVLLo, args&: EVLHi) = |
1286 | DAG.SplitEVL(N: N->getOperand(Num: 3), VecVT: N->getValueType(ResNo: 0), DL: dl); |
1287 | |
1288 | Lo = DAG.getNode(Opcode, DL: dl, VT: LHSLo.getValueType(), |
1289 | Ops: {LHSLo, RHSLo, MaskLo, EVLLo}, Flags); |
1290 | Hi = DAG.getNode(Opcode, DL: dl, VT: LHSHi.getValueType(), |
1291 | Ops: {LHSHi, RHSHi, MaskHi, EVLHi}, Flags); |
1292 | } |
1293 | |
1294 | void DAGTypeLegalizer::SplitVecRes_TernaryOp(SDNode *N, SDValue &Lo, |
1295 | SDValue &Hi) { |
1296 | SDValue Op0Lo, Op0Hi; |
1297 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: Op0Lo, Hi&: Op0Hi); |
1298 | SDValue Op1Lo, Op1Hi; |
1299 | GetSplitVector(Op: N->getOperand(Num: 1), Lo&: Op1Lo, Hi&: Op1Hi); |
1300 | SDValue Op2Lo, Op2Hi; |
1301 | GetSplitVector(Op: N->getOperand(Num: 2), Lo&: Op2Lo, Hi&: Op2Hi); |
1302 | SDLoc dl(N); |
1303 | |
1304 | const SDNodeFlags Flags = N->getFlags(); |
1305 | unsigned Opcode = N->getOpcode(); |
1306 | if (N->getNumOperands() == 3) { |
1307 | Lo = DAG.getNode(Opcode, DL: dl, VT: Op0Lo.getValueType(), N1: Op0Lo, N2: Op1Lo, N3: Op2Lo, Flags); |
1308 | Hi = DAG.getNode(Opcode, DL: dl, VT: Op0Hi.getValueType(), N1: Op0Hi, N2: Op1Hi, N3: Op2Hi, Flags); |
1309 | return; |
1310 | } |
1311 | |
1312 | assert(N->getNumOperands() == 5 && "Unexpected number of operands!" ); |
1313 | assert(N->isVPOpcode() && "Expected VP opcode" ); |
1314 | |
1315 | SDValue MaskLo, MaskHi; |
1316 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: N->getOperand(Num: 3)); |
1317 | |
1318 | SDValue EVLLo, EVLHi; |
1319 | std::tie(args&: EVLLo, args&: EVLHi) = |
1320 | DAG.SplitEVL(N: N->getOperand(Num: 4), VecVT: N->getValueType(ResNo: 0), DL: dl); |
1321 | |
1322 | Lo = DAG.getNode(Opcode, DL: dl, VT: Op0Lo.getValueType(), |
1323 | Ops: {Op0Lo, Op1Lo, Op2Lo, MaskLo, EVLLo}, Flags); |
1324 | Hi = DAG.getNode(Opcode, DL: dl, VT: Op0Hi.getValueType(), |
1325 | Ops: {Op0Hi, Op1Hi, Op2Hi, MaskHi, EVLHi}, Flags); |
1326 | } |
1327 | |
1328 | void DAGTypeLegalizer::SplitVecRes_FIX(SDNode *N, SDValue &Lo, SDValue &Hi) { |
1329 | SDValue LHSLo, LHSHi; |
1330 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: LHSLo, Hi&: LHSHi); |
1331 | SDValue RHSLo, RHSHi; |
1332 | GetSplitVector(Op: N->getOperand(Num: 1), Lo&: RHSLo, Hi&: RHSHi); |
1333 | SDLoc dl(N); |
1334 | SDValue Op2 = N->getOperand(Num: 2); |
1335 | |
1336 | unsigned Opcode = N->getOpcode(); |
1337 | Lo = DAG.getNode(Opcode, DL: dl, VT: LHSLo.getValueType(), N1: LHSLo, N2: RHSLo, N3: Op2, |
1338 | Flags: N->getFlags()); |
1339 | Hi = DAG.getNode(Opcode, DL: dl, VT: LHSHi.getValueType(), N1: LHSHi, N2: RHSHi, N3: Op2, |
1340 | Flags: N->getFlags()); |
1341 | } |
1342 | |
1343 | void DAGTypeLegalizer::SplitVecRes_BITCAST(SDNode *N, SDValue &Lo, |
1344 | SDValue &Hi) { |
1345 | // We know the result is a vector. The input may be either a vector or a |
1346 | // scalar value. |
1347 | EVT LoVT, HiVT; |
1348 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
1349 | SDLoc dl(N); |
1350 | |
1351 | SDValue InOp = N->getOperand(Num: 0); |
1352 | EVT InVT = InOp.getValueType(); |
1353 | |
1354 | // Handle some special cases efficiently. |
1355 | switch (getTypeAction(VT: InVT)) { |
1356 | case TargetLowering::TypeLegal: |
1357 | case TargetLowering::TypePromoteInteger: |
1358 | case TargetLowering::TypePromoteFloat: |
1359 | case TargetLowering::TypeSoftPromoteHalf: |
1360 | case TargetLowering::TypeSoftenFloat: |
1361 | case TargetLowering::TypeScalarizeVector: |
1362 | case TargetLowering::TypeWidenVector: |
1363 | break; |
1364 | case TargetLowering::TypeExpandInteger: |
1365 | case TargetLowering::TypeExpandFloat: |
1366 | // A scalar to vector conversion, where the scalar needs expansion. |
1367 | // If the vector is being split in two then we can just convert the |
1368 | // expanded pieces. |
1369 | if (LoVT == HiVT) { |
1370 | GetExpandedOp(Op: InOp, Lo, Hi); |
1371 | if (DAG.getDataLayout().isBigEndian()) |
1372 | std::swap(a&: Lo, b&: Hi); |
1373 | Lo = DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: LoVT, Operand: Lo); |
1374 | Hi = DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: HiVT, Operand: Hi); |
1375 | return; |
1376 | } |
1377 | break; |
1378 | case TargetLowering::TypeSplitVector: |
1379 | // If the input is a vector that needs to be split, convert each split |
1380 | // piece of the input now. |
1381 | GetSplitVector(Op: InOp, Lo, Hi); |
1382 | Lo = DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: LoVT, Operand: Lo); |
1383 | Hi = DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: HiVT, Operand: Hi); |
1384 | return; |
1385 | case TargetLowering::TypeScalarizeScalableVector: |
1386 | report_fatal_error(reason: "Scalarization of scalable vectors is not supported." ); |
1387 | } |
1388 | |
1389 | // In the general case, convert the input to an integer and split it by hand. |
1390 | EVT LoIntVT = EVT::getIntegerVT(Context&: *DAG.getContext(), BitWidth: LoVT.getSizeInBits()); |
1391 | EVT HiIntVT = EVT::getIntegerVT(Context&: *DAG.getContext(), BitWidth: HiVT.getSizeInBits()); |
1392 | if (DAG.getDataLayout().isBigEndian()) |
1393 | std::swap(a&: LoIntVT, b&: HiIntVT); |
1394 | |
1395 | SplitInteger(Op: BitConvertToInteger(Op: InOp), LoVT: LoIntVT, HiVT: HiIntVT, Lo, Hi); |
1396 | |
1397 | if (DAG.getDataLayout().isBigEndian()) |
1398 | std::swap(a&: Lo, b&: Hi); |
1399 | Lo = DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: LoVT, Operand: Lo); |
1400 | Hi = DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: HiVT, Operand: Hi); |
1401 | } |
1402 | |
1403 | void DAGTypeLegalizer::SplitVecRes_BUILD_VECTOR(SDNode *N, SDValue &Lo, |
1404 | SDValue &Hi) { |
1405 | EVT LoVT, HiVT; |
1406 | SDLoc dl(N); |
1407 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
1408 | unsigned LoNumElts = LoVT.getVectorNumElements(); |
1409 | SmallVector<SDValue, 8> LoOps(N->op_begin(), N->op_begin()+LoNumElts); |
1410 | Lo = DAG.getBuildVector(VT: LoVT, DL: dl, Ops: LoOps); |
1411 | |
1412 | SmallVector<SDValue, 8> HiOps(N->op_begin()+LoNumElts, N->op_end()); |
1413 | Hi = DAG.getBuildVector(VT: HiVT, DL: dl, Ops: HiOps); |
1414 | } |
1415 | |
1416 | void DAGTypeLegalizer::SplitVecRes_CONCAT_VECTORS(SDNode *N, SDValue &Lo, |
1417 | SDValue &Hi) { |
1418 | assert(!(N->getNumOperands() & 1) && "Unsupported CONCAT_VECTORS" ); |
1419 | SDLoc dl(N); |
1420 | unsigned NumSubvectors = N->getNumOperands() / 2; |
1421 | if (NumSubvectors == 1) { |
1422 | Lo = N->getOperand(Num: 0); |
1423 | Hi = N->getOperand(Num: 1); |
1424 | return; |
1425 | } |
1426 | |
1427 | EVT LoVT, HiVT; |
1428 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
1429 | |
1430 | SmallVector<SDValue, 8> LoOps(N->op_begin(), N->op_begin()+NumSubvectors); |
1431 | Lo = DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: LoVT, Ops: LoOps); |
1432 | |
1433 | SmallVector<SDValue, 8> HiOps(N->op_begin()+NumSubvectors, N->op_end()); |
1434 | Hi = DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: HiVT, Ops: HiOps); |
1435 | } |
1436 | |
1437 | void DAGTypeLegalizer::(SDNode *N, SDValue &Lo, |
1438 | SDValue &Hi) { |
1439 | SDValue Vec = N->getOperand(Num: 0); |
1440 | SDValue Idx = N->getOperand(Num: 1); |
1441 | SDLoc dl(N); |
1442 | |
1443 | EVT LoVT, HiVT; |
1444 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
1445 | |
1446 | Lo = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: LoVT, N1: Vec, N2: Idx); |
1447 | uint64_t IdxVal = Idx->getAsZExtVal(); |
1448 | Hi = DAG.getNode( |
1449 | Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: HiVT, N1: Vec, |
1450 | N2: DAG.getVectorIdxConstant(Val: IdxVal + LoVT.getVectorMinNumElements(), DL: dl)); |
1451 | } |
1452 | |
1453 | void DAGTypeLegalizer::SplitVecRes_INSERT_SUBVECTOR(SDNode *N, SDValue &Lo, |
1454 | SDValue &Hi) { |
1455 | SDValue Vec = N->getOperand(Num: 0); |
1456 | SDValue SubVec = N->getOperand(Num: 1); |
1457 | SDValue Idx = N->getOperand(Num: 2); |
1458 | SDLoc dl(N); |
1459 | GetSplitVector(Op: Vec, Lo, Hi); |
1460 | |
1461 | EVT VecVT = Vec.getValueType(); |
1462 | EVT LoVT = Lo.getValueType(); |
1463 | EVT SubVecVT = SubVec.getValueType(); |
1464 | unsigned VecElems = VecVT.getVectorMinNumElements(); |
1465 | unsigned SubElems = SubVecVT.getVectorMinNumElements(); |
1466 | unsigned LoElems = LoVT.getVectorMinNumElements(); |
1467 | |
1468 | // If we know the index is in the first half, and we know the subvector |
1469 | // doesn't cross the boundary between the halves, we can avoid spilling the |
1470 | // vector, and insert into the lower half of the split vector directly. |
1471 | unsigned IdxVal = Idx->getAsZExtVal(); |
1472 | if (IdxVal + SubElems <= LoElems) { |
1473 | Lo = DAG.getNode(Opcode: ISD::INSERT_SUBVECTOR, DL: dl, VT: LoVT, N1: Lo, N2: SubVec, N3: Idx); |
1474 | return; |
1475 | } |
1476 | // Similarly if the subvector is fully in the high half, but mind that we |
1477 | // can't tell whether a fixed-length subvector is fully within the high half |
1478 | // of a scalable vector. |
1479 | if (VecVT.isScalableVector() == SubVecVT.isScalableVector() && |
1480 | IdxVal >= LoElems && IdxVal + SubElems <= VecElems) { |
1481 | Hi = DAG.getNode(Opcode: ISD::INSERT_SUBVECTOR, DL: dl, VT: Hi.getValueType(), N1: Hi, N2: SubVec, |
1482 | N3: DAG.getVectorIdxConstant(Val: IdxVal - LoElems, DL: dl)); |
1483 | return; |
1484 | } |
1485 | |
1486 | // Spill the vector to the stack. |
1487 | // In cases where the vector is illegal it will be broken down into parts |
1488 | // and stored in parts - we should use the alignment for the smallest part. |
1489 | Align SmallestAlign = DAG.getReducedAlign(VT: VecVT, /*UseABI=*/false); |
1490 | SDValue StackPtr = |
1491 | DAG.CreateStackTemporary(Bytes: VecVT.getStoreSize(), Alignment: SmallestAlign); |
1492 | auto &MF = DAG.getMachineFunction(); |
1493 | auto FrameIndex = cast<FrameIndexSDNode>(Val: StackPtr.getNode())->getIndex(); |
1494 | auto PtrInfo = MachinePointerInfo::getFixedStack(MF, FI: FrameIndex); |
1495 | |
1496 | SDValue Store = DAG.getStore(Chain: DAG.getEntryNode(), dl, Val: Vec, Ptr: StackPtr, PtrInfo, |
1497 | Alignment: SmallestAlign); |
1498 | |
1499 | // Store the new subvector into the specified index. |
1500 | SDValue SubVecPtr = |
1501 | TLI.getVectorSubVecPointer(DAG, VecPtr: StackPtr, VecVT, SubVecVT, Index: Idx); |
1502 | Store = DAG.getStore(Chain: Store, dl, Val: SubVec, Ptr: SubVecPtr, |
1503 | PtrInfo: MachinePointerInfo::getUnknownStack(MF)); |
1504 | |
1505 | // Load the Lo part from the stack slot. |
1506 | Lo = DAG.getLoad(VT: Lo.getValueType(), dl, Chain: Store, Ptr: StackPtr, PtrInfo, |
1507 | Alignment: SmallestAlign); |
1508 | |
1509 | // Increment the pointer to the other part. |
1510 | auto *Load = cast<LoadSDNode>(Val&: Lo); |
1511 | MachinePointerInfo MPI = Load->getPointerInfo(); |
1512 | IncrementPointer(N: Load, MemVT: LoVT, MPI, Ptr&: StackPtr); |
1513 | |
1514 | // Load the Hi part from the stack slot. |
1515 | Hi = DAG.getLoad(VT: Hi.getValueType(), dl, Chain: Store, Ptr: StackPtr, PtrInfo: MPI, Alignment: SmallestAlign); |
1516 | } |
1517 | |
1518 | // Handle splitting an FP where the second operand does not match the first |
1519 | // type. The second operand may be a scalar, or a vector that has exactly as |
1520 | // many elements as the first |
1521 | void DAGTypeLegalizer::SplitVecRes_FPOp_MultiType(SDNode *N, SDValue &Lo, |
1522 | SDValue &Hi) { |
1523 | SDValue LHSLo, LHSHi; |
1524 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: LHSLo, Hi&: LHSHi); |
1525 | SDLoc DL(N); |
1526 | |
1527 | SDValue RHSLo, RHSHi; |
1528 | SDValue RHS = N->getOperand(Num: 1); |
1529 | EVT RHSVT = RHS.getValueType(); |
1530 | if (RHSVT.isVector()) { |
1531 | if (getTypeAction(VT: RHSVT) == TargetLowering::TypeSplitVector) |
1532 | GetSplitVector(Op: RHS, Lo&: RHSLo, Hi&: RHSHi); |
1533 | else |
1534 | std::tie(args&: RHSLo, args&: RHSHi) = DAG.SplitVector(N: RHS, DL: SDLoc(RHS)); |
1535 | |
1536 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL, VT: LHSLo.getValueType(), N1: LHSLo, N2: RHSLo); |
1537 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL, VT: LHSHi.getValueType(), N1: LHSHi, N2: RHSHi); |
1538 | } else { |
1539 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL, VT: LHSLo.getValueType(), N1: LHSLo, N2: RHS); |
1540 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL, VT: LHSHi.getValueType(), N1: LHSHi, N2: RHS); |
1541 | } |
1542 | } |
1543 | |
1544 | void DAGTypeLegalizer::SplitVecRes_IS_FPCLASS(SDNode *N, SDValue &Lo, |
1545 | SDValue &Hi) { |
1546 | SDLoc DL(N); |
1547 | SDValue ArgLo, ArgHi; |
1548 | SDValue Test = N->getOperand(Num: 1); |
1549 | SDValue FpValue = N->getOperand(Num: 0); |
1550 | if (getTypeAction(VT: FpValue.getValueType()) == TargetLowering::TypeSplitVector) |
1551 | GetSplitVector(Op: FpValue, Lo&: ArgLo, Hi&: ArgHi); |
1552 | else |
1553 | std::tie(args&: ArgLo, args&: ArgHi) = DAG.SplitVector(N: FpValue, DL: SDLoc(FpValue)); |
1554 | EVT LoVT, HiVT; |
1555 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
1556 | |
1557 | Lo = DAG.getNode(Opcode: ISD::IS_FPCLASS, DL, VT: LoVT, N1: ArgLo, N2: Test, Flags: N->getFlags()); |
1558 | Hi = DAG.getNode(Opcode: ISD::IS_FPCLASS, DL, VT: HiVT, N1: ArgHi, N2: Test, Flags: N->getFlags()); |
1559 | } |
1560 | |
1561 | void DAGTypeLegalizer::SplitVecRes_InregOp(SDNode *N, SDValue &Lo, |
1562 | SDValue &Hi) { |
1563 | SDValue LHSLo, LHSHi; |
1564 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: LHSLo, Hi&: LHSHi); |
1565 | SDLoc dl(N); |
1566 | |
1567 | EVT LoVT, HiVT; |
1568 | std::tie(args&: LoVT, args&: HiVT) = |
1569 | DAG.GetSplitDestVTs(VT: cast<VTSDNode>(Val: N->getOperand(Num: 1))->getVT()); |
1570 | |
1571 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: LHSLo.getValueType(), N1: LHSLo, |
1572 | N2: DAG.getValueType(LoVT)); |
1573 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: LHSHi.getValueType(), N1: LHSHi, |
1574 | N2: DAG.getValueType(HiVT)); |
1575 | } |
1576 | |
1577 | void DAGTypeLegalizer::SplitVecRes_ExtVecInRegOp(SDNode *N, SDValue &Lo, |
1578 | SDValue &Hi) { |
1579 | unsigned Opcode = N->getOpcode(); |
1580 | SDValue N0 = N->getOperand(Num: 0); |
1581 | |
1582 | SDLoc dl(N); |
1583 | SDValue InLo, InHi; |
1584 | |
1585 | if (getTypeAction(VT: N0.getValueType()) == TargetLowering::TypeSplitVector) |
1586 | GetSplitVector(Op: N0, Lo&: InLo, Hi&: InHi); |
1587 | else |
1588 | std::tie(args&: InLo, args&: InHi) = DAG.SplitVectorOperand(N, OpNo: 0); |
1589 | |
1590 | EVT InLoVT = InLo.getValueType(); |
1591 | unsigned InNumElements = InLoVT.getVectorNumElements(); |
1592 | |
1593 | EVT OutLoVT, OutHiVT; |
1594 | std::tie(args&: OutLoVT, args&: OutHiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
1595 | unsigned OutNumElements = OutLoVT.getVectorNumElements(); |
1596 | assert((2 * OutNumElements) <= InNumElements && |
1597 | "Illegal extend vector in reg split" ); |
1598 | |
1599 | // *_EXTEND_VECTOR_INREG instructions extend the lowest elements of the |
1600 | // input vector (i.e. we only use InLo): |
1601 | // OutLo will extend the first OutNumElements from InLo. |
1602 | // OutHi will extend the next OutNumElements from InLo. |
1603 | |
1604 | // Shuffle the elements from InLo for OutHi into the bottom elements to |
1605 | // create a 'fake' InHi. |
1606 | SmallVector<int, 8> SplitHi(InNumElements, -1); |
1607 | for (unsigned i = 0; i != OutNumElements; ++i) |
1608 | SplitHi[i] = i + OutNumElements; |
1609 | InHi = DAG.getVectorShuffle(VT: InLoVT, dl, N1: InLo, N2: DAG.getUNDEF(VT: InLoVT), Mask: SplitHi); |
1610 | |
1611 | Lo = DAG.getNode(Opcode, DL: dl, VT: OutLoVT, Operand: InLo); |
1612 | Hi = DAG.getNode(Opcode, DL: dl, VT: OutHiVT, Operand: InHi); |
1613 | } |
1614 | |
1615 | void DAGTypeLegalizer::SplitVecRes_StrictFPOp(SDNode *N, SDValue &Lo, |
1616 | SDValue &Hi) { |
1617 | unsigned NumOps = N->getNumOperands(); |
1618 | SDValue Chain = N->getOperand(Num: 0); |
1619 | EVT LoVT, HiVT; |
1620 | SDLoc dl(N); |
1621 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
1622 | |
1623 | SmallVector<SDValue, 4> OpsLo(NumOps); |
1624 | SmallVector<SDValue, 4> OpsHi(NumOps); |
1625 | |
1626 | // The Chain is the first operand. |
1627 | OpsLo[0] = Chain; |
1628 | OpsHi[0] = Chain; |
1629 | |
1630 | // Now process the remaining operands. |
1631 | for (unsigned i = 1; i < NumOps; ++i) { |
1632 | SDValue Op = N->getOperand(Num: i); |
1633 | SDValue OpLo = Op; |
1634 | SDValue OpHi = Op; |
1635 | |
1636 | EVT InVT = Op.getValueType(); |
1637 | if (InVT.isVector()) { |
1638 | // If the input also splits, handle it directly for a |
1639 | // compile time speedup. Otherwise split it by hand. |
1640 | if (getTypeAction(VT: InVT) == TargetLowering::TypeSplitVector) |
1641 | GetSplitVector(Op, Lo&: OpLo, Hi&: OpHi); |
1642 | else |
1643 | std::tie(args&: OpLo, args&: OpHi) = DAG.SplitVectorOperand(N, OpNo: i); |
1644 | } |
1645 | |
1646 | OpsLo[i] = OpLo; |
1647 | OpsHi[i] = OpHi; |
1648 | } |
1649 | |
1650 | EVT LoValueVTs[] = {LoVT, MVT::Other}; |
1651 | EVT HiValueVTs[] = {HiVT, MVT::Other}; |
1652 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VTList: DAG.getVTList(LoValueVTs), Ops: OpsLo, |
1653 | Flags: N->getFlags()); |
1654 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VTList: DAG.getVTList(HiValueVTs), Ops: OpsHi, |
1655 | Flags: N->getFlags()); |
1656 | |
1657 | // Build a factor node to remember that this Op is independent of the |
1658 | // other one. |
1659 | Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, |
1660 | Lo.getValue(R: 1), Hi.getValue(R: 1)); |
1661 | |
1662 | // Legalize the chain result - switch anything that used the old chain to |
1663 | // use the new one. |
1664 | ReplaceValueWith(From: SDValue(N, 1), To: Chain); |
1665 | } |
1666 | |
1667 | SDValue DAGTypeLegalizer::UnrollVectorOp_StrictFP(SDNode *N, unsigned ResNE) { |
1668 | SDValue Chain = N->getOperand(Num: 0); |
1669 | EVT VT = N->getValueType(ResNo: 0); |
1670 | unsigned NE = VT.getVectorNumElements(); |
1671 | EVT EltVT = VT.getVectorElementType(); |
1672 | SDLoc dl(N); |
1673 | |
1674 | SmallVector<SDValue, 8> Scalars; |
1675 | SmallVector<SDValue, 4> Operands(N->getNumOperands()); |
1676 | |
1677 | // If ResNE is 0, fully unroll the vector op. |
1678 | if (ResNE == 0) |
1679 | ResNE = NE; |
1680 | else if (NE > ResNE) |
1681 | NE = ResNE; |
1682 | |
1683 | //The results of each unrolled operation, including the chain. |
1684 | EVT ChainVTs[] = {EltVT, MVT::Other}; |
1685 | SmallVector<SDValue, 8> Chains; |
1686 | |
1687 | unsigned i; |
1688 | for (i = 0; i != NE; ++i) { |
1689 | Operands[0] = Chain; |
1690 | for (unsigned j = 1, e = N->getNumOperands(); j != e; ++j) { |
1691 | SDValue Operand = N->getOperand(Num: j); |
1692 | EVT OperandVT = Operand.getValueType(); |
1693 | if (OperandVT.isVector()) { |
1694 | EVT OperandEltVT = OperandVT.getVectorElementType(); |
1695 | Operands[j] = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: OperandEltVT, |
1696 | N1: Operand, N2: DAG.getVectorIdxConstant(Val: i, DL: dl)); |
1697 | } else { |
1698 | Operands[j] = Operand; |
1699 | } |
1700 | } |
1701 | SDValue Scalar = DAG.getNode(N->getOpcode(), dl, ChainVTs, Operands); |
1702 | Scalar.getNode()->setFlags(N->getFlags()); |
1703 | |
1704 | //Add in the scalar as well as its chain value to the |
1705 | //result vectors. |
1706 | Scalars.push_back(Elt: Scalar); |
1707 | Chains.push_back(Elt: Scalar.getValue(R: 1)); |
1708 | } |
1709 | |
1710 | for (; i < ResNE; ++i) |
1711 | Scalars.push_back(Elt: DAG.getUNDEF(VT: EltVT)); |
1712 | |
1713 | // Build a new factor node to connect the chain back together. |
1714 | Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Chains); |
1715 | ReplaceValueWith(From: SDValue(N, 1), To: Chain); |
1716 | |
1717 | // Create a new BUILD_VECTOR node |
1718 | EVT VecVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: EltVT, NumElements: ResNE); |
1719 | return DAG.getBuildVector(VT: VecVT, DL: dl, Ops: Scalars); |
1720 | } |
1721 | |
1722 | void DAGTypeLegalizer::SplitVecRes_OverflowOp(SDNode *N, unsigned ResNo, |
1723 | SDValue &Lo, SDValue &Hi) { |
1724 | SDLoc dl(N); |
1725 | EVT ResVT = N->getValueType(ResNo: 0); |
1726 | EVT OvVT = N->getValueType(ResNo: 1); |
1727 | EVT LoResVT, HiResVT, LoOvVT, HiOvVT; |
1728 | std::tie(args&: LoResVT, args&: HiResVT) = DAG.GetSplitDestVTs(VT: ResVT); |
1729 | std::tie(args&: LoOvVT, args&: HiOvVT) = DAG.GetSplitDestVTs(VT: OvVT); |
1730 | |
1731 | SDValue LoLHS, HiLHS, LoRHS, HiRHS; |
1732 | if (getTypeAction(VT: ResVT) == TargetLowering::TypeSplitVector) { |
1733 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: LoLHS, Hi&: HiLHS); |
1734 | GetSplitVector(Op: N->getOperand(Num: 1), Lo&: LoRHS, Hi&: HiRHS); |
1735 | } else { |
1736 | std::tie(args&: LoLHS, args&: HiLHS) = DAG.SplitVectorOperand(N, OpNo: 0); |
1737 | std::tie(args&: LoRHS, args&: HiRHS) = DAG.SplitVectorOperand(N, OpNo: 1); |
1738 | } |
1739 | |
1740 | unsigned Opcode = N->getOpcode(); |
1741 | SDVTList LoVTs = DAG.getVTList(VT1: LoResVT, VT2: LoOvVT); |
1742 | SDVTList HiVTs = DAG.getVTList(VT1: HiResVT, VT2: HiOvVT); |
1743 | SDNode *LoNode = DAG.getNode(Opcode, DL: dl, VTList: LoVTs, N1: LoLHS, N2: LoRHS).getNode(); |
1744 | SDNode *HiNode = DAG.getNode(Opcode, DL: dl, VTList: HiVTs, N1: HiLHS, N2: HiRHS).getNode(); |
1745 | LoNode->setFlags(N->getFlags()); |
1746 | HiNode->setFlags(N->getFlags()); |
1747 | |
1748 | Lo = SDValue(LoNode, ResNo); |
1749 | Hi = SDValue(HiNode, ResNo); |
1750 | |
1751 | // Replace the other vector result not being explicitly split here. |
1752 | unsigned OtherNo = 1 - ResNo; |
1753 | EVT OtherVT = N->getValueType(ResNo: OtherNo); |
1754 | if (getTypeAction(VT: OtherVT) == TargetLowering::TypeSplitVector) { |
1755 | SetSplitVector(Op: SDValue(N, OtherNo), |
1756 | Lo: SDValue(LoNode, OtherNo), Hi: SDValue(HiNode, OtherNo)); |
1757 | } else { |
1758 | SDValue OtherVal = DAG.getNode( |
1759 | Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: OtherVT, |
1760 | N1: SDValue(LoNode, OtherNo), N2: SDValue(HiNode, OtherNo)); |
1761 | ReplaceValueWith(From: SDValue(N, OtherNo), To: OtherVal); |
1762 | } |
1763 | } |
1764 | |
1765 | void DAGTypeLegalizer::SplitVecRes_INSERT_VECTOR_ELT(SDNode *N, SDValue &Lo, |
1766 | SDValue &Hi) { |
1767 | SDValue Vec = N->getOperand(Num: 0); |
1768 | SDValue Elt = N->getOperand(Num: 1); |
1769 | SDValue Idx = N->getOperand(Num: 2); |
1770 | SDLoc dl(N); |
1771 | GetSplitVector(Op: Vec, Lo, Hi); |
1772 | |
1773 | if (ConstantSDNode *CIdx = dyn_cast<ConstantSDNode>(Val&: Idx)) { |
1774 | unsigned IdxVal = CIdx->getZExtValue(); |
1775 | unsigned LoNumElts = Lo.getValueType().getVectorMinNumElements(); |
1776 | if (IdxVal < LoNumElts) { |
1777 | Lo = DAG.getNode(Opcode: ISD::INSERT_VECTOR_ELT, DL: dl, |
1778 | VT: Lo.getValueType(), N1: Lo, N2: Elt, N3: Idx); |
1779 | return; |
1780 | } else if (!Vec.getValueType().isScalableVector()) { |
1781 | Hi = DAG.getNode(Opcode: ISD::INSERT_VECTOR_ELT, DL: dl, VT: Hi.getValueType(), N1: Hi, N2: Elt, |
1782 | N3: DAG.getVectorIdxConstant(Val: IdxVal - LoNumElts, DL: dl)); |
1783 | return; |
1784 | } |
1785 | } |
1786 | |
1787 | // See if the target wants to custom expand this node. |
1788 | if (CustomLowerNode(N, VT: N->getValueType(ResNo: 0), LegalizeResult: true)) |
1789 | return; |
1790 | |
1791 | // Make the vector elements byte-addressable if they aren't already. |
1792 | EVT VecVT = Vec.getValueType(); |
1793 | EVT EltVT = VecVT.getVectorElementType(); |
1794 | if (VecVT.getScalarSizeInBits() < 8) { |
1795 | EltVT = MVT::i8; |
1796 | VecVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: EltVT, |
1797 | EC: VecVT.getVectorElementCount()); |
1798 | Vec = DAG.getNode(Opcode: ISD::ANY_EXTEND, DL: dl, VT: VecVT, Operand: Vec); |
1799 | // Extend the element type to match if needed. |
1800 | if (EltVT.bitsGT(VT: Elt.getValueType())) |
1801 | Elt = DAG.getNode(Opcode: ISD::ANY_EXTEND, DL: dl, VT: EltVT, Operand: Elt); |
1802 | } |
1803 | |
1804 | // Spill the vector to the stack. |
1805 | // In cases where the vector is illegal it will be broken down into parts |
1806 | // and stored in parts - we should use the alignment for the smallest part. |
1807 | Align SmallestAlign = DAG.getReducedAlign(VT: VecVT, /*UseABI=*/false); |
1808 | SDValue StackPtr = |
1809 | DAG.CreateStackTemporary(Bytes: VecVT.getStoreSize(), Alignment: SmallestAlign); |
1810 | auto &MF = DAG.getMachineFunction(); |
1811 | auto FrameIndex = cast<FrameIndexSDNode>(Val: StackPtr.getNode())->getIndex(); |
1812 | auto PtrInfo = MachinePointerInfo::getFixedStack(MF, FI: FrameIndex); |
1813 | |
1814 | SDValue Store = DAG.getStore(Chain: DAG.getEntryNode(), dl, Val: Vec, Ptr: StackPtr, PtrInfo, |
1815 | Alignment: SmallestAlign); |
1816 | |
1817 | // Store the new element. This may be larger than the vector element type, |
1818 | // so use a truncating store. |
1819 | SDValue EltPtr = TLI.getVectorElementPointer(DAG, VecPtr: StackPtr, VecVT, Index: Idx); |
1820 | Store = DAG.getTruncStore( |
1821 | Chain: Store, dl, Val: Elt, Ptr: EltPtr, PtrInfo: MachinePointerInfo::getUnknownStack(MF), SVT: EltVT, |
1822 | Alignment: commonAlignment(A: SmallestAlign, |
1823 | Offset: EltVT.getFixedSizeInBits() / 8)); |
1824 | |
1825 | EVT LoVT, HiVT; |
1826 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: VecVT); |
1827 | |
1828 | // Load the Lo part from the stack slot. |
1829 | Lo = DAG.getLoad(VT: LoVT, dl, Chain: Store, Ptr: StackPtr, PtrInfo, Alignment: SmallestAlign); |
1830 | |
1831 | // Increment the pointer to the other part. |
1832 | auto Load = cast<LoadSDNode>(Val&: Lo); |
1833 | MachinePointerInfo MPI = Load->getPointerInfo(); |
1834 | IncrementPointer(N: Load, MemVT: LoVT, MPI, Ptr&: StackPtr); |
1835 | |
1836 | Hi = DAG.getLoad(VT: HiVT, dl, Chain: Store, Ptr: StackPtr, PtrInfo: MPI, Alignment: SmallestAlign); |
1837 | |
1838 | // If we adjusted the original type, we need to truncate the results. |
1839 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
1840 | if (LoVT != Lo.getValueType()) |
1841 | Lo = DAG.getNode(Opcode: ISD::TRUNCATE, DL: dl, VT: LoVT, Operand: Lo); |
1842 | if (HiVT != Hi.getValueType()) |
1843 | Hi = DAG.getNode(Opcode: ISD::TRUNCATE, DL: dl, VT: HiVT, Operand: Hi); |
1844 | } |
1845 | |
1846 | void DAGTypeLegalizer::SplitVecRes_STEP_VECTOR(SDNode *N, SDValue &Lo, |
1847 | SDValue &Hi) { |
1848 | EVT LoVT, HiVT; |
1849 | SDLoc dl(N); |
1850 | assert(N->getValueType(0).isScalableVector() && |
1851 | "Only scalable vectors are supported for STEP_VECTOR" ); |
1852 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
1853 | SDValue Step = N->getOperand(Num: 0); |
1854 | |
1855 | Lo = DAG.getNode(Opcode: ISD::STEP_VECTOR, DL: dl, VT: LoVT, Operand: Step); |
1856 | |
1857 | // Hi = Lo + (EltCnt * Step) |
1858 | EVT EltVT = Step.getValueType(); |
1859 | APInt StepVal = Step->getAsAPIntVal(); |
1860 | SDValue StartOfHi = |
1861 | DAG.getVScale(DL: dl, VT: EltVT, MulImm: StepVal * LoVT.getVectorMinNumElements()); |
1862 | StartOfHi = DAG.getSExtOrTrunc(Op: StartOfHi, DL: dl, VT: HiVT.getVectorElementType()); |
1863 | StartOfHi = DAG.getNode(Opcode: ISD::SPLAT_VECTOR, DL: dl, VT: HiVT, Operand: StartOfHi); |
1864 | |
1865 | Hi = DAG.getNode(Opcode: ISD::STEP_VECTOR, DL: dl, VT: HiVT, Operand: Step); |
1866 | Hi = DAG.getNode(Opcode: ISD::ADD, DL: dl, VT: HiVT, N1: Hi, N2: StartOfHi); |
1867 | } |
1868 | |
1869 | void DAGTypeLegalizer::SplitVecRes_ScalarOp(SDNode *N, SDValue &Lo, |
1870 | SDValue &Hi) { |
1871 | EVT LoVT, HiVT; |
1872 | SDLoc dl(N); |
1873 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
1874 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: LoVT, Operand: N->getOperand(Num: 0)); |
1875 | if (N->getOpcode() == ISD::SCALAR_TO_VECTOR) { |
1876 | Hi = DAG.getUNDEF(VT: HiVT); |
1877 | } else { |
1878 | assert(N->getOpcode() == ISD::SPLAT_VECTOR && "Unexpected opcode" ); |
1879 | Hi = Lo; |
1880 | } |
1881 | } |
1882 | |
1883 | void DAGTypeLegalizer::SplitVecRes_LOAD(LoadSDNode *LD, SDValue &Lo, |
1884 | SDValue &Hi) { |
1885 | assert(ISD::isUNINDEXEDLoad(LD) && "Indexed load during type legalization!" ); |
1886 | EVT LoVT, HiVT; |
1887 | SDLoc dl(LD); |
1888 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: LD->getValueType(ResNo: 0)); |
1889 | |
1890 | ISD::LoadExtType ExtType = LD->getExtensionType(); |
1891 | SDValue Ch = LD->getChain(); |
1892 | SDValue Ptr = LD->getBasePtr(); |
1893 | SDValue Offset = DAG.getUNDEF(VT: Ptr.getValueType()); |
1894 | EVT MemoryVT = LD->getMemoryVT(); |
1895 | MachineMemOperand::Flags MMOFlags = LD->getMemOperand()->getFlags(); |
1896 | AAMDNodes AAInfo = LD->getAAInfo(); |
1897 | |
1898 | EVT LoMemVT, HiMemVT; |
1899 | std::tie(args&: LoMemVT, args&: HiMemVT) = DAG.GetSplitDestVTs(VT: MemoryVT); |
1900 | |
1901 | if (!LoMemVT.isByteSized() || !HiMemVT.isByteSized()) { |
1902 | SDValue Value, NewChain; |
1903 | std::tie(args&: Value, args&: NewChain) = TLI.scalarizeVectorLoad(LD, DAG); |
1904 | std::tie(args&: Lo, args&: Hi) = DAG.SplitVector(N: Value, DL: dl); |
1905 | ReplaceValueWith(From: SDValue(LD, 1), To: NewChain); |
1906 | return; |
1907 | } |
1908 | |
1909 | Lo = DAG.getLoad(AM: ISD::UNINDEXED, ExtType, VT: LoVT, dl, Chain: Ch, Ptr, Offset, |
1910 | PtrInfo: LD->getPointerInfo(), MemVT: LoMemVT, Alignment: LD->getOriginalAlign(), |
1911 | MMOFlags, AAInfo); |
1912 | |
1913 | MachinePointerInfo MPI; |
1914 | IncrementPointer(N: LD, MemVT: LoMemVT, MPI, Ptr); |
1915 | |
1916 | Hi = DAG.getLoad(AM: ISD::UNINDEXED, ExtType, VT: HiVT, dl, Chain: Ch, Ptr, Offset, PtrInfo: MPI, |
1917 | MemVT: HiMemVT, Alignment: LD->getOriginalAlign(), MMOFlags, AAInfo); |
1918 | |
1919 | // Build a factor node to remember that this load is independent of the |
1920 | // other one. |
1921 | Ch = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo.getValue(R: 1), |
1922 | Hi.getValue(R: 1)); |
1923 | |
1924 | // Legalize the chain result - switch anything that used the old chain to |
1925 | // use the new one. |
1926 | ReplaceValueWith(From: SDValue(LD, 1), To: Ch); |
1927 | } |
1928 | |
1929 | void DAGTypeLegalizer::SplitVecRes_VP_LOAD(VPLoadSDNode *LD, SDValue &Lo, |
1930 | SDValue &Hi) { |
1931 | assert(LD->isUnindexed() && "Indexed VP load during type legalization!" ); |
1932 | EVT LoVT, HiVT; |
1933 | SDLoc dl(LD); |
1934 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: LD->getValueType(ResNo: 0)); |
1935 | |
1936 | ISD::LoadExtType ExtType = LD->getExtensionType(); |
1937 | SDValue Ch = LD->getChain(); |
1938 | SDValue Ptr = LD->getBasePtr(); |
1939 | SDValue Offset = LD->getOffset(); |
1940 | assert(Offset.isUndef() && "Unexpected indexed variable-length load offset" ); |
1941 | Align Alignment = LD->getOriginalAlign(); |
1942 | SDValue Mask = LD->getMask(); |
1943 | SDValue EVL = LD->getVectorLength(); |
1944 | EVT MemoryVT = LD->getMemoryVT(); |
1945 | |
1946 | EVT LoMemVT, HiMemVT; |
1947 | bool HiIsEmpty = false; |
1948 | std::tie(args&: LoMemVT, args&: HiMemVT) = |
1949 | DAG.GetDependentSplitDestVTs(VT: MemoryVT, EnvVT: LoVT, HiIsEmpty: &HiIsEmpty); |
1950 | |
1951 | // Split Mask operand |
1952 | SDValue MaskLo, MaskHi; |
1953 | if (Mask.getOpcode() == ISD::SETCC) { |
1954 | SplitVecRes_SETCC(N: Mask.getNode(), Lo&: MaskLo, Hi&: MaskHi); |
1955 | } else { |
1956 | if (getTypeAction(VT: Mask.getValueType()) == TargetLowering::TypeSplitVector) |
1957 | GetSplitVector(Op: Mask, Lo&: MaskLo, Hi&: MaskHi); |
1958 | else |
1959 | std::tie(args&: MaskLo, args&: MaskHi) = DAG.SplitVector(N: Mask, DL: dl); |
1960 | } |
1961 | |
1962 | // Split EVL operand |
1963 | SDValue EVLLo, EVLHi; |
1964 | std::tie(args&: EVLLo, args&: EVLHi) = DAG.SplitEVL(N: EVL, VecVT: LD->getValueType(ResNo: 0), DL: dl); |
1965 | |
1966 | MachineMemOperand *MMO = DAG.getMachineFunction().getMachineMemOperand( |
1967 | PtrInfo: LD->getPointerInfo(), f: MachineMemOperand::MOLoad, |
1968 | s: MemoryLocation::UnknownSize, base_alignment: Alignment, AAInfo: LD->getAAInfo(), Ranges: LD->getRanges()); |
1969 | |
1970 | Lo = |
1971 | DAG.getLoadVP(AM: LD->getAddressingMode(), ExtType, VT: LoVT, dl, Chain: Ch, Ptr, Offset, |
1972 | Mask: MaskLo, EVL: EVLLo, MemVT: LoMemVT, MMO, IsExpanding: LD->isExpandingLoad()); |
1973 | |
1974 | if (HiIsEmpty) { |
1975 | // The hi vp_load has zero storage size. We therefore simply set it to |
1976 | // the low vp_load and rely on subsequent removal from the chain. |
1977 | Hi = Lo; |
1978 | } else { |
1979 | // Generate hi vp_load. |
1980 | Ptr = TLI.IncrementMemoryAddress(Addr: Ptr, Mask: MaskLo, DL: dl, DataVT: LoMemVT, DAG, |
1981 | IsCompressedMemory: LD->isExpandingLoad()); |
1982 | |
1983 | MachinePointerInfo MPI; |
1984 | if (LoMemVT.isScalableVector()) |
1985 | MPI = MachinePointerInfo(LD->getPointerInfo().getAddrSpace()); |
1986 | else |
1987 | MPI = LD->getPointerInfo().getWithOffset( |
1988 | O: LoMemVT.getStoreSize().getFixedValue()); |
1989 | |
1990 | MMO = DAG.getMachineFunction().getMachineMemOperand( |
1991 | PtrInfo: MPI, f: MachineMemOperand::MOLoad, s: MemoryLocation::UnknownSize, base_alignment: Alignment, |
1992 | AAInfo: LD->getAAInfo(), Ranges: LD->getRanges()); |
1993 | |
1994 | Hi = DAG.getLoadVP(AM: LD->getAddressingMode(), ExtType, VT: HiVT, dl, Chain: Ch, Ptr, |
1995 | Offset, Mask: MaskHi, EVL: EVLHi, MemVT: HiMemVT, MMO, |
1996 | IsExpanding: LD->isExpandingLoad()); |
1997 | } |
1998 | |
1999 | // Build a factor node to remember that this load is independent of the |
2000 | // other one. |
2001 | Ch = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo.getValue(R: 1), |
2002 | Hi.getValue(R: 1)); |
2003 | |
2004 | // Legalize the chain result - switch anything that used the old chain to |
2005 | // use the new one. |
2006 | ReplaceValueWith(From: SDValue(LD, 1), To: Ch); |
2007 | } |
2008 | |
2009 | void DAGTypeLegalizer::SplitVecRes_VP_STRIDED_LOAD(VPStridedLoadSDNode *SLD, |
2010 | SDValue &Lo, SDValue &Hi) { |
2011 | assert(SLD->isUnindexed() && |
2012 | "Indexed VP strided load during type legalization!" ); |
2013 | assert(SLD->getOffset().isUndef() && |
2014 | "Unexpected indexed variable-length load offset" ); |
2015 | |
2016 | SDLoc DL(SLD); |
2017 | |
2018 | EVT LoVT, HiVT; |
2019 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: SLD->getValueType(ResNo: 0)); |
2020 | |
2021 | EVT LoMemVT, HiMemVT; |
2022 | bool HiIsEmpty = false; |
2023 | std::tie(args&: LoMemVT, args&: HiMemVT) = |
2024 | DAG.GetDependentSplitDestVTs(VT: SLD->getMemoryVT(), EnvVT: LoVT, HiIsEmpty: &HiIsEmpty); |
2025 | |
2026 | SDValue Mask = SLD->getMask(); |
2027 | SDValue LoMask, HiMask; |
2028 | if (Mask.getOpcode() == ISD::SETCC) { |
2029 | SplitVecRes_SETCC(N: Mask.getNode(), Lo&: LoMask, Hi&: HiMask); |
2030 | } else { |
2031 | if (getTypeAction(VT: Mask.getValueType()) == TargetLowering::TypeSplitVector) |
2032 | GetSplitVector(Op: Mask, Lo&: LoMask, Hi&: HiMask); |
2033 | else |
2034 | std::tie(args&: LoMask, args&: HiMask) = DAG.SplitVector(N: Mask, DL); |
2035 | } |
2036 | |
2037 | SDValue LoEVL, HiEVL; |
2038 | std::tie(args&: LoEVL, args&: HiEVL) = |
2039 | DAG.SplitEVL(N: SLD->getVectorLength(), VecVT: SLD->getValueType(ResNo: 0), DL); |
2040 | |
2041 | // Generate the low vp_strided_load |
2042 | Lo = DAG.getStridedLoadVP( |
2043 | AM: SLD->getAddressingMode(), ExtType: SLD->getExtensionType(), VT: LoVT, DL, |
2044 | Chain: SLD->getChain(), Ptr: SLD->getBasePtr(), Offset: SLD->getOffset(), Stride: SLD->getStride(), |
2045 | Mask: LoMask, EVL: LoEVL, MemVT: LoMemVT, MMO: SLD->getMemOperand(), IsExpanding: SLD->isExpandingLoad()); |
2046 | |
2047 | if (HiIsEmpty) { |
2048 | // The high vp_strided_load has zero storage size. We therefore simply set |
2049 | // it to the low vp_strided_load and rely on subsequent removal from the |
2050 | // chain. |
2051 | Hi = Lo; |
2052 | } else { |
2053 | // Generate the high vp_strided_load. |
2054 | // To calculate the high base address, we need to sum to the low base |
2055 | // address stride number of bytes for each element already loaded by low, |
2056 | // that is: Ptr = Ptr + (LoEVL * Stride) |
2057 | EVT PtrVT = SLD->getBasePtr().getValueType(); |
2058 | SDValue Increment = |
2059 | DAG.getNode(Opcode: ISD::MUL, DL, VT: PtrVT, N1: LoEVL, |
2060 | N2: DAG.getSExtOrTrunc(Op: SLD->getStride(), DL, VT: PtrVT)); |
2061 | SDValue Ptr = |
2062 | DAG.getNode(Opcode: ISD::ADD, DL, VT: PtrVT, N1: SLD->getBasePtr(), N2: Increment); |
2063 | |
2064 | Align Alignment = SLD->getOriginalAlign(); |
2065 | if (LoMemVT.isScalableVector()) |
2066 | Alignment = commonAlignment( |
2067 | A: Alignment, Offset: LoMemVT.getSizeInBits().getKnownMinValue() / 8); |
2068 | |
2069 | MachineMemOperand *MMO = DAG.getMachineFunction().getMachineMemOperand( |
2070 | PtrInfo: MachinePointerInfo(SLD->getPointerInfo().getAddrSpace()), |
2071 | f: MachineMemOperand::MOLoad, s: MemoryLocation::UnknownSize, base_alignment: Alignment, |
2072 | AAInfo: SLD->getAAInfo(), Ranges: SLD->getRanges()); |
2073 | |
2074 | Hi = DAG.getStridedLoadVP(AM: SLD->getAddressingMode(), ExtType: SLD->getExtensionType(), |
2075 | VT: HiVT, DL, Chain: SLD->getChain(), Ptr, Offset: SLD->getOffset(), |
2076 | Stride: SLD->getStride(), Mask: HiMask, EVL: HiEVL, MemVT: HiMemVT, MMO, |
2077 | IsExpanding: SLD->isExpandingLoad()); |
2078 | } |
2079 | |
2080 | // Build a factor node to remember that this load is independent of the |
2081 | // other one. |
2082 | SDValue Ch = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, Lo.getValue(R: 1), |
2083 | Hi.getValue(R: 1)); |
2084 | |
2085 | // Legalize the chain result - switch anything that used the old chain to |
2086 | // use the new one. |
2087 | ReplaceValueWith(From: SDValue(SLD, 1), To: Ch); |
2088 | } |
2089 | |
2090 | void DAGTypeLegalizer::SplitVecRes_MLOAD(MaskedLoadSDNode *MLD, |
2091 | SDValue &Lo, SDValue &Hi) { |
2092 | assert(MLD->isUnindexed() && "Indexed masked load during type legalization!" ); |
2093 | EVT LoVT, HiVT; |
2094 | SDLoc dl(MLD); |
2095 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: MLD->getValueType(ResNo: 0)); |
2096 | |
2097 | SDValue Ch = MLD->getChain(); |
2098 | SDValue Ptr = MLD->getBasePtr(); |
2099 | SDValue Offset = MLD->getOffset(); |
2100 | assert(Offset.isUndef() && "Unexpected indexed masked load offset" ); |
2101 | SDValue Mask = MLD->getMask(); |
2102 | SDValue PassThru = MLD->getPassThru(); |
2103 | Align Alignment = MLD->getOriginalAlign(); |
2104 | ISD::LoadExtType ExtType = MLD->getExtensionType(); |
2105 | |
2106 | // Split Mask operand |
2107 | SDValue MaskLo, MaskHi; |
2108 | if (Mask.getOpcode() == ISD::SETCC) { |
2109 | SplitVecRes_SETCC(N: Mask.getNode(), Lo&: MaskLo, Hi&: MaskHi); |
2110 | } else { |
2111 | if (getTypeAction(VT: Mask.getValueType()) == TargetLowering::TypeSplitVector) |
2112 | GetSplitVector(Op: Mask, Lo&: MaskLo, Hi&: MaskHi); |
2113 | else |
2114 | std::tie(args&: MaskLo, args&: MaskHi) = DAG.SplitVector(N: Mask, DL: dl); |
2115 | } |
2116 | |
2117 | EVT MemoryVT = MLD->getMemoryVT(); |
2118 | EVT LoMemVT, HiMemVT; |
2119 | bool HiIsEmpty = false; |
2120 | std::tie(args&: LoMemVT, args&: HiMemVT) = |
2121 | DAG.GetDependentSplitDestVTs(VT: MemoryVT, EnvVT: LoVT, HiIsEmpty: &HiIsEmpty); |
2122 | |
2123 | SDValue PassThruLo, PassThruHi; |
2124 | if (getTypeAction(VT: PassThru.getValueType()) == TargetLowering::TypeSplitVector) |
2125 | GetSplitVector(Op: PassThru, Lo&: PassThruLo, Hi&: PassThruHi); |
2126 | else |
2127 | std::tie(args&: PassThruLo, args&: PassThruHi) = DAG.SplitVector(N: PassThru, DL: dl); |
2128 | |
2129 | MachineMemOperand *MMO = DAG.getMachineFunction().getMachineMemOperand( |
2130 | PtrInfo: MLD->getPointerInfo(), f: MachineMemOperand::MOLoad, |
2131 | s: MemoryLocation::UnknownSize, base_alignment: Alignment, AAInfo: MLD->getAAInfo(), |
2132 | Ranges: MLD->getRanges()); |
2133 | |
2134 | Lo = DAG.getMaskedLoad(VT: LoVT, dl, Chain: Ch, Base: Ptr, Offset, Mask: MaskLo, Src0: PassThruLo, MemVT: LoMemVT, |
2135 | MMO, AM: MLD->getAddressingMode(), ExtType, |
2136 | IsExpanding: MLD->isExpandingLoad()); |
2137 | |
2138 | if (HiIsEmpty) { |
2139 | // The hi masked load has zero storage size. We therefore simply set it to |
2140 | // the low masked load and rely on subsequent removal from the chain. |
2141 | Hi = Lo; |
2142 | } else { |
2143 | // Generate hi masked load. |
2144 | Ptr = TLI.IncrementMemoryAddress(Addr: Ptr, Mask: MaskLo, DL: dl, DataVT: LoMemVT, DAG, |
2145 | IsCompressedMemory: MLD->isExpandingLoad()); |
2146 | |
2147 | MachinePointerInfo MPI; |
2148 | if (LoMemVT.isScalableVector()) |
2149 | MPI = MachinePointerInfo(MLD->getPointerInfo().getAddrSpace()); |
2150 | else |
2151 | MPI = MLD->getPointerInfo().getWithOffset( |
2152 | O: LoMemVT.getStoreSize().getFixedValue()); |
2153 | |
2154 | MMO = DAG.getMachineFunction().getMachineMemOperand( |
2155 | PtrInfo: MPI, f: MachineMemOperand::MOLoad, s: MemoryLocation::UnknownSize, base_alignment: Alignment, |
2156 | AAInfo: MLD->getAAInfo(), Ranges: MLD->getRanges()); |
2157 | |
2158 | Hi = DAG.getMaskedLoad(VT: HiVT, dl, Chain: Ch, Base: Ptr, Offset, Mask: MaskHi, Src0: PassThruHi, |
2159 | MemVT: HiMemVT, MMO, AM: MLD->getAddressingMode(), ExtType, |
2160 | IsExpanding: MLD->isExpandingLoad()); |
2161 | } |
2162 | |
2163 | // Build a factor node to remember that this load is independent of the |
2164 | // other one. |
2165 | Ch = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo.getValue(R: 1), |
2166 | Hi.getValue(R: 1)); |
2167 | |
2168 | // Legalize the chain result - switch anything that used the old chain to |
2169 | // use the new one. |
2170 | ReplaceValueWith(From: SDValue(MLD, 1), To: Ch); |
2171 | |
2172 | } |
2173 | |
2174 | void DAGTypeLegalizer::SplitVecRes_Gather(MemSDNode *N, SDValue &Lo, |
2175 | SDValue &Hi, bool SplitSETCC) { |
2176 | EVT LoVT, HiVT; |
2177 | SDLoc dl(N); |
2178 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
2179 | |
2180 | SDValue Ch = N->getChain(); |
2181 | SDValue Ptr = N->getBasePtr(); |
2182 | struct Operands { |
2183 | SDValue Mask; |
2184 | SDValue Index; |
2185 | SDValue Scale; |
2186 | } Ops = [&]() -> Operands { |
2187 | if (auto *MSC = dyn_cast<MaskedGatherSDNode>(Val: N)) { |
2188 | return {.Mask: MSC->getMask(), .Index: MSC->getIndex(), .Scale: MSC->getScale()}; |
2189 | } |
2190 | auto *VPSC = cast<VPGatherSDNode>(Val: N); |
2191 | return {.Mask: VPSC->getMask(), .Index: VPSC->getIndex(), .Scale: VPSC->getScale()}; |
2192 | }(); |
2193 | |
2194 | EVT MemoryVT = N->getMemoryVT(); |
2195 | Align Alignment = N->getOriginalAlign(); |
2196 | |
2197 | // Split Mask operand |
2198 | SDValue MaskLo, MaskHi; |
2199 | if (SplitSETCC && Ops.Mask.getOpcode() == ISD::SETCC) { |
2200 | SplitVecRes_SETCC(N: Ops.Mask.getNode(), Lo&: MaskLo, Hi&: MaskHi); |
2201 | } else { |
2202 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: Ops.Mask, DL: dl); |
2203 | } |
2204 | |
2205 | EVT LoMemVT, HiMemVT; |
2206 | // Split MemoryVT |
2207 | std::tie(args&: LoMemVT, args&: HiMemVT) = DAG.GetSplitDestVTs(VT: MemoryVT); |
2208 | |
2209 | SDValue IndexHi, IndexLo; |
2210 | if (getTypeAction(VT: Ops.Index.getValueType()) == |
2211 | TargetLowering::TypeSplitVector) |
2212 | GetSplitVector(Op: Ops.Index, Lo&: IndexLo, Hi&: IndexHi); |
2213 | else |
2214 | std::tie(args&: IndexLo, args&: IndexHi) = DAG.SplitVector(N: Ops.Index, DL: dl); |
2215 | |
2216 | MachineMemOperand *MMO = DAG.getMachineFunction().getMachineMemOperand( |
2217 | PtrInfo: N->getPointerInfo(), f: MachineMemOperand::MOLoad, |
2218 | s: MemoryLocation::UnknownSize, base_alignment: Alignment, AAInfo: N->getAAInfo(), Ranges: N->getRanges()); |
2219 | |
2220 | if (auto *MGT = dyn_cast<MaskedGatherSDNode>(Val: N)) { |
2221 | SDValue PassThru = MGT->getPassThru(); |
2222 | SDValue PassThruLo, PassThruHi; |
2223 | if (getTypeAction(VT: PassThru.getValueType()) == |
2224 | TargetLowering::TypeSplitVector) |
2225 | GetSplitVector(Op: PassThru, Lo&: PassThruLo, Hi&: PassThruHi); |
2226 | else |
2227 | std::tie(args&: PassThruLo, args&: PassThruHi) = DAG.SplitVector(N: PassThru, DL: dl); |
2228 | |
2229 | ISD::LoadExtType ExtType = MGT->getExtensionType(); |
2230 | ISD::MemIndexType IndexTy = MGT->getIndexType(); |
2231 | |
2232 | SDValue OpsLo[] = {Ch, PassThruLo, MaskLo, Ptr, IndexLo, Ops.Scale}; |
2233 | Lo = DAG.getMaskedGather(VTs: DAG.getVTList(LoVT, MVT::Other), MemVT: LoMemVT, dl, |
2234 | Ops: OpsLo, MMO, IndexType: IndexTy, ExtTy: ExtType); |
2235 | |
2236 | SDValue OpsHi[] = {Ch, PassThruHi, MaskHi, Ptr, IndexHi, Ops.Scale}; |
2237 | Hi = DAG.getMaskedGather(VTs: DAG.getVTList(HiVT, MVT::Other), MemVT: HiMemVT, dl, |
2238 | Ops: OpsHi, MMO, IndexType: IndexTy, ExtTy: ExtType); |
2239 | } else { |
2240 | auto *VPGT = cast<VPGatherSDNode>(Val: N); |
2241 | SDValue EVLLo, EVLHi; |
2242 | std::tie(args&: EVLLo, args&: EVLHi) = |
2243 | DAG.SplitEVL(N: VPGT->getVectorLength(), VecVT: MemoryVT, DL: dl); |
2244 | |
2245 | SDValue OpsLo[] = {Ch, Ptr, IndexLo, Ops.Scale, MaskLo, EVLLo}; |
2246 | Lo = DAG.getGatherVP(VTs: DAG.getVTList(LoVT, MVT::Other), VT: LoMemVT, dl, Ops: OpsLo, |
2247 | MMO, IndexType: VPGT->getIndexType()); |
2248 | |
2249 | SDValue OpsHi[] = {Ch, Ptr, IndexHi, Ops.Scale, MaskHi, EVLHi}; |
2250 | Hi = DAG.getGatherVP(VTs: DAG.getVTList(HiVT, MVT::Other), VT: HiMemVT, dl, Ops: OpsHi, |
2251 | MMO, IndexType: VPGT->getIndexType()); |
2252 | } |
2253 | |
2254 | // Build a factor node to remember that this load is independent of the |
2255 | // other one. |
2256 | Ch = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo.getValue(R: 1), |
2257 | Hi.getValue(R: 1)); |
2258 | |
2259 | // Legalize the chain result - switch anything that used the old chain to |
2260 | // use the new one. |
2261 | ReplaceValueWith(From: SDValue(N, 1), To: Ch); |
2262 | } |
2263 | |
2264 | void DAGTypeLegalizer::SplitVecRes_SETCC(SDNode *N, SDValue &Lo, SDValue &Hi) { |
2265 | assert(N->getValueType(0).isVector() && |
2266 | N->getOperand(0).getValueType().isVector() && |
2267 | "Operand types must be vectors" ); |
2268 | |
2269 | EVT LoVT, HiVT; |
2270 | SDLoc DL(N); |
2271 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
2272 | |
2273 | // If the input also splits, handle it directly. Otherwise split it by hand. |
2274 | SDValue LL, LH, RL, RH; |
2275 | if (getTypeAction(VT: N->getOperand(Num: 0).getValueType()) == |
2276 | TargetLowering::TypeSplitVector) |
2277 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: LL, Hi&: LH); |
2278 | else |
2279 | std::tie(args&: LL, args&: LH) = DAG.SplitVectorOperand(N, OpNo: 0); |
2280 | |
2281 | if (getTypeAction(VT: N->getOperand(Num: 1).getValueType()) == |
2282 | TargetLowering::TypeSplitVector) |
2283 | GetSplitVector(Op: N->getOperand(Num: 1), Lo&: RL, Hi&: RH); |
2284 | else |
2285 | std::tie(args&: RL, args&: RH) = DAG.SplitVectorOperand(N, OpNo: 1); |
2286 | |
2287 | if (N->getOpcode() == ISD::SETCC) { |
2288 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL, VT: LoVT, N1: LL, N2: RL, N3: N->getOperand(Num: 2)); |
2289 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL, VT: HiVT, N1: LH, N2: RH, N3: N->getOperand(Num: 2)); |
2290 | } else { |
2291 | assert(N->getOpcode() == ISD::VP_SETCC && "Expected VP_SETCC opcode" ); |
2292 | SDValue MaskLo, MaskHi, EVLLo, EVLHi; |
2293 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: N->getOperand(Num: 3)); |
2294 | std::tie(args&: EVLLo, args&: EVLHi) = |
2295 | DAG.SplitEVL(N: N->getOperand(Num: 4), VecVT: N->getValueType(ResNo: 0), DL); |
2296 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL, VT: LoVT, N1: LL, N2: RL, N3: N->getOperand(Num: 2), N4: MaskLo, |
2297 | N5: EVLLo); |
2298 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL, VT: HiVT, N1: LH, N2: RH, N3: N->getOperand(Num: 2), N4: MaskHi, |
2299 | N5: EVLHi); |
2300 | } |
2301 | } |
2302 | |
2303 | void DAGTypeLegalizer::SplitVecRes_UnaryOp(SDNode *N, SDValue &Lo, |
2304 | SDValue &Hi) { |
2305 | // Get the dest types - they may not match the input types, e.g. int_to_fp. |
2306 | EVT LoVT, HiVT; |
2307 | SDLoc dl(N); |
2308 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
2309 | |
2310 | // If the input also splits, handle it directly for a compile time speedup. |
2311 | // Otherwise split it by hand. |
2312 | EVT InVT = N->getOperand(Num: 0).getValueType(); |
2313 | if (getTypeAction(VT: InVT) == TargetLowering::TypeSplitVector) |
2314 | GetSplitVector(Op: N->getOperand(Num: 0), Lo, Hi); |
2315 | else |
2316 | std::tie(args&: Lo, args&: Hi) = DAG.SplitVectorOperand(N, OpNo: 0); |
2317 | |
2318 | const SDNodeFlags Flags = N->getFlags(); |
2319 | unsigned Opcode = N->getOpcode(); |
2320 | if (N->getNumOperands() <= 2) { |
2321 | if (Opcode == ISD::FP_ROUND) { |
2322 | Lo = DAG.getNode(Opcode, DL: dl, VT: LoVT, N1: Lo, N2: N->getOperand(Num: 1), Flags); |
2323 | Hi = DAG.getNode(Opcode, DL: dl, VT: HiVT, N1: Hi, N2: N->getOperand(Num: 1), Flags); |
2324 | } else { |
2325 | Lo = DAG.getNode(Opcode, DL: dl, VT: LoVT, Operand: Lo, Flags); |
2326 | Hi = DAG.getNode(Opcode, DL: dl, VT: HiVT, Operand: Hi, Flags); |
2327 | } |
2328 | return; |
2329 | } |
2330 | |
2331 | assert(N->getNumOperands() == 3 && "Unexpected number of operands!" ); |
2332 | assert(N->isVPOpcode() && "Expected VP opcode" ); |
2333 | |
2334 | SDValue MaskLo, MaskHi; |
2335 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: N->getOperand(Num: 1)); |
2336 | |
2337 | SDValue EVLLo, EVLHi; |
2338 | std::tie(args&: EVLLo, args&: EVLHi) = |
2339 | DAG.SplitEVL(N: N->getOperand(Num: 2), VecVT: N->getValueType(ResNo: 0), DL: dl); |
2340 | |
2341 | Lo = DAG.getNode(Opcode, DL: dl, VT: LoVT, Ops: {Lo, MaskLo, EVLLo}, Flags); |
2342 | Hi = DAG.getNode(Opcode, DL: dl, VT: HiVT, Ops: {Hi, MaskHi, EVLHi}, Flags); |
2343 | } |
2344 | |
2345 | void DAGTypeLegalizer::SplitVecRes_FFREXP(SDNode *N, unsigned ResNo, |
2346 | SDValue &Lo, SDValue &Hi) { |
2347 | SDLoc dl(N); |
2348 | auto [LoVT, HiVT] = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
2349 | auto [LoVT1, HiVT1] = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 1)); |
2350 | |
2351 | // If the input also splits, handle it directly for a compile time speedup. |
2352 | // Otherwise split it by hand. |
2353 | EVT InVT = N->getOperand(Num: 0).getValueType(); |
2354 | if (getTypeAction(VT: InVT) == TargetLowering::TypeSplitVector) |
2355 | GetSplitVector(Op: N->getOperand(Num: 0), Lo, Hi); |
2356 | else |
2357 | std::tie(args&: Lo, args&: Hi) = DAG.SplitVectorOperand(N, OpNo: 0); |
2358 | |
2359 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL: dl, ResultTys: {LoVT, LoVT1}, Ops: Lo); |
2360 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL: dl, ResultTys: {HiVT, HiVT1}, Ops: Hi); |
2361 | Lo->setFlags(N->getFlags()); |
2362 | Hi->setFlags(N->getFlags()); |
2363 | |
2364 | SDNode *HiNode = Hi.getNode(); |
2365 | SDNode *LoNode = Lo.getNode(); |
2366 | |
2367 | // Replace the other vector result not being explicitly split here. |
2368 | unsigned OtherNo = 1 - ResNo; |
2369 | EVT OtherVT = N->getValueType(ResNo: OtherNo); |
2370 | if (getTypeAction(VT: OtherVT) == TargetLowering::TypeSplitVector) { |
2371 | SetSplitVector(Op: SDValue(N, OtherNo), Lo: SDValue(LoNode, OtherNo), |
2372 | Hi: SDValue(HiNode, OtherNo)); |
2373 | } else { |
2374 | SDValue OtherVal = |
2375 | DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: OtherVT, N1: SDValue(LoNode, OtherNo), |
2376 | N2: SDValue(HiNode, OtherNo)); |
2377 | ReplaceValueWith(From: SDValue(N, OtherNo), To: OtherVal); |
2378 | } |
2379 | } |
2380 | |
2381 | void DAGTypeLegalizer::SplitVecRes_ExtendOp(SDNode *N, SDValue &Lo, |
2382 | SDValue &Hi) { |
2383 | SDLoc dl(N); |
2384 | EVT SrcVT = N->getOperand(Num: 0).getValueType(); |
2385 | EVT DestVT = N->getValueType(ResNo: 0); |
2386 | EVT LoVT, HiVT; |
2387 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT: DestVT); |
2388 | |
2389 | // We can do better than a generic split operation if the extend is doing |
2390 | // more than just doubling the width of the elements and the following are |
2391 | // true: |
2392 | // - The number of vector elements is even, |
2393 | // - the source type is legal, |
2394 | // - the type of a split source is illegal, |
2395 | // - the type of an extended (by doubling element size) source is legal, and |
2396 | // - the type of that extended source when split is legal. |
2397 | // |
2398 | // This won't necessarily completely legalize the operation, but it will |
2399 | // more effectively move in the right direction and prevent falling down |
2400 | // to scalarization in many cases due to the input vector being split too |
2401 | // far. |
2402 | if (SrcVT.getVectorElementCount().isKnownEven() && |
2403 | SrcVT.getScalarSizeInBits() * 2 < DestVT.getScalarSizeInBits()) { |
2404 | LLVMContext &Ctx = *DAG.getContext(); |
2405 | EVT NewSrcVT = SrcVT.widenIntegerVectorElementType(Context&: Ctx); |
2406 | EVT SplitSrcVT = SrcVT.getHalfNumVectorElementsVT(Context&: Ctx); |
2407 | |
2408 | EVT SplitLoVT, SplitHiVT; |
2409 | std::tie(args&: SplitLoVT, args&: SplitHiVT) = DAG.GetSplitDestVTs(VT: NewSrcVT); |
2410 | if (TLI.isTypeLegal(VT: SrcVT) && !TLI.isTypeLegal(VT: SplitSrcVT) && |
2411 | TLI.isTypeLegal(VT: NewSrcVT) && TLI.isTypeLegal(VT: SplitLoVT)) { |
2412 | LLVM_DEBUG(dbgs() << "Split vector extend via incremental extend:" ; |
2413 | N->dump(&DAG); dbgs() << "\n" ); |
2414 | if (!N->isVPOpcode()) { |
2415 | // Extend the source vector by one step. |
2416 | SDValue NewSrc = |
2417 | DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: NewSrcVT, Operand: N->getOperand(Num: 0)); |
2418 | // Get the low and high halves of the new, extended one step, vector. |
2419 | std::tie(args&: Lo, args&: Hi) = DAG.SplitVector(N: NewSrc, DL: dl); |
2420 | // Extend those vector halves the rest of the way. |
2421 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: LoVT, Operand: Lo); |
2422 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: HiVT, Operand: Hi); |
2423 | return; |
2424 | } |
2425 | |
2426 | // Extend the source vector by one step. |
2427 | SDValue NewSrc = |
2428 | DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: NewSrcVT, N1: N->getOperand(Num: 0), |
2429 | N2: N->getOperand(Num: 1), N3: N->getOperand(Num: 2)); |
2430 | // Get the low and high halves of the new, extended one step, vector. |
2431 | std::tie(args&: Lo, args&: Hi) = DAG.SplitVector(N: NewSrc, DL: dl); |
2432 | |
2433 | SDValue MaskLo, MaskHi; |
2434 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: N->getOperand(Num: 1)); |
2435 | |
2436 | SDValue EVLLo, EVLHi; |
2437 | std::tie(args&: EVLLo, args&: EVLHi) = |
2438 | DAG.SplitEVL(N: N->getOperand(Num: 2), VecVT: N->getValueType(ResNo: 0), DL: dl); |
2439 | // Extend those vector halves the rest of the way. |
2440 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: LoVT, Ops: {Lo, MaskLo, EVLLo}); |
2441 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: HiVT, Ops: {Hi, MaskHi, EVLHi}); |
2442 | return; |
2443 | } |
2444 | } |
2445 | // Fall back to the generic unary operator splitting otherwise. |
2446 | SplitVecRes_UnaryOp(N, Lo, Hi); |
2447 | } |
2448 | |
2449 | void DAGTypeLegalizer::SplitVecRes_VECTOR_SHUFFLE(ShuffleVectorSDNode *N, |
2450 | SDValue &Lo, SDValue &Hi) { |
2451 | // The low and high parts of the original input give four input vectors. |
2452 | SDValue Inputs[4]; |
2453 | SDLoc DL(N); |
2454 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: Inputs[0], Hi&: Inputs[1]); |
2455 | GetSplitVector(Op: N->getOperand(Num: 1), Lo&: Inputs[2], Hi&: Inputs[3]); |
2456 | EVT NewVT = Inputs[0].getValueType(); |
2457 | unsigned NewElts = NewVT.getVectorNumElements(); |
2458 | |
2459 | auto &&IsConstant = [](const SDValue &N) { |
2460 | APInt SplatValue; |
2461 | return N.getResNo() == 0 && |
2462 | (ISD::isConstantSplatVector(N: N.getNode(), SplatValue) || |
2463 | ISD::isBuildVectorOfConstantSDNodes(N: N.getNode())); |
2464 | }; |
2465 | auto &&BuildVector = [NewElts, &DAG = DAG, NewVT, &DL](SDValue &Input1, |
2466 | SDValue &Input2, |
2467 | ArrayRef<int> Mask) { |
2468 | assert(Input1->getOpcode() == ISD::BUILD_VECTOR && |
2469 | Input2->getOpcode() == ISD::BUILD_VECTOR && |
2470 | "Expected build vector node." ); |
2471 | EVT EltVT = NewVT.getVectorElementType(); |
2472 | SmallVector<SDValue> Ops(NewElts, DAG.getUNDEF(VT: EltVT)); |
2473 | for (unsigned I = 0; I < NewElts; ++I) { |
2474 | if (Mask[I] == PoisonMaskElem) |
2475 | continue; |
2476 | unsigned Idx = Mask[I]; |
2477 | if (Idx >= NewElts) |
2478 | Ops[I] = Input2.getOperand(i: Idx - NewElts); |
2479 | else |
2480 | Ops[I] = Input1.getOperand(i: Idx); |
2481 | // Make the type of all elements the same as the element type. |
2482 | if (Ops[I].getValueType().bitsGT(VT: EltVT)) |
2483 | Ops[I] = DAG.getNode(Opcode: ISD::TRUNCATE, DL, VT: EltVT, Operand: Ops[I]); |
2484 | } |
2485 | return DAG.getBuildVector(VT: NewVT, DL, Ops); |
2486 | }; |
2487 | |
2488 | // If Lo or Hi uses elements from at most two of the four input vectors, then |
2489 | // express it as a vector shuffle of those two inputs. Otherwise extract the |
2490 | // input elements by hand and construct the Lo/Hi output using a BUILD_VECTOR. |
2491 | SmallVector<int> OrigMask(N->getMask()); |
2492 | // Try to pack incoming shuffles/inputs. |
2493 | auto &&TryPeekThroughShufflesInputs = [&Inputs, &NewVT, this, NewElts, |
2494 | &DL](SmallVectorImpl<int> &Mask) { |
2495 | // Check if all inputs are shuffles of the same operands or non-shuffles. |
2496 | MapVector<std::pair<SDValue, SDValue>, SmallVector<unsigned>> ShufflesIdxs; |
2497 | for (unsigned Idx = 0; Idx < std::size(Inputs); ++Idx) { |
2498 | SDValue Input = Inputs[Idx]; |
2499 | auto *Shuffle = dyn_cast<ShuffleVectorSDNode>(Val: Input.getNode()); |
2500 | if (!Shuffle || |
2501 | Input.getOperand(i: 0).getValueType() != Input.getValueType()) |
2502 | continue; |
2503 | ShufflesIdxs[std::make_pair(x: Input.getOperand(i: 0), y: Input.getOperand(i: 1))] |
2504 | .push_back(Elt: Idx); |
2505 | ShufflesIdxs[std::make_pair(x: Input.getOperand(i: 1), y: Input.getOperand(i: 0))] |
2506 | .push_back(Elt: Idx); |
2507 | } |
2508 | for (auto &P : ShufflesIdxs) { |
2509 | if (P.second.size() < 2) |
2510 | continue; |
2511 | // Use shuffles operands instead of shuffles themselves. |
2512 | // 1. Adjust mask. |
2513 | for (int &Idx : Mask) { |
2514 | if (Idx == PoisonMaskElem) |
2515 | continue; |
2516 | unsigned SrcRegIdx = Idx / NewElts; |
2517 | if (Inputs[SrcRegIdx].isUndef()) { |
2518 | Idx = PoisonMaskElem; |
2519 | continue; |
2520 | } |
2521 | auto *Shuffle = |
2522 | dyn_cast<ShuffleVectorSDNode>(Val: Inputs[SrcRegIdx].getNode()); |
2523 | if (!Shuffle || !is_contained(Range&: P.second, Element: SrcRegIdx)) |
2524 | continue; |
2525 | int MaskElt = Shuffle->getMaskElt(Idx: Idx % NewElts); |
2526 | if (MaskElt == PoisonMaskElem) { |
2527 | Idx = PoisonMaskElem; |
2528 | continue; |
2529 | } |
2530 | Idx = MaskElt % NewElts + |
2531 | P.second[Shuffle->getOperand(Num: MaskElt / NewElts) == P.first.first |
2532 | ? 0 |
2533 | : 1] * |
2534 | NewElts; |
2535 | } |
2536 | // 2. Update inputs. |
2537 | Inputs[P.second[0]] = P.first.first; |
2538 | Inputs[P.second[1]] = P.first.second; |
2539 | // Clear the pair data. |
2540 | P.second.clear(); |
2541 | ShufflesIdxs[std::make_pair(x&: P.first.second, y&: P.first.first)].clear(); |
2542 | } |
2543 | // Check if any concat_vectors can be simplified. |
2544 | SmallBitVector UsedSubVector(2 * std::size(Inputs)); |
2545 | for (int &Idx : Mask) { |
2546 | if (Idx == PoisonMaskElem) |
2547 | continue; |
2548 | unsigned SrcRegIdx = Idx / NewElts; |
2549 | if (Inputs[SrcRegIdx].isUndef()) { |
2550 | Idx = PoisonMaskElem; |
2551 | continue; |
2552 | } |
2553 | TargetLowering::LegalizeTypeAction TypeAction = |
2554 | getTypeAction(VT: Inputs[SrcRegIdx].getValueType()); |
2555 | if (Inputs[SrcRegIdx].getOpcode() == ISD::CONCAT_VECTORS && |
2556 | Inputs[SrcRegIdx].getNumOperands() == 2 && |
2557 | !Inputs[SrcRegIdx].getOperand(i: 1).isUndef() && |
2558 | (TypeAction == TargetLowering::TypeLegal || |
2559 | TypeAction == TargetLowering::TypeWidenVector)) |
2560 | UsedSubVector.set(2 * SrcRegIdx + (Idx % NewElts) / (NewElts / 2)); |
2561 | } |
2562 | if (UsedSubVector.count() > 1) { |
2563 | SmallVector<SmallVector<std::pair<unsigned, int>, 2>> Pairs; |
2564 | for (unsigned I = 0; I < std::size(Inputs); ++I) { |
2565 | if (UsedSubVector.test(Idx: 2 * I) == UsedSubVector.test(Idx: 2 * I + 1)) |
2566 | continue; |
2567 | if (Pairs.empty() || Pairs.back().size() == 2) |
2568 | Pairs.emplace_back(); |
2569 | if (UsedSubVector.test(Idx: 2 * I)) { |
2570 | Pairs.back().emplace_back(Args&: I, Args: 0); |
2571 | } else { |
2572 | assert(UsedSubVector.test(2 * I + 1) && |
2573 | "Expected to be used one of the subvectors." ); |
2574 | Pairs.back().emplace_back(Args&: I, Args: 1); |
2575 | } |
2576 | } |
2577 | if (!Pairs.empty() && Pairs.front().size() > 1) { |
2578 | // Adjust mask. |
2579 | for (int &Idx : Mask) { |
2580 | if (Idx == PoisonMaskElem) |
2581 | continue; |
2582 | unsigned SrcRegIdx = Idx / NewElts; |
2583 | auto *It = find_if( |
2584 | Range&: Pairs, P: [SrcRegIdx](ArrayRef<std::pair<unsigned, int>> Idxs) { |
2585 | return Idxs.front().first == SrcRegIdx || |
2586 | Idxs.back().first == SrcRegIdx; |
2587 | }); |
2588 | if (It == Pairs.end()) |
2589 | continue; |
2590 | Idx = It->front().first * NewElts + (Idx % NewElts) % (NewElts / 2) + |
2591 | (SrcRegIdx == It->front().first ? 0 : (NewElts / 2)); |
2592 | } |
2593 | // Adjust inputs. |
2594 | for (ArrayRef<std::pair<unsigned, int>> Idxs : Pairs) { |
2595 | Inputs[Idxs.front().first] = DAG.getNode( |
2596 | Opcode: ISD::CONCAT_VECTORS, DL, |
2597 | VT: Inputs[Idxs.front().first].getValueType(), |
2598 | N1: Inputs[Idxs.front().first].getOperand(i: Idxs.front().second), |
2599 | N2: Inputs[Idxs.back().first].getOperand(i: Idxs.back().second)); |
2600 | } |
2601 | } |
2602 | } |
2603 | bool Changed; |
2604 | do { |
2605 | // Try to remove extra shuffles (except broadcasts) and shuffles with the |
2606 | // reused operands. |
2607 | Changed = false; |
2608 | for (unsigned I = 0; I < std::size(Inputs); ++I) { |
2609 | auto *Shuffle = dyn_cast<ShuffleVectorSDNode>(Val: Inputs[I].getNode()); |
2610 | if (!Shuffle) |
2611 | continue; |
2612 | if (Shuffle->getOperand(Num: 0).getValueType() != NewVT) |
2613 | continue; |
2614 | int Op = -1; |
2615 | if (!Inputs[I].hasOneUse() && Shuffle->getOperand(Num: 1).isUndef() && |
2616 | !Shuffle->isSplat()) { |
2617 | Op = 0; |
2618 | } else if (!Inputs[I].hasOneUse() && |
2619 | !Shuffle->getOperand(Num: 1).isUndef()) { |
2620 | // Find the only used operand, if possible. |
2621 | for (int &Idx : Mask) { |
2622 | if (Idx == PoisonMaskElem) |
2623 | continue; |
2624 | unsigned SrcRegIdx = Idx / NewElts; |
2625 | if (SrcRegIdx != I) |
2626 | continue; |
2627 | int MaskElt = Shuffle->getMaskElt(Idx: Idx % NewElts); |
2628 | if (MaskElt == PoisonMaskElem) { |
2629 | Idx = PoisonMaskElem; |
2630 | continue; |
2631 | } |
2632 | int OpIdx = MaskElt / NewElts; |
2633 | if (Op == -1) { |
2634 | Op = OpIdx; |
2635 | continue; |
2636 | } |
2637 | if (Op != OpIdx) { |
2638 | Op = -1; |
2639 | break; |
2640 | } |
2641 | } |
2642 | } |
2643 | if (Op < 0) { |
2644 | // Try to check if one of the shuffle operands is used already. |
2645 | for (int OpIdx = 0; OpIdx < 2; ++OpIdx) { |
2646 | if (Shuffle->getOperand(Num: OpIdx).isUndef()) |
2647 | continue; |
2648 | auto *It = find(Range&: Inputs, Val: Shuffle->getOperand(Num: OpIdx)); |
2649 | if (It == std::end(arr&: Inputs)) |
2650 | continue; |
2651 | int FoundOp = std::distance(first: std::begin(arr&: Inputs), last: It); |
2652 | // Found that operand is used already. |
2653 | // 1. Fix the mask for the reused operand. |
2654 | for (int &Idx : Mask) { |
2655 | if (Idx == PoisonMaskElem) |
2656 | continue; |
2657 | unsigned SrcRegIdx = Idx / NewElts; |
2658 | if (SrcRegIdx != I) |
2659 | continue; |
2660 | int MaskElt = Shuffle->getMaskElt(Idx: Idx % NewElts); |
2661 | if (MaskElt == PoisonMaskElem) { |
2662 | Idx = PoisonMaskElem; |
2663 | continue; |
2664 | } |
2665 | int MaskIdx = MaskElt / NewElts; |
2666 | if (OpIdx == MaskIdx) |
2667 | Idx = MaskElt % NewElts + FoundOp * NewElts; |
2668 | } |
2669 | // 2. Set Op to the unused OpIdx. |
2670 | Op = (OpIdx + 1) % 2; |
2671 | break; |
2672 | } |
2673 | } |
2674 | if (Op >= 0) { |
2675 | Changed = true; |
2676 | Inputs[I] = Shuffle->getOperand(Num: Op); |
2677 | // Adjust mask. |
2678 | for (int &Idx : Mask) { |
2679 | if (Idx == PoisonMaskElem) |
2680 | continue; |
2681 | unsigned SrcRegIdx = Idx / NewElts; |
2682 | if (SrcRegIdx != I) |
2683 | continue; |
2684 | int MaskElt = Shuffle->getMaskElt(Idx: Idx % NewElts); |
2685 | int OpIdx = MaskElt / NewElts; |
2686 | if (OpIdx != Op) |
2687 | continue; |
2688 | Idx = MaskElt % NewElts + SrcRegIdx * NewElts; |
2689 | } |
2690 | } |
2691 | } |
2692 | } while (Changed); |
2693 | }; |
2694 | TryPeekThroughShufflesInputs(OrigMask); |
2695 | // Proces unique inputs. |
2696 | auto &&MakeUniqueInputs = [&Inputs, &IsConstant, |
2697 | NewElts](SmallVectorImpl<int> &Mask) { |
2698 | SetVector<SDValue> UniqueInputs; |
2699 | SetVector<SDValue> UniqueConstantInputs; |
2700 | for (const auto &I : Inputs) { |
2701 | if (IsConstant(I)) |
2702 | UniqueConstantInputs.insert(X: I); |
2703 | else if (!I.isUndef()) |
2704 | UniqueInputs.insert(X: I); |
2705 | } |
2706 | // Adjust mask in case of reused inputs. Also, need to insert constant |
2707 | // inputs at first, otherwise it affects the final outcome. |
2708 | if (UniqueInputs.size() != std::size(Inputs)) { |
2709 | auto &&UniqueVec = UniqueInputs.takeVector(); |
2710 | auto &&UniqueConstantVec = UniqueConstantInputs.takeVector(); |
2711 | unsigned ConstNum = UniqueConstantVec.size(); |
2712 | for (int &Idx : Mask) { |
2713 | if (Idx == PoisonMaskElem) |
2714 | continue; |
2715 | unsigned SrcRegIdx = Idx / NewElts; |
2716 | if (Inputs[SrcRegIdx].isUndef()) { |
2717 | Idx = PoisonMaskElem; |
2718 | continue; |
2719 | } |
2720 | const auto It = find(Range&: UniqueConstantVec, Val: Inputs[SrcRegIdx]); |
2721 | if (It != UniqueConstantVec.end()) { |
2722 | Idx = (Idx % NewElts) + |
2723 | NewElts * std::distance(first: UniqueConstantVec.begin(), last: It); |
2724 | assert(Idx >= 0 && "Expected defined mask idx." ); |
2725 | continue; |
2726 | } |
2727 | const auto RegIt = find(Range&: UniqueVec, Val: Inputs[SrcRegIdx]); |
2728 | assert(RegIt != UniqueVec.end() && "Cannot find non-const value." ); |
2729 | Idx = (Idx % NewElts) + |
2730 | NewElts * (std::distance(first: UniqueVec.begin(), last: RegIt) + ConstNum); |
2731 | assert(Idx >= 0 && "Expected defined mask idx." ); |
2732 | } |
2733 | copy(Range&: UniqueConstantVec, Out: std::begin(arr&: Inputs)); |
2734 | copy(Range&: UniqueVec, Out: std::next(x: std::begin(arr&: Inputs), n: ConstNum)); |
2735 | } |
2736 | }; |
2737 | MakeUniqueInputs(OrigMask); |
2738 | SDValue OrigInputs[4]; |
2739 | copy(Range&: Inputs, Out: std::begin(arr&: OrigInputs)); |
2740 | for (unsigned High = 0; High < 2; ++High) { |
2741 | SDValue &Output = High ? Hi : Lo; |
2742 | |
2743 | // Build a shuffle mask for the output, discovering on the fly which |
2744 | // input vectors to use as shuffle operands. |
2745 | unsigned FirstMaskIdx = High * NewElts; |
2746 | SmallVector<int> Mask(NewElts * std::size(Inputs), PoisonMaskElem); |
2747 | copy(Range: ArrayRef(OrigMask).slice(N: FirstMaskIdx, M: NewElts), Out: Mask.begin()); |
2748 | assert(!Output && "Expected default initialized initial value." ); |
2749 | TryPeekThroughShufflesInputs(Mask); |
2750 | MakeUniqueInputs(Mask); |
2751 | SDValue TmpInputs[4]; |
2752 | copy(Range&: Inputs, Out: std::begin(arr&: TmpInputs)); |
2753 | // Track changes in the output registers. |
2754 | int UsedIdx = -1; |
2755 | bool SecondIteration = false; |
2756 | auto &&AccumulateResults = [&UsedIdx, &SecondIteration](unsigned Idx) { |
2757 | if (UsedIdx < 0) { |
2758 | UsedIdx = Idx; |
2759 | return false; |
2760 | } |
2761 | if (UsedIdx >= 0 && static_cast<unsigned>(UsedIdx) == Idx) |
2762 | SecondIteration = true; |
2763 | return SecondIteration; |
2764 | }; |
2765 | processShuffleMasks( |
2766 | Mask, NumOfSrcRegs: std::size(Inputs), NumOfDestRegs: std::size(Inputs), |
2767 | /*NumOfUsedRegs=*/1, |
2768 | NoInputAction: [&Output, &DAG = DAG, NewVT]() { Output = DAG.getUNDEF(VT: NewVT); }, |
2769 | SingleInputAction: [&Output, &DAG = DAG, NewVT, &DL, &Inputs, |
2770 | &BuildVector](ArrayRef<int> Mask, unsigned Idx, unsigned /*Unused*/) { |
2771 | if (Inputs[Idx]->getOpcode() == ISD::BUILD_VECTOR) |
2772 | Output = BuildVector(Inputs[Idx], Inputs[Idx], Mask); |
2773 | else |
2774 | Output = DAG.getVectorShuffle(VT: NewVT, dl: DL, N1: Inputs[Idx], |
2775 | N2: DAG.getUNDEF(VT: NewVT), Mask); |
2776 | Inputs[Idx] = Output; |
2777 | }, |
2778 | ManyInputsAction: [&AccumulateResults, &Output, &DAG = DAG, NewVT, &DL, &Inputs, |
2779 | &TmpInputs, |
2780 | &BuildVector](ArrayRef<int> Mask, unsigned Idx1, unsigned Idx2) { |
2781 | if (AccumulateResults(Idx1)) { |
2782 | if (Inputs[Idx1]->getOpcode() == ISD::BUILD_VECTOR && |
2783 | Inputs[Idx2]->getOpcode() == ISD::BUILD_VECTOR) |
2784 | Output = BuildVector(Inputs[Idx1], Inputs[Idx2], Mask); |
2785 | else |
2786 | Output = DAG.getVectorShuffle(VT: NewVT, dl: DL, N1: Inputs[Idx1], |
2787 | N2: Inputs[Idx2], Mask); |
2788 | } else { |
2789 | if (TmpInputs[Idx1]->getOpcode() == ISD::BUILD_VECTOR && |
2790 | TmpInputs[Idx2]->getOpcode() == ISD::BUILD_VECTOR) |
2791 | Output = BuildVector(TmpInputs[Idx1], TmpInputs[Idx2], Mask); |
2792 | else |
2793 | Output = DAG.getVectorShuffle(VT: NewVT, dl: DL, N1: TmpInputs[Idx1], |
2794 | N2: TmpInputs[Idx2], Mask); |
2795 | } |
2796 | Inputs[Idx1] = Output; |
2797 | }); |
2798 | copy(Range&: OrigInputs, Out: std::begin(arr&: Inputs)); |
2799 | } |
2800 | } |
2801 | |
2802 | void DAGTypeLegalizer::SplitVecRes_VAARG(SDNode *N, SDValue &Lo, SDValue &Hi) { |
2803 | EVT OVT = N->getValueType(ResNo: 0); |
2804 | EVT NVT = OVT.getHalfNumVectorElementsVT(Context&: *DAG.getContext()); |
2805 | SDValue Chain = N->getOperand(Num: 0); |
2806 | SDValue Ptr = N->getOperand(Num: 1); |
2807 | SDValue SV = N->getOperand(Num: 2); |
2808 | SDLoc dl(N); |
2809 | |
2810 | const Align Alignment = |
2811 | DAG.getDataLayout().getABITypeAlign(Ty: NVT.getTypeForEVT(Context&: *DAG.getContext())); |
2812 | |
2813 | Lo = DAG.getVAArg(VT: NVT, dl, Chain, Ptr, SV, Align: Alignment.value()); |
2814 | Hi = DAG.getVAArg(VT: NVT, dl, Chain: Lo.getValue(R: 1), Ptr, SV, Align: Alignment.value()); |
2815 | Chain = Hi.getValue(R: 1); |
2816 | |
2817 | // Modified the chain - switch anything that used the old chain to use |
2818 | // the new one. |
2819 | ReplaceValueWith(From: SDValue(N, 1), To: Chain); |
2820 | } |
2821 | |
2822 | void DAGTypeLegalizer::SplitVecRes_FP_TO_XINT_SAT(SDNode *N, SDValue &Lo, |
2823 | SDValue &Hi) { |
2824 | EVT DstVTLo, DstVTHi; |
2825 | std::tie(args&: DstVTLo, args&: DstVTHi) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
2826 | SDLoc dl(N); |
2827 | |
2828 | SDValue SrcLo, SrcHi; |
2829 | EVT SrcVT = N->getOperand(Num: 0).getValueType(); |
2830 | if (getTypeAction(VT: SrcVT) == TargetLowering::TypeSplitVector) |
2831 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: SrcLo, Hi&: SrcHi); |
2832 | else |
2833 | std::tie(args&: SrcLo, args&: SrcHi) = DAG.SplitVectorOperand(N, OpNo: 0); |
2834 | |
2835 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: DstVTLo, N1: SrcLo, N2: N->getOperand(Num: 1)); |
2836 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: DstVTHi, N1: SrcHi, N2: N->getOperand(Num: 1)); |
2837 | } |
2838 | |
2839 | void DAGTypeLegalizer::SplitVecRes_VECTOR_REVERSE(SDNode *N, SDValue &Lo, |
2840 | SDValue &Hi) { |
2841 | SDValue InLo, InHi; |
2842 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: InLo, Hi&: InHi); |
2843 | SDLoc DL(N); |
2844 | |
2845 | Lo = DAG.getNode(Opcode: ISD::VECTOR_REVERSE, DL, VT: InHi.getValueType(), Operand: InHi); |
2846 | Hi = DAG.getNode(Opcode: ISD::VECTOR_REVERSE, DL, VT: InLo.getValueType(), Operand: InLo); |
2847 | } |
2848 | |
2849 | void DAGTypeLegalizer::SplitVecRes_VECTOR_SPLICE(SDNode *N, SDValue &Lo, |
2850 | SDValue &Hi) { |
2851 | EVT VT = N->getValueType(ResNo: 0); |
2852 | SDLoc DL(N); |
2853 | |
2854 | EVT LoVT, HiVT; |
2855 | std::tie(args&: LoVT, args&: HiVT) = DAG.GetSplitDestVTs(VT); |
2856 | |
2857 | SDValue Expanded = TLI.expandVectorSplice(Node: N, DAG); |
2858 | Lo = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL, VT: LoVT, N1: Expanded, |
2859 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
2860 | Hi = |
2861 | DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL, VT: HiVT, N1: Expanded, |
2862 | N2: DAG.getVectorIdxConstant(Val: LoVT.getVectorMinNumElements(), DL)); |
2863 | } |
2864 | |
2865 | void DAGTypeLegalizer::SplitVecRes_VP_REVERSE(SDNode *N, SDValue &Lo, |
2866 | SDValue &Hi) { |
2867 | EVT VT = N->getValueType(ResNo: 0); |
2868 | SDValue Val = N->getOperand(Num: 0); |
2869 | SDValue Mask = N->getOperand(Num: 1); |
2870 | SDValue EVL = N->getOperand(Num: 2); |
2871 | SDLoc DL(N); |
2872 | |
2873 | // Fallback to VP_STRIDED_STORE to stack followed by VP_LOAD. |
2874 | Align Alignment = DAG.getReducedAlign(VT, /*UseABI=*/false); |
2875 | |
2876 | EVT MemVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: VT.getVectorElementType(), |
2877 | EC: VT.getVectorElementCount()); |
2878 | SDValue StackPtr = DAG.CreateStackTemporary(Bytes: MemVT.getStoreSize(), Alignment); |
2879 | EVT PtrVT = StackPtr.getValueType(); |
2880 | auto &MF = DAG.getMachineFunction(); |
2881 | auto FrameIndex = cast<FrameIndexSDNode>(Val: StackPtr.getNode())->getIndex(); |
2882 | auto PtrInfo = MachinePointerInfo::getFixedStack(MF, FI: FrameIndex); |
2883 | |
2884 | MachineMemOperand *StoreMMO = DAG.getMachineFunction().getMachineMemOperand( |
2885 | PtrInfo, f: MachineMemOperand::MOStore, s: MemoryLocation::UnknownSize, |
2886 | base_alignment: Alignment); |
2887 | MachineMemOperand *LoadMMO = DAG.getMachineFunction().getMachineMemOperand( |
2888 | PtrInfo, f: MachineMemOperand::MOLoad, s: MemoryLocation::UnknownSize, |
2889 | base_alignment: Alignment); |
2890 | |
2891 | unsigned EltWidth = VT.getScalarSizeInBits() / 8; |
2892 | SDValue NumElemMinus1 = |
2893 | DAG.getNode(Opcode: ISD::SUB, DL, VT: PtrVT, N1: DAG.getZExtOrTrunc(Op: EVL, DL, VT: PtrVT), |
2894 | N2: DAG.getConstant(Val: 1, DL, VT: PtrVT)); |
2895 | SDValue StartOffset = DAG.getNode(Opcode: ISD::MUL, DL, VT: PtrVT, N1: NumElemMinus1, |
2896 | N2: DAG.getConstant(Val: EltWidth, DL, VT: PtrVT)); |
2897 | SDValue StorePtr = DAG.getNode(Opcode: ISD::ADD, DL, VT: PtrVT, N1: StackPtr, N2: StartOffset); |
2898 | SDValue Stride = DAG.getConstant(Val: -(int64_t)EltWidth, DL, VT: PtrVT); |
2899 | |
2900 | SDValue TrueMask = DAG.getBoolConstant(V: true, DL, VT: Mask.getValueType(), OpVT: VT); |
2901 | SDValue Store = DAG.getStridedStoreVP(Chain: DAG.getEntryNode(), DL, Val, Ptr: StorePtr, |
2902 | Offset: DAG.getUNDEF(VT: PtrVT), Stride, Mask: TrueMask, |
2903 | EVL, MemVT, MMO: StoreMMO, AM: ISD::UNINDEXED); |
2904 | |
2905 | SDValue Load = DAG.getLoadVP(VT, dl: DL, Chain: Store, Ptr: StackPtr, Mask, EVL, MMO: LoadMMO); |
2906 | |
2907 | auto [LoVT, HiVT] = DAG.GetSplitDestVTs(VT); |
2908 | Lo = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL, VT: LoVT, N1: Load, |
2909 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
2910 | Hi = |
2911 | DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL, VT: HiVT, N1: Load, |
2912 | N2: DAG.getVectorIdxConstant(Val: LoVT.getVectorMinNumElements(), DL)); |
2913 | } |
2914 | |
2915 | void DAGTypeLegalizer::SplitVecRes_VECTOR_DEINTERLEAVE(SDNode *N) { |
2916 | |
2917 | SDValue Op0Lo, Op0Hi, Op1Lo, Op1Hi; |
2918 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: Op0Lo, Hi&: Op0Hi); |
2919 | GetSplitVector(Op: N->getOperand(Num: 1), Lo&: Op1Lo, Hi&: Op1Hi); |
2920 | EVT VT = Op0Lo.getValueType(); |
2921 | SDLoc DL(N); |
2922 | SDValue ResLo = DAG.getNode(Opcode: ISD::VECTOR_DEINTERLEAVE, DL, |
2923 | VTList: DAG.getVTList(VT1: VT, VT2: VT), N1: Op0Lo, N2: Op0Hi); |
2924 | SDValue ResHi = DAG.getNode(Opcode: ISD::VECTOR_DEINTERLEAVE, DL, |
2925 | VTList: DAG.getVTList(VT1: VT, VT2: VT), N1: Op1Lo, N2: Op1Hi); |
2926 | |
2927 | SetSplitVector(Op: SDValue(N, 0), Lo: ResLo.getValue(R: 0), Hi: ResHi.getValue(R: 0)); |
2928 | SetSplitVector(Op: SDValue(N, 1), Lo: ResLo.getValue(R: 1), Hi: ResHi.getValue(R: 1)); |
2929 | } |
2930 | |
2931 | void DAGTypeLegalizer::SplitVecRes_VECTOR_INTERLEAVE(SDNode *N) { |
2932 | SDValue Op0Lo, Op0Hi, Op1Lo, Op1Hi; |
2933 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: Op0Lo, Hi&: Op0Hi); |
2934 | GetSplitVector(Op: N->getOperand(Num: 1), Lo&: Op1Lo, Hi&: Op1Hi); |
2935 | EVT VT = Op0Lo.getValueType(); |
2936 | SDLoc DL(N); |
2937 | SDValue Res[] = {DAG.getNode(Opcode: ISD::VECTOR_INTERLEAVE, DL, |
2938 | VTList: DAG.getVTList(VT1: VT, VT2: VT), N1: Op0Lo, N2: Op1Lo), |
2939 | DAG.getNode(Opcode: ISD::VECTOR_INTERLEAVE, DL, |
2940 | VTList: DAG.getVTList(VT1: VT, VT2: VT), N1: Op0Hi, N2: Op1Hi)}; |
2941 | |
2942 | SetSplitVector(Op: SDValue(N, 0), Lo: Res[0].getValue(R: 0), Hi: Res[0].getValue(R: 1)); |
2943 | SetSplitVector(Op: SDValue(N, 1), Lo: Res[1].getValue(R: 0), Hi: Res[1].getValue(R: 1)); |
2944 | } |
2945 | |
2946 | //===----------------------------------------------------------------------===// |
2947 | // Operand Vector Splitting |
2948 | //===----------------------------------------------------------------------===// |
2949 | |
2950 | /// This method is called when the specified operand of the specified node is |
2951 | /// found to need vector splitting. At this point, all of the result types of |
2952 | /// the node are known to be legal, but other operands of the node may need |
2953 | /// legalization as well as the specified one. |
2954 | bool DAGTypeLegalizer::SplitVectorOperand(SDNode *N, unsigned OpNo) { |
2955 | LLVM_DEBUG(dbgs() << "Split node operand: " ; N->dump(&DAG)); |
2956 | SDValue Res = SDValue(); |
2957 | |
2958 | // See if the target wants to custom split this node. |
2959 | if (CustomLowerNode(N, VT: N->getOperand(Num: OpNo).getValueType(), LegalizeResult: false)) |
2960 | return false; |
2961 | |
2962 | switch (N->getOpcode()) { |
2963 | default: |
2964 | #ifndef NDEBUG |
2965 | dbgs() << "SplitVectorOperand Op #" << OpNo << ": " ; |
2966 | N->dump(G: &DAG); |
2967 | dbgs() << "\n" ; |
2968 | #endif |
2969 | report_fatal_error(reason: "Do not know how to split this operator's " |
2970 | "operand!\n" ); |
2971 | |
2972 | case ISD::VP_SETCC: |
2973 | case ISD::SETCC: Res = SplitVecOp_VSETCC(N); break; |
2974 | case ISD::BITCAST: Res = SplitVecOp_BITCAST(N); break; |
2975 | case ISD::EXTRACT_SUBVECTOR: Res = SplitVecOp_EXTRACT_SUBVECTOR(N); break; |
2976 | case ISD::INSERT_SUBVECTOR: Res = SplitVecOp_INSERT_SUBVECTOR(N, OpNo); break; |
2977 | case ISD::EXTRACT_VECTOR_ELT:Res = SplitVecOp_EXTRACT_VECTOR_ELT(N); break; |
2978 | case ISD::CONCAT_VECTORS: Res = SplitVecOp_CONCAT_VECTORS(N); break; |
2979 | case ISD::VP_TRUNCATE: |
2980 | case ISD::TRUNCATE: |
2981 | Res = SplitVecOp_TruncateHelper(N); |
2982 | break; |
2983 | case ISD::STRICT_FP_ROUND: |
2984 | case ISD::VP_FP_ROUND: |
2985 | case ISD::FP_ROUND: Res = SplitVecOp_FP_ROUND(N); break; |
2986 | case ISD::FCOPYSIGN: Res = SplitVecOp_FPOpDifferentTypes(N); break; |
2987 | case ISD::STORE: |
2988 | Res = SplitVecOp_STORE(N: cast<StoreSDNode>(Val: N), OpNo); |
2989 | break; |
2990 | case ISD::VP_STORE: |
2991 | Res = SplitVecOp_VP_STORE(N: cast<VPStoreSDNode>(Val: N), OpNo); |
2992 | break; |
2993 | case ISD::EXPERIMENTAL_VP_STRIDED_STORE: |
2994 | Res = SplitVecOp_VP_STRIDED_STORE(N: cast<VPStridedStoreSDNode>(Val: N), OpNo); |
2995 | break; |
2996 | case ISD::MSTORE: |
2997 | Res = SplitVecOp_MSTORE(N: cast<MaskedStoreSDNode>(Val: N), OpNo); |
2998 | break; |
2999 | case ISD::MSCATTER: |
3000 | case ISD::VP_SCATTER: |
3001 | Res = SplitVecOp_Scatter(N: cast<MemSDNode>(Val: N), OpNo); |
3002 | break; |
3003 | case ISD::MGATHER: |
3004 | case ISD::VP_GATHER: |
3005 | Res = SplitVecOp_Gather(MGT: cast<MemSDNode>(Val: N), OpNo); |
3006 | break; |
3007 | case ISD::VSELECT: |
3008 | Res = SplitVecOp_VSELECT(N, OpNo); |
3009 | break; |
3010 | case ISD::STRICT_SINT_TO_FP: |
3011 | case ISD::STRICT_UINT_TO_FP: |
3012 | case ISD::SINT_TO_FP: |
3013 | case ISD::UINT_TO_FP: |
3014 | case ISD::VP_SINT_TO_FP: |
3015 | case ISD::VP_UINT_TO_FP: |
3016 | if (N->getValueType(ResNo: 0).bitsLT( |
3017 | VT: N->getOperand(Num: N->isStrictFPOpcode() ? 1 : 0).getValueType())) |
3018 | Res = SplitVecOp_TruncateHelper(N); |
3019 | else |
3020 | Res = SplitVecOp_UnaryOp(N); |
3021 | break; |
3022 | case ISD::FP_TO_SINT_SAT: |
3023 | case ISD::FP_TO_UINT_SAT: |
3024 | Res = SplitVecOp_FP_TO_XINT_SAT(N); |
3025 | break; |
3026 | case ISD::FP_TO_SINT: |
3027 | case ISD::FP_TO_UINT: |
3028 | case ISD::VP_FP_TO_SINT: |
3029 | case ISD::VP_FP_TO_UINT: |
3030 | case ISD::STRICT_FP_TO_SINT: |
3031 | case ISD::STRICT_FP_TO_UINT: |
3032 | case ISD::STRICT_FP_EXTEND: |
3033 | case ISD::FP_EXTEND: |
3034 | case ISD::SIGN_EXTEND: |
3035 | case ISD::ZERO_EXTEND: |
3036 | case ISD::ANY_EXTEND: |
3037 | case ISD::FTRUNC: |
3038 | case ISD::LRINT: |
3039 | case ISD::LLRINT: |
3040 | Res = SplitVecOp_UnaryOp(N); |
3041 | break; |
3042 | case ISD::FLDEXP: |
3043 | Res = SplitVecOp_FPOpDifferentTypes(N); |
3044 | break; |
3045 | |
3046 | case ISD::ANY_EXTEND_VECTOR_INREG: |
3047 | case ISD::SIGN_EXTEND_VECTOR_INREG: |
3048 | case ISD::ZERO_EXTEND_VECTOR_INREG: |
3049 | Res = SplitVecOp_ExtVecInRegOp(N); |
3050 | break; |
3051 | |
3052 | case ISD::VECREDUCE_FADD: |
3053 | case ISD::VECREDUCE_FMUL: |
3054 | case ISD::VECREDUCE_ADD: |
3055 | case ISD::VECREDUCE_MUL: |
3056 | case ISD::VECREDUCE_AND: |
3057 | case ISD::VECREDUCE_OR: |
3058 | case ISD::VECREDUCE_XOR: |
3059 | case ISD::VECREDUCE_SMAX: |
3060 | case ISD::VECREDUCE_SMIN: |
3061 | case ISD::VECREDUCE_UMAX: |
3062 | case ISD::VECREDUCE_UMIN: |
3063 | case ISD::VECREDUCE_FMAX: |
3064 | case ISD::VECREDUCE_FMIN: |
3065 | case ISD::VECREDUCE_FMAXIMUM: |
3066 | case ISD::VECREDUCE_FMINIMUM: |
3067 | Res = SplitVecOp_VECREDUCE(N, OpNo); |
3068 | break; |
3069 | case ISD::VECREDUCE_SEQ_FADD: |
3070 | case ISD::VECREDUCE_SEQ_FMUL: |
3071 | Res = SplitVecOp_VECREDUCE_SEQ(N); |
3072 | break; |
3073 | case ISD::VP_REDUCE_FADD: |
3074 | case ISD::VP_REDUCE_SEQ_FADD: |
3075 | case ISD::VP_REDUCE_FMUL: |
3076 | case ISD::VP_REDUCE_SEQ_FMUL: |
3077 | case ISD::VP_REDUCE_ADD: |
3078 | case ISD::VP_REDUCE_MUL: |
3079 | case ISD::VP_REDUCE_AND: |
3080 | case ISD::VP_REDUCE_OR: |
3081 | case ISD::VP_REDUCE_XOR: |
3082 | case ISD::VP_REDUCE_SMAX: |
3083 | case ISD::VP_REDUCE_SMIN: |
3084 | case ISD::VP_REDUCE_UMAX: |
3085 | case ISD::VP_REDUCE_UMIN: |
3086 | case ISD::VP_REDUCE_FMAX: |
3087 | case ISD::VP_REDUCE_FMIN: |
3088 | Res = SplitVecOp_VP_REDUCE(N, OpNo); |
3089 | break; |
3090 | } |
3091 | |
3092 | // If the result is null, the sub-method took care of registering results etc. |
3093 | if (!Res.getNode()) return false; |
3094 | |
3095 | // If the result is N, the sub-method updated N in place. Tell the legalizer |
3096 | // core about this. |
3097 | if (Res.getNode() == N) |
3098 | return true; |
3099 | |
3100 | if (N->isStrictFPOpcode()) |
3101 | assert(Res.getValueType() == N->getValueType(0) && N->getNumValues() == 2 && |
3102 | "Invalid operand expansion" ); |
3103 | else |
3104 | assert(Res.getValueType() == N->getValueType(0) && N->getNumValues() == 1 && |
3105 | "Invalid operand expansion" ); |
3106 | |
3107 | ReplaceValueWith(From: SDValue(N, 0), To: Res); |
3108 | return false; |
3109 | } |
3110 | |
3111 | SDValue DAGTypeLegalizer::SplitVecOp_VSELECT(SDNode *N, unsigned OpNo) { |
3112 | // The only possibility for an illegal operand is the mask, since result type |
3113 | // legalization would have handled this node already otherwise. |
3114 | assert(OpNo == 0 && "Illegal operand must be mask" ); |
3115 | |
3116 | SDValue Mask = N->getOperand(Num: 0); |
3117 | SDValue Src0 = N->getOperand(Num: 1); |
3118 | SDValue Src1 = N->getOperand(Num: 2); |
3119 | EVT Src0VT = Src0.getValueType(); |
3120 | SDLoc DL(N); |
3121 | assert(Mask.getValueType().isVector() && "VSELECT without a vector mask?" ); |
3122 | |
3123 | SDValue Lo, Hi; |
3124 | GetSplitVector(Op: N->getOperand(Num: 0), Lo, Hi); |
3125 | assert(Lo.getValueType() == Hi.getValueType() && |
3126 | "Lo and Hi have differing types" ); |
3127 | |
3128 | EVT LoOpVT, HiOpVT; |
3129 | std::tie(args&: LoOpVT, args&: HiOpVT) = DAG.GetSplitDestVTs(VT: Src0VT); |
3130 | assert(LoOpVT == HiOpVT && "Asymmetric vector split?" ); |
3131 | |
3132 | SDValue LoOp0, HiOp0, LoOp1, HiOp1, LoMask, HiMask; |
3133 | std::tie(args&: LoOp0, args&: HiOp0) = DAG.SplitVector(N: Src0, DL); |
3134 | std::tie(args&: LoOp1, args&: HiOp1) = DAG.SplitVector(N: Src1, DL); |
3135 | std::tie(args&: LoMask, args&: HiMask) = DAG.SplitVector(N: Mask, DL); |
3136 | |
3137 | SDValue LoSelect = |
3138 | DAG.getNode(Opcode: ISD::VSELECT, DL, VT: LoOpVT, N1: LoMask, N2: LoOp0, N3: LoOp1); |
3139 | SDValue HiSelect = |
3140 | DAG.getNode(Opcode: ISD::VSELECT, DL, VT: HiOpVT, N1: HiMask, N2: HiOp0, N3: HiOp1); |
3141 | |
3142 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL, VT: Src0VT, N1: LoSelect, N2: HiSelect); |
3143 | } |
3144 | |
3145 | SDValue DAGTypeLegalizer::SplitVecOp_VECREDUCE(SDNode *N, unsigned OpNo) { |
3146 | EVT ResVT = N->getValueType(ResNo: 0); |
3147 | SDValue Lo, Hi; |
3148 | SDLoc dl(N); |
3149 | |
3150 | SDValue VecOp = N->getOperand(Num: OpNo); |
3151 | EVT VecVT = VecOp.getValueType(); |
3152 | assert(VecVT.isVector() && "Can only split reduce vector operand" ); |
3153 | GetSplitVector(Op: VecOp, Lo, Hi); |
3154 | EVT LoOpVT, HiOpVT; |
3155 | std::tie(args&: LoOpVT, args&: HiOpVT) = DAG.GetSplitDestVTs(VT: VecVT); |
3156 | |
3157 | // Use the appropriate scalar instruction on the split subvectors before |
3158 | // reducing the now partially reduced smaller vector. |
3159 | unsigned CombineOpc = ISD::getVecReduceBaseOpcode(VecReduceOpcode: N->getOpcode()); |
3160 | SDValue Partial = DAG.getNode(Opcode: CombineOpc, DL: dl, VT: LoOpVT, N1: Lo, N2: Hi, Flags: N->getFlags()); |
3161 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: ResVT, Operand: Partial, Flags: N->getFlags()); |
3162 | } |
3163 | |
3164 | SDValue DAGTypeLegalizer::SplitVecOp_VECREDUCE_SEQ(SDNode *N) { |
3165 | EVT ResVT = N->getValueType(ResNo: 0); |
3166 | SDValue Lo, Hi; |
3167 | SDLoc dl(N); |
3168 | |
3169 | SDValue AccOp = N->getOperand(Num: 0); |
3170 | SDValue VecOp = N->getOperand(Num: 1); |
3171 | SDNodeFlags Flags = N->getFlags(); |
3172 | |
3173 | EVT VecVT = VecOp.getValueType(); |
3174 | assert(VecVT.isVector() && "Can only split reduce vector operand" ); |
3175 | GetSplitVector(Op: VecOp, Lo, Hi); |
3176 | EVT LoOpVT, HiOpVT; |
3177 | std::tie(args&: LoOpVT, args&: HiOpVT) = DAG.GetSplitDestVTs(VT: VecVT); |
3178 | |
3179 | // Reduce low half. |
3180 | SDValue Partial = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: ResVT, N1: AccOp, N2: Lo, Flags); |
3181 | |
3182 | // Reduce high half, using low half result as initial value. |
3183 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: ResVT, N1: Partial, N2: Hi, Flags); |
3184 | } |
3185 | |
3186 | SDValue DAGTypeLegalizer::SplitVecOp_VP_REDUCE(SDNode *N, unsigned OpNo) { |
3187 | assert(N->isVPOpcode() && "Expected VP opcode" ); |
3188 | assert(OpNo == 1 && "Can only split reduce vector operand" ); |
3189 | |
3190 | unsigned Opc = N->getOpcode(); |
3191 | EVT ResVT = N->getValueType(ResNo: 0); |
3192 | SDValue Lo, Hi; |
3193 | SDLoc dl(N); |
3194 | |
3195 | SDValue VecOp = N->getOperand(Num: OpNo); |
3196 | EVT VecVT = VecOp.getValueType(); |
3197 | assert(VecVT.isVector() && "Can only split reduce vector operand" ); |
3198 | GetSplitVector(Op: VecOp, Lo, Hi); |
3199 | |
3200 | SDValue MaskLo, MaskHi; |
3201 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: N->getOperand(Num: 2)); |
3202 | |
3203 | SDValue EVLLo, EVLHi; |
3204 | std::tie(args&: EVLLo, args&: EVLHi) = DAG.SplitEVL(N: N->getOperand(Num: 3), VecVT, DL: dl); |
3205 | |
3206 | const SDNodeFlags Flags = N->getFlags(); |
3207 | |
3208 | SDValue ResLo = |
3209 | DAG.getNode(Opcode: Opc, DL: dl, VT: ResVT, Ops: {N->getOperand(Num: 0), Lo, MaskLo, EVLLo}, Flags); |
3210 | return DAG.getNode(Opcode: Opc, DL: dl, VT: ResVT, Ops: {ResLo, Hi, MaskHi, EVLHi}, Flags); |
3211 | } |
3212 | |
3213 | SDValue DAGTypeLegalizer::SplitVecOp_UnaryOp(SDNode *N) { |
3214 | // The result has a legal vector type, but the input needs splitting. |
3215 | EVT ResVT = N->getValueType(ResNo: 0); |
3216 | SDValue Lo, Hi; |
3217 | SDLoc dl(N); |
3218 | GetSplitVector(Op: N->getOperand(Num: N->isStrictFPOpcode() ? 1 : 0), Lo, Hi); |
3219 | EVT InVT = Lo.getValueType(); |
3220 | |
3221 | EVT OutVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: ResVT.getVectorElementType(), |
3222 | EC: InVT.getVectorElementCount()); |
3223 | |
3224 | if (N->isStrictFPOpcode()) { |
3225 | Lo = DAG.getNode(N->getOpcode(), dl, { OutVT, MVT::Other }, |
3226 | { N->getOperand(0), Lo }); |
3227 | Hi = DAG.getNode(N->getOpcode(), dl, { OutVT, MVT::Other }, |
3228 | { N->getOperand(0), Hi }); |
3229 | |
3230 | // Build a factor node to remember that this operation is independent |
3231 | // of the other one. |
3232 | SDValue Ch = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo.getValue(R: 1), |
3233 | Hi.getValue(R: 1)); |
3234 | |
3235 | // Legalize the chain result - switch anything that used the old chain to |
3236 | // use the new one. |
3237 | ReplaceValueWith(From: SDValue(N, 1), To: Ch); |
3238 | } else if (N->getNumOperands() == 3) { |
3239 | assert(N->isVPOpcode() && "Expected VP opcode" ); |
3240 | SDValue MaskLo, MaskHi, EVLLo, EVLHi; |
3241 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: N->getOperand(Num: 1)); |
3242 | std::tie(args&: EVLLo, args&: EVLHi) = |
3243 | DAG.SplitEVL(N: N->getOperand(Num: 2), VecVT: N->getValueType(ResNo: 0), DL: dl); |
3244 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: OutVT, N1: Lo, N2: MaskLo, N3: EVLLo); |
3245 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: OutVT, N1: Hi, N2: MaskHi, N3: EVLHi); |
3246 | } else { |
3247 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: OutVT, Operand: Lo); |
3248 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: OutVT, Operand: Hi); |
3249 | } |
3250 | |
3251 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: ResVT, N1: Lo, N2: Hi); |
3252 | } |
3253 | |
3254 | SDValue DAGTypeLegalizer::SplitVecOp_BITCAST(SDNode *N) { |
3255 | // For example, i64 = BITCAST v4i16 on alpha. Typically the vector will |
3256 | // end up being split all the way down to individual components. Convert the |
3257 | // split pieces into integers and reassemble. |
3258 | SDValue Lo, Hi; |
3259 | GetSplitVector(Op: N->getOperand(Num: 0), Lo, Hi); |
3260 | Lo = BitConvertToInteger(Op: Lo); |
3261 | Hi = BitConvertToInteger(Op: Hi); |
3262 | |
3263 | if (DAG.getDataLayout().isBigEndian()) |
3264 | std::swap(a&: Lo, b&: Hi); |
3265 | |
3266 | return DAG.getNode(Opcode: ISD::BITCAST, DL: SDLoc(N), VT: N->getValueType(ResNo: 0), |
3267 | Operand: JoinIntegers(Lo, Hi)); |
3268 | } |
3269 | |
3270 | SDValue DAGTypeLegalizer::SplitVecOp_INSERT_SUBVECTOR(SDNode *N, |
3271 | unsigned OpNo) { |
3272 | assert(OpNo == 1 && "Invalid OpNo; can only split SubVec." ); |
3273 | // We know that the result type is legal. |
3274 | EVT ResVT = N->getValueType(ResNo: 0); |
3275 | |
3276 | SDValue Vec = N->getOperand(Num: 0); |
3277 | SDValue SubVec = N->getOperand(Num: 1); |
3278 | SDValue Idx = N->getOperand(Num: 2); |
3279 | SDLoc dl(N); |
3280 | |
3281 | SDValue Lo, Hi; |
3282 | GetSplitVector(Op: SubVec, Lo, Hi); |
3283 | |
3284 | uint64_t IdxVal = Idx->getAsZExtVal(); |
3285 | uint64_t LoElts = Lo.getValueType().getVectorMinNumElements(); |
3286 | |
3287 | SDValue FirstInsertion = |
3288 | DAG.getNode(Opcode: ISD::INSERT_SUBVECTOR, DL: dl, VT: ResVT, N1: Vec, N2: Lo, N3: Idx); |
3289 | SDValue SecondInsertion = |
3290 | DAG.getNode(Opcode: ISD::INSERT_SUBVECTOR, DL: dl, VT: ResVT, N1: FirstInsertion, N2: Hi, |
3291 | N3: DAG.getVectorIdxConstant(Val: IdxVal + LoElts, DL: dl)); |
3292 | |
3293 | return SecondInsertion; |
3294 | } |
3295 | |
3296 | SDValue DAGTypeLegalizer::(SDNode *N) { |
3297 | // We know that the extracted result type is legal. |
3298 | EVT SubVT = N->getValueType(ResNo: 0); |
3299 | SDValue Idx = N->getOperand(Num: 1); |
3300 | SDLoc dl(N); |
3301 | SDValue Lo, Hi; |
3302 | |
3303 | GetSplitVector(Op: N->getOperand(Num: 0), Lo, Hi); |
3304 | |
3305 | uint64_t LoEltsMin = Lo.getValueType().getVectorMinNumElements(); |
3306 | uint64_t IdxVal = Idx->getAsZExtVal(); |
3307 | |
3308 | if (IdxVal < LoEltsMin) { |
3309 | assert(IdxVal + SubVT.getVectorMinNumElements() <= LoEltsMin && |
3310 | "Extracted subvector crosses vector split!" ); |
3311 | return DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: SubVT, N1: Lo, N2: Idx); |
3312 | } else if (SubVT.isScalableVector() == |
3313 | N->getOperand(Num: 0).getValueType().isScalableVector()) |
3314 | return DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: SubVT, N1: Hi, |
3315 | N2: DAG.getVectorIdxConstant(Val: IdxVal - LoEltsMin, DL: dl)); |
3316 | |
3317 | // After this point the DAG node only permits extracting fixed-width |
3318 | // subvectors from scalable vectors. |
3319 | assert(SubVT.isFixedLengthVector() && |
3320 | "Extracting scalable subvector from fixed-width unsupported" ); |
3321 | |
3322 | // If the element type is i1 and we're not promoting the result, then we may |
3323 | // end up loading the wrong data since the bits are packed tightly into |
3324 | // bytes. For example, if we extract a v4i1 (legal) from a nxv4i1 (legal) |
3325 | // type at index 4, then we will load a byte starting at index 0. |
3326 | if (SubVT.getScalarType() == MVT::i1) |
3327 | report_fatal_error(reason: "Don't know how to extract fixed-width predicate " |
3328 | "subvector from a scalable predicate vector" ); |
3329 | |
3330 | // Spill the vector to the stack. We should use the alignment for |
3331 | // the smallest part. |
3332 | SDValue Vec = N->getOperand(Num: 0); |
3333 | EVT VecVT = Vec.getValueType(); |
3334 | Align SmallestAlign = DAG.getReducedAlign(VT: VecVT, /*UseABI=*/false); |
3335 | SDValue StackPtr = |
3336 | DAG.CreateStackTemporary(Bytes: VecVT.getStoreSize(), Alignment: SmallestAlign); |
3337 | auto &MF = DAG.getMachineFunction(); |
3338 | auto FrameIndex = cast<FrameIndexSDNode>(Val: StackPtr.getNode())->getIndex(); |
3339 | auto PtrInfo = MachinePointerInfo::getFixedStack(MF, FI: FrameIndex); |
3340 | |
3341 | SDValue Store = DAG.getStore(Chain: DAG.getEntryNode(), dl, Val: Vec, Ptr: StackPtr, PtrInfo, |
3342 | Alignment: SmallestAlign); |
3343 | |
3344 | // Extract the subvector by loading the correct part. |
3345 | StackPtr = TLI.getVectorSubVecPointer(DAG, VecPtr: StackPtr, VecVT, SubVecVT: SubVT, Index: Idx); |
3346 | |
3347 | return DAG.getLoad( |
3348 | VT: SubVT, dl, Chain: Store, Ptr: StackPtr, |
3349 | PtrInfo: MachinePointerInfo::getUnknownStack(MF&: DAG.getMachineFunction())); |
3350 | } |
3351 | |
3352 | SDValue DAGTypeLegalizer::(SDNode *N) { |
3353 | SDValue Vec = N->getOperand(Num: 0); |
3354 | SDValue Idx = N->getOperand(Num: 1); |
3355 | EVT VecVT = Vec.getValueType(); |
3356 | |
3357 | if (const ConstantSDNode *Index = dyn_cast<ConstantSDNode>(Val&: Idx)) { |
3358 | uint64_t IdxVal = Index->getZExtValue(); |
3359 | |
3360 | SDValue Lo, Hi; |
3361 | GetSplitVector(Op: Vec, Lo, Hi); |
3362 | |
3363 | uint64_t LoElts = Lo.getValueType().getVectorMinNumElements(); |
3364 | |
3365 | if (IdxVal < LoElts) |
3366 | return SDValue(DAG.UpdateNodeOperands(N, Op1: Lo, Op2: Idx), 0); |
3367 | else if (!Vec.getValueType().isScalableVector()) |
3368 | return SDValue(DAG.UpdateNodeOperands(N, Op1: Hi, |
3369 | Op2: DAG.getConstant(Val: IdxVal - LoElts, DL: SDLoc(N), |
3370 | VT: Idx.getValueType())), 0); |
3371 | } |
3372 | |
3373 | // See if the target wants to custom expand this node. |
3374 | if (CustomLowerNode(N, VT: N->getValueType(ResNo: 0), LegalizeResult: true)) |
3375 | return SDValue(); |
3376 | |
3377 | // Make the vector elements byte-addressable if they aren't already. |
3378 | SDLoc dl(N); |
3379 | EVT EltVT = VecVT.getVectorElementType(); |
3380 | if (VecVT.getScalarSizeInBits() < 8) { |
3381 | EltVT = MVT::i8; |
3382 | VecVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: EltVT, |
3383 | EC: VecVT.getVectorElementCount()); |
3384 | Vec = DAG.getNode(Opcode: ISD::ANY_EXTEND, DL: dl, VT: VecVT, Operand: Vec); |
3385 | } |
3386 | |
3387 | // Store the vector to the stack. |
3388 | // In cases where the vector is illegal it will be broken down into parts |
3389 | // and stored in parts - we should use the alignment for the smallest part. |
3390 | Align SmallestAlign = DAG.getReducedAlign(VT: VecVT, /*UseABI=*/false); |
3391 | SDValue StackPtr = |
3392 | DAG.CreateStackTemporary(Bytes: VecVT.getStoreSize(), Alignment: SmallestAlign); |
3393 | auto &MF = DAG.getMachineFunction(); |
3394 | auto FrameIndex = cast<FrameIndexSDNode>(Val: StackPtr.getNode())->getIndex(); |
3395 | auto PtrInfo = MachinePointerInfo::getFixedStack(MF, FI: FrameIndex); |
3396 | SDValue Store = DAG.getStore(Chain: DAG.getEntryNode(), dl, Val: Vec, Ptr: StackPtr, PtrInfo, |
3397 | Alignment: SmallestAlign); |
3398 | |
3399 | // Load back the required element. |
3400 | StackPtr = TLI.getVectorElementPointer(DAG, VecPtr: StackPtr, VecVT, Index: Idx); |
3401 | |
3402 | // FIXME: This is to handle i1 vectors with elements promoted to i8. |
3403 | // i1 vector handling needs general improvement. |
3404 | if (N->getValueType(ResNo: 0).bitsLT(VT: EltVT)) { |
3405 | SDValue Load = DAG.getLoad(VT: EltVT, dl, Chain: Store, Ptr: StackPtr, |
3406 | PtrInfo: MachinePointerInfo::getUnknownStack(MF&: DAG.getMachineFunction())); |
3407 | return DAG.getZExtOrTrunc(Op: Load, DL: dl, VT: N->getValueType(ResNo: 0)); |
3408 | } |
3409 | |
3410 | return DAG.getExtLoad( |
3411 | ExtType: ISD::EXTLOAD, dl, VT: N->getValueType(ResNo: 0), Chain: Store, Ptr: StackPtr, |
3412 | PtrInfo: MachinePointerInfo::getUnknownStack(MF&: DAG.getMachineFunction()), MemVT: EltVT, |
3413 | Alignment: commonAlignment(A: SmallestAlign, Offset: EltVT.getFixedSizeInBits() / 8)); |
3414 | } |
3415 | |
3416 | SDValue DAGTypeLegalizer::SplitVecOp_ExtVecInRegOp(SDNode *N) { |
3417 | SDValue Lo, Hi; |
3418 | |
3419 | // *_EXTEND_VECTOR_INREG only reference the lower half of the input, so |
3420 | // splitting the result has the same effect as splitting the input operand. |
3421 | SplitVecRes_ExtVecInRegOp(N, Lo, Hi); |
3422 | |
3423 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: SDLoc(N), VT: N->getValueType(ResNo: 0), N1: Lo, N2: Hi); |
3424 | } |
3425 | |
3426 | SDValue DAGTypeLegalizer::SplitVecOp_Gather(MemSDNode *N, unsigned OpNo) { |
3427 | (void)OpNo; |
3428 | SDValue Lo, Hi; |
3429 | SplitVecRes_Gather(N, Lo, Hi); |
3430 | |
3431 | SDValue Res = DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: N, VT: N->getValueType(ResNo: 0), N1: Lo, N2: Hi); |
3432 | ReplaceValueWith(From: SDValue(N, 0), To: Res); |
3433 | return SDValue(); |
3434 | } |
3435 | |
3436 | SDValue DAGTypeLegalizer::SplitVecOp_VP_STORE(VPStoreSDNode *N, unsigned OpNo) { |
3437 | assert(N->isUnindexed() && "Indexed vp_store of vector?" ); |
3438 | SDValue Ch = N->getChain(); |
3439 | SDValue Ptr = N->getBasePtr(); |
3440 | SDValue Offset = N->getOffset(); |
3441 | assert(Offset.isUndef() && "Unexpected VP store offset" ); |
3442 | SDValue Mask = N->getMask(); |
3443 | SDValue EVL = N->getVectorLength(); |
3444 | SDValue Data = N->getValue(); |
3445 | Align Alignment = N->getOriginalAlign(); |
3446 | SDLoc DL(N); |
3447 | |
3448 | SDValue DataLo, DataHi; |
3449 | if (getTypeAction(VT: Data.getValueType()) == TargetLowering::TypeSplitVector) |
3450 | // Split Data operand |
3451 | GetSplitVector(Op: Data, Lo&: DataLo, Hi&: DataHi); |
3452 | else |
3453 | std::tie(args&: DataLo, args&: DataHi) = DAG.SplitVector(N: Data, DL); |
3454 | |
3455 | // Split Mask operand |
3456 | SDValue MaskLo, MaskHi; |
3457 | if (OpNo == 1 && Mask.getOpcode() == ISD::SETCC) { |
3458 | SplitVecRes_SETCC(N: Mask.getNode(), Lo&: MaskLo, Hi&: MaskHi); |
3459 | } else { |
3460 | if (getTypeAction(VT: Mask.getValueType()) == TargetLowering::TypeSplitVector) |
3461 | GetSplitVector(Op: Mask, Lo&: MaskLo, Hi&: MaskHi); |
3462 | else |
3463 | std::tie(args&: MaskLo, args&: MaskHi) = DAG.SplitVector(N: Mask, DL); |
3464 | } |
3465 | |
3466 | EVT MemoryVT = N->getMemoryVT(); |
3467 | EVT LoMemVT, HiMemVT; |
3468 | bool HiIsEmpty = false; |
3469 | std::tie(args&: LoMemVT, args&: HiMemVT) = |
3470 | DAG.GetDependentSplitDestVTs(VT: MemoryVT, EnvVT: DataLo.getValueType(), HiIsEmpty: &HiIsEmpty); |
3471 | |
3472 | // Split EVL |
3473 | SDValue EVLLo, EVLHi; |
3474 | std::tie(args&: EVLLo, args&: EVLHi) = DAG.SplitEVL(N: EVL, VecVT: Data.getValueType(), DL); |
3475 | |
3476 | SDValue Lo, Hi; |
3477 | MachineMemOperand *MMO = DAG.getMachineFunction().getMachineMemOperand( |
3478 | PtrInfo: N->getPointerInfo(), f: MachineMemOperand::MOStore, |
3479 | s: MemoryLocation::UnknownSize, base_alignment: Alignment, AAInfo: N->getAAInfo(), Ranges: N->getRanges()); |
3480 | |
3481 | Lo = DAG.getStoreVP(Chain: Ch, dl: DL, Val: DataLo, Ptr, Offset, Mask: MaskLo, EVL: EVLLo, MemVT: LoMemVT, MMO, |
3482 | AM: N->getAddressingMode(), IsTruncating: N->isTruncatingStore(), |
3483 | IsCompressing: N->isCompressingStore()); |
3484 | |
3485 | // If the hi vp_store has zero storage size, only the lo vp_store is needed. |
3486 | if (HiIsEmpty) |
3487 | return Lo; |
3488 | |
3489 | Ptr = TLI.IncrementMemoryAddress(Addr: Ptr, Mask: MaskLo, DL, DataVT: LoMemVT, DAG, |
3490 | IsCompressedMemory: N->isCompressingStore()); |
3491 | |
3492 | MachinePointerInfo MPI; |
3493 | if (LoMemVT.isScalableVector()) { |
3494 | Alignment = commonAlignment(A: Alignment, |
3495 | Offset: LoMemVT.getSizeInBits().getKnownMinValue() / 8); |
3496 | MPI = MachinePointerInfo(N->getPointerInfo().getAddrSpace()); |
3497 | } else |
3498 | MPI = N->getPointerInfo().getWithOffset( |
3499 | O: LoMemVT.getStoreSize().getFixedValue()); |
3500 | |
3501 | MMO = DAG.getMachineFunction().getMachineMemOperand( |
3502 | PtrInfo: MPI, f: MachineMemOperand::MOStore, s: MemoryLocation::UnknownSize, base_alignment: Alignment, |
3503 | AAInfo: N->getAAInfo(), Ranges: N->getRanges()); |
3504 | |
3505 | Hi = DAG.getStoreVP(Chain: Ch, dl: DL, Val: DataHi, Ptr, Offset, Mask: MaskHi, EVL: EVLHi, MemVT: HiMemVT, MMO, |
3506 | AM: N->getAddressingMode(), IsTruncating: N->isTruncatingStore(), |
3507 | IsCompressing: N->isCompressingStore()); |
3508 | |
3509 | // Build a factor node to remember that this store is independent of the |
3510 | // other one. |
3511 | return DAG.getNode(ISD::TokenFactor, DL, MVT::Other, Lo, Hi); |
3512 | } |
3513 | |
3514 | SDValue DAGTypeLegalizer::SplitVecOp_VP_STRIDED_STORE(VPStridedStoreSDNode *N, |
3515 | unsigned OpNo) { |
3516 | assert(N->isUnindexed() && "Indexed vp_strided_store of a vector?" ); |
3517 | assert(N->getOffset().isUndef() && "Unexpected VP strided store offset" ); |
3518 | |
3519 | SDLoc DL(N); |
3520 | |
3521 | SDValue Data = N->getValue(); |
3522 | SDValue LoData, HiData; |
3523 | if (getTypeAction(VT: Data.getValueType()) == TargetLowering::TypeSplitVector) |
3524 | GetSplitVector(Op: Data, Lo&: LoData, Hi&: HiData); |
3525 | else |
3526 | std::tie(args&: LoData, args&: HiData) = DAG.SplitVector(N: Data, DL); |
3527 | |
3528 | EVT LoMemVT, HiMemVT; |
3529 | bool HiIsEmpty = false; |
3530 | std::tie(args&: LoMemVT, args&: HiMemVT) = DAG.GetDependentSplitDestVTs( |
3531 | VT: N->getMemoryVT(), EnvVT: LoData.getValueType(), HiIsEmpty: &HiIsEmpty); |
3532 | |
3533 | SDValue Mask = N->getMask(); |
3534 | SDValue LoMask, HiMask; |
3535 | if (OpNo == 1 && Mask.getOpcode() == ISD::SETCC) |
3536 | SplitVecRes_SETCC(N: Mask.getNode(), Lo&: LoMask, Hi&: HiMask); |
3537 | else if (getTypeAction(VT: Mask.getValueType()) == |
3538 | TargetLowering::TypeSplitVector) |
3539 | GetSplitVector(Op: Mask, Lo&: LoMask, Hi&: HiMask); |
3540 | else |
3541 | std::tie(args&: LoMask, args&: HiMask) = DAG.SplitVector(N: Mask, DL); |
3542 | |
3543 | SDValue LoEVL, HiEVL; |
3544 | std::tie(args&: LoEVL, args&: HiEVL) = |
3545 | DAG.SplitEVL(N: N->getVectorLength(), VecVT: Data.getValueType(), DL); |
3546 | |
3547 | // Generate the low vp_strided_store |
3548 | SDValue Lo = DAG.getStridedStoreVP( |
3549 | Chain: N->getChain(), DL, Val: LoData, Ptr: N->getBasePtr(), Offset: N->getOffset(), |
3550 | Stride: N->getStride(), Mask: LoMask, EVL: LoEVL, MemVT: LoMemVT, MMO: N->getMemOperand(), |
3551 | AM: N->getAddressingMode(), IsTruncating: N->isTruncatingStore(), IsCompressing: N->isCompressingStore()); |
3552 | |
3553 | // If the high vp_strided_store has zero storage size, only the low |
3554 | // vp_strided_store is needed. |
3555 | if (HiIsEmpty) |
3556 | return Lo; |
3557 | |
3558 | // Generate the high vp_strided_store. |
3559 | // To calculate the high base address, we need to sum to the low base |
3560 | // address stride number of bytes for each element already stored by low, |
3561 | // that is: Ptr = Ptr + (LoEVL * Stride) |
3562 | EVT PtrVT = N->getBasePtr().getValueType(); |
3563 | SDValue Increment = |
3564 | DAG.getNode(Opcode: ISD::MUL, DL, VT: PtrVT, N1: LoEVL, |
3565 | N2: DAG.getSExtOrTrunc(Op: N->getStride(), DL, VT: PtrVT)); |
3566 | SDValue Ptr = DAG.getNode(Opcode: ISD::ADD, DL, VT: PtrVT, N1: N->getBasePtr(), N2: Increment); |
3567 | |
3568 | Align Alignment = N->getOriginalAlign(); |
3569 | if (LoMemVT.isScalableVector()) |
3570 | Alignment = commonAlignment(A: Alignment, |
3571 | Offset: LoMemVT.getSizeInBits().getKnownMinValue() / 8); |
3572 | |
3573 | MachineMemOperand *MMO = DAG.getMachineFunction().getMachineMemOperand( |
3574 | PtrInfo: MachinePointerInfo(N->getPointerInfo().getAddrSpace()), |
3575 | f: MachineMemOperand::MOStore, s: MemoryLocation::UnknownSize, base_alignment: Alignment, |
3576 | AAInfo: N->getAAInfo(), Ranges: N->getRanges()); |
3577 | |
3578 | SDValue Hi = DAG.getStridedStoreVP( |
3579 | Chain: N->getChain(), DL, Val: HiData, Ptr, Offset: N->getOffset(), Stride: N->getStride(), Mask: HiMask, |
3580 | EVL: HiEVL, MemVT: HiMemVT, MMO, AM: N->getAddressingMode(), IsTruncating: N->isTruncatingStore(), |
3581 | IsCompressing: N->isCompressingStore()); |
3582 | |
3583 | // Build a factor node to remember that this store is independent of the |
3584 | // other one. |
3585 | return DAG.getNode(ISD::TokenFactor, DL, MVT::Other, Lo, Hi); |
3586 | } |
3587 | |
3588 | SDValue DAGTypeLegalizer::SplitVecOp_MSTORE(MaskedStoreSDNode *N, |
3589 | unsigned OpNo) { |
3590 | assert(N->isUnindexed() && "Indexed masked store of vector?" ); |
3591 | SDValue Ch = N->getChain(); |
3592 | SDValue Ptr = N->getBasePtr(); |
3593 | SDValue Offset = N->getOffset(); |
3594 | assert(Offset.isUndef() && "Unexpected indexed masked store offset" ); |
3595 | SDValue Mask = N->getMask(); |
3596 | SDValue Data = N->getValue(); |
3597 | Align Alignment = N->getOriginalAlign(); |
3598 | SDLoc DL(N); |
3599 | |
3600 | SDValue DataLo, DataHi; |
3601 | if (getTypeAction(VT: Data.getValueType()) == TargetLowering::TypeSplitVector) |
3602 | // Split Data operand |
3603 | GetSplitVector(Op: Data, Lo&: DataLo, Hi&: DataHi); |
3604 | else |
3605 | std::tie(args&: DataLo, args&: DataHi) = DAG.SplitVector(N: Data, DL); |
3606 | |
3607 | // Split Mask operand |
3608 | SDValue MaskLo, MaskHi; |
3609 | if (OpNo == 1 && Mask.getOpcode() == ISD::SETCC) { |
3610 | SplitVecRes_SETCC(N: Mask.getNode(), Lo&: MaskLo, Hi&: MaskHi); |
3611 | } else { |
3612 | if (getTypeAction(VT: Mask.getValueType()) == TargetLowering::TypeSplitVector) |
3613 | GetSplitVector(Op: Mask, Lo&: MaskLo, Hi&: MaskHi); |
3614 | else |
3615 | std::tie(args&: MaskLo, args&: MaskHi) = DAG.SplitVector(N: Mask, DL); |
3616 | } |
3617 | |
3618 | EVT MemoryVT = N->getMemoryVT(); |
3619 | EVT LoMemVT, HiMemVT; |
3620 | bool HiIsEmpty = false; |
3621 | std::tie(args&: LoMemVT, args&: HiMemVT) = |
3622 | DAG.GetDependentSplitDestVTs(VT: MemoryVT, EnvVT: DataLo.getValueType(), HiIsEmpty: &HiIsEmpty); |
3623 | |
3624 | SDValue Lo, Hi, Res; |
3625 | MachineMemOperand *MMO = DAG.getMachineFunction().getMachineMemOperand( |
3626 | PtrInfo: N->getPointerInfo(), f: MachineMemOperand::MOStore, |
3627 | s: MemoryLocation::UnknownSize, base_alignment: Alignment, AAInfo: N->getAAInfo(), Ranges: N->getRanges()); |
3628 | |
3629 | Lo = DAG.getMaskedStore(Chain: Ch, dl: DL, Val: DataLo, Base: Ptr, Offset, Mask: MaskLo, MemVT: LoMemVT, MMO, |
3630 | AM: N->getAddressingMode(), IsTruncating: N->isTruncatingStore(), |
3631 | IsCompressing: N->isCompressingStore()); |
3632 | |
3633 | if (HiIsEmpty) { |
3634 | // The hi masked store has zero storage size. |
3635 | // Only the lo masked store is needed. |
3636 | Res = Lo; |
3637 | } else { |
3638 | |
3639 | Ptr = TLI.IncrementMemoryAddress(Addr: Ptr, Mask: MaskLo, DL, DataVT: LoMemVT, DAG, |
3640 | IsCompressedMemory: N->isCompressingStore()); |
3641 | |
3642 | MachinePointerInfo MPI; |
3643 | if (LoMemVT.isScalableVector()) { |
3644 | Alignment = commonAlignment( |
3645 | A: Alignment, Offset: LoMemVT.getSizeInBits().getKnownMinValue() / 8); |
3646 | MPI = MachinePointerInfo(N->getPointerInfo().getAddrSpace()); |
3647 | } else |
3648 | MPI = N->getPointerInfo().getWithOffset( |
3649 | O: LoMemVT.getStoreSize().getFixedValue()); |
3650 | |
3651 | MMO = DAG.getMachineFunction().getMachineMemOperand( |
3652 | PtrInfo: MPI, f: MachineMemOperand::MOStore, s: MemoryLocation::UnknownSize, base_alignment: Alignment, |
3653 | AAInfo: N->getAAInfo(), Ranges: N->getRanges()); |
3654 | |
3655 | Hi = DAG.getMaskedStore(Chain: Ch, dl: DL, Val: DataHi, Base: Ptr, Offset, Mask: MaskHi, MemVT: HiMemVT, MMO, |
3656 | AM: N->getAddressingMode(), IsTruncating: N->isTruncatingStore(), |
3657 | IsCompressing: N->isCompressingStore()); |
3658 | |
3659 | // Build a factor node to remember that this store is independent of the |
3660 | // other one. |
3661 | Res = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, Lo, Hi); |
3662 | } |
3663 | |
3664 | return Res; |
3665 | } |
3666 | |
3667 | SDValue DAGTypeLegalizer::SplitVecOp_Scatter(MemSDNode *N, unsigned OpNo) { |
3668 | SDValue Ch = N->getChain(); |
3669 | SDValue Ptr = N->getBasePtr(); |
3670 | EVT MemoryVT = N->getMemoryVT(); |
3671 | Align Alignment = N->getOriginalAlign(); |
3672 | SDLoc DL(N); |
3673 | struct Operands { |
3674 | SDValue Mask; |
3675 | SDValue Index; |
3676 | SDValue Scale; |
3677 | SDValue Data; |
3678 | } Ops = [&]() -> Operands { |
3679 | if (auto *MSC = dyn_cast<MaskedScatterSDNode>(Val: N)) { |
3680 | return {.Mask: MSC->getMask(), .Index: MSC->getIndex(), .Scale: MSC->getScale(), |
3681 | .Data: MSC->getValue()}; |
3682 | } |
3683 | auto *VPSC = cast<VPScatterSDNode>(Val: N); |
3684 | return {.Mask: VPSC->getMask(), .Index: VPSC->getIndex(), .Scale: VPSC->getScale(), |
3685 | .Data: VPSC->getValue()}; |
3686 | }(); |
3687 | // Split all operands |
3688 | |
3689 | EVT LoMemVT, HiMemVT; |
3690 | std::tie(args&: LoMemVT, args&: HiMemVT) = DAG.GetSplitDestVTs(VT: MemoryVT); |
3691 | |
3692 | SDValue DataLo, DataHi; |
3693 | if (getTypeAction(VT: Ops.Data.getValueType()) == TargetLowering::TypeSplitVector) |
3694 | // Split Data operand |
3695 | GetSplitVector(Op: Ops.Data, Lo&: DataLo, Hi&: DataHi); |
3696 | else |
3697 | std::tie(args&: DataLo, args&: DataHi) = DAG.SplitVector(N: Ops.Data, DL); |
3698 | |
3699 | // Split Mask operand |
3700 | SDValue MaskLo, MaskHi; |
3701 | if (OpNo == 1 && Ops.Mask.getOpcode() == ISD::SETCC) { |
3702 | SplitVecRes_SETCC(N: Ops.Mask.getNode(), Lo&: MaskLo, Hi&: MaskHi); |
3703 | } else { |
3704 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: Ops.Mask, DL); |
3705 | } |
3706 | |
3707 | SDValue IndexHi, IndexLo; |
3708 | if (getTypeAction(VT: Ops.Index.getValueType()) == |
3709 | TargetLowering::TypeSplitVector) |
3710 | GetSplitVector(Op: Ops.Index, Lo&: IndexLo, Hi&: IndexHi); |
3711 | else |
3712 | std::tie(args&: IndexLo, args&: IndexHi) = DAG.SplitVector(N: Ops.Index, DL); |
3713 | |
3714 | SDValue Lo; |
3715 | MachineMemOperand *MMO = DAG.getMachineFunction().getMachineMemOperand( |
3716 | PtrInfo: N->getPointerInfo(), f: MachineMemOperand::MOStore, |
3717 | s: MemoryLocation::UnknownSize, base_alignment: Alignment, AAInfo: N->getAAInfo(), Ranges: N->getRanges()); |
3718 | |
3719 | if (auto *MSC = dyn_cast<MaskedScatterSDNode>(Val: N)) { |
3720 | SDValue OpsLo[] = {Ch, DataLo, MaskLo, Ptr, IndexLo, Ops.Scale}; |
3721 | Lo = |
3722 | DAG.getMaskedScatter(VTs: DAG.getVTList(MVT::Other), MemVT: LoMemVT, dl: DL, Ops: OpsLo, MMO, |
3723 | IndexType: MSC->getIndexType(), IsTruncating: MSC->isTruncatingStore()); |
3724 | |
3725 | // The order of the Scatter operation after split is well defined. The "Hi" |
3726 | // part comes after the "Lo". So these two operations should be chained one |
3727 | // after another. |
3728 | SDValue OpsHi[] = {Lo, DataHi, MaskHi, Ptr, IndexHi, Ops.Scale}; |
3729 | return DAG.getMaskedScatter(VTs: DAG.getVTList(MVT::Other), MemVT: HiMemVT, dl: DL, Ops: OpsHi, |
3730 | MMO, IndexType: MSC->getIndexType(), |
3731 | IsTruncating: MSC->isTruncatingStore()); |
3732 | } |
3733 | auto *VPSC = cast<VPScatterSDNode>(Val: N); |
3734 | SDValue EVLLo, EVLHi; |
3735 | std::tie(args&: EVLLo, args&: EVLHi) = |
3736 | DAG.SplitEVL(N: VPSC->getVectorLength(), VecVT: Ops.Data.getValueType(), DL); |
3737 | |
3738 | SDValue OpsLo[] = {Ch, DataLo, Ptr, IndexLo, Ops.Scale, MaskLo, EVLLo}; |
3739 | Lo = DAG.getScatterVP(VTs: DAG.getVTList(MVT::Other), VT: LoMemVT, dl: DL, Ops: OpsLo, MMO, |
3740 | IndexType: VPSC->getIndexType()); |
3741 | |
3742 | // The order of the Scatter operation after split is well defined. The "Hi" |
3743 | // part comes after the "Lo". So these two operations should be chained one |
3744 | // after another. |
3745 | SDValue OpsHi[] = {Lo, DataHi, Ptr, IndexHi, Ops.Scale, MaskHi, EVLHi}; |
3746 | return DAG.getScatterVP(VTs: DAG.getVTList(MVT::Other), VT: HiMemVT, dl: DL, Ops: OpsHi, MMO, |
3747 | IndexType: VPSC->getIndexType()); |
3748 | } |
3749 | |
3750 | SDValue DAGTypeLegalizer::SplitVecOp_STORE(StoreSDNode *N, unsigned OpNo) { |
3751 | assert(N->isUnindexed() && "Indexed store of vector?" ); |
3752 | assert(OpNo == 1 && "Can only split the stored value" ); |
3753 | SDLoc DL(N); |
3754 | |
3755 | bool isTruncating = N->isTruncatingStore(); |
3756 | SDValue Ch = N->getChain(); |
3757 | SDValue Ptr = N->getBasePtr(); |
3758 | EVT MemoryVT = N->getMemoryVT(); |
3759 | Align Alignment = N->getOriginalAlign(); |
3760 | MachineMemOperand::Flags MMOFlags = N->getMemOperand()->getFlags(); |
3761 | AAMDNodes AAInfo = N->getAAInfo(); |
3762 | SDValue Lo, Hi; |
3763 | GetSplitVector(Op: N->getOperand(Num: 1), Lo, Hi); |
3764 | |
3765 | EVT LoMemVT, HiMemVT; |
3766 | std::tie(args&: LoMemVT, args&: HiMemVT) = DAG.GetSplitDestVTs(VT: MemoryVT); |
3767 | |
3768 | // Scalarize if the split halves are not byte-sized. |
3769 | if (!LoMemVT.isByteSized() || !HiMemVT.isByteSized()) |
3770 | return TLI.scalarizeVectorStore(ST: N, DAG); |
3771 | |
3772 | if (isTruncating) |
3773 | Lo = DAG.getTruncStore(Chain: Ch, dl: DL, Val: Lo, Ptr, PtrInfo: N->getPointerInfo(), SVT: LoMemVT, |
3774 | Alignment, MMOFlags, AAInfo); |
3775 | else |
3776 | Lo = DAG.getStore(Chain: Ch, dl: DL, Val: Lo, Ptr, PtrInfo: N->getPointerInfo(), Alignment, MMOFlags, |
3777 | AAInfo); |
3778 | |
3779 | MachinePointerInfo MPI; |
3780 | IncrementPointer(N, MemVT: LoMemVT, MPI, Ptr); |
3781 | |
3782 | if (isTruncating) |
3783 | Hi = DAG.getTruncStore(Chain: Ch, dl: DL, Val: Hi, Ptr, PtrInfo: MPI, |
3784 | SVT: HiMemVT, Alignment, MMOFlags, AAInfo); |
3785 | else |
3786 | Hi = DAG.getStore(Chain: Ch, dl: DL, Val: Hi, Ptr, PtrInfo: MPI, Alignment, MMOFlags, AAInfo); |
3787 | |
3788 | return DAG.getNode(ISD::TokenFactor, DL, MVT::Other, Lo, Hi); |
3789 | } |
3790 | |
3791 | SDValue DAGTypeLegalizer::SplitVecOp_CONCAT_VECTORS(SDNode *N) { |
3792 | SDLoc DL(N); |
3793 | |
3794 | // The input operands all must have the same type, and we know the result |
3795 | // type is valid. Convert this to a buildvector which extracts all the |
3796 | // input elements. |
3797 | // TODO: If the input elements are power-two vectors, we could convert this to |
3798 | // a new CONCAT_VECTORS node with elements that are half-wide. |
3799 | SmallVector<SDValue, 32> Elts; |
3800 | EVT EltVT = N->getValueType(ResNo: 0).getVectorElementType(); |
3801 | for (const SDValue &Op : N->op_values()) { |
3802 | for (unsigned i = 0, e = Op.getValueType().getVectorNumElements(); |
3803 | i != e; ++i) { |
3804 | Elts.push_back(Elt: DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT: EltVT, N1: Op, |
3805 | N2: DAG.getVectorIdxConstant(Val: i, DL))); |
3806 | } |
3807 | } |
3808 | |
3809 | return DAG.getBuildVector(VT: N->getValueType(ResNo: 0), DL, Ops: Elts); |
3810 | } |
3811 | |
3812 | SDValue DAGTypeLegalizer::SplitVecOp_TruncateHelper(SDNode *N) { |
3813 | // The result type is legal, but the input type is illegal. If splitting |
3814 | // ends up with the result type of each half still being legal, just |
3815 | // do that. If, however, that would result in an illegal result type, |
3816 | // we can try to get more clever with power-two vectors. Specifically, |
3817 | // split the input type, but also widen the result element size, then |
3818 | // concatenate the halves and truncate again. For example, consider a target |
3819 | // where v8i8 is legal and v8i32 is not (ARM, which doesn't have 256-bit |
3820 | // vectors). To perform a "%res = v8i8 trunc v8i32 %in" we do: |
3821 | // %inlo = v4i32 extract_subvector %in, 0 |
3822 | // %inhi = v4i32 extract_subvector %in, 4 |
3823 | // %lo16 = v4i16 trunc v4i32 %inlo |
3824 | // %hi16 = v4i16 trunc v4i32 %inhi |
3825 | // %in16 = v8i16 concat_vectors v4i16 %lo16, v4i16 %hi16 |
3826 | // %res = v8i8 trunc v8i16 %in16 |
3827 | // |
3828 | // Without this transform, the original truncate would end up being |
3829 | // scalarized, which is pretty much always a last resort. |
3830 | unsigned OpNo = N->isStrictFPOpcode() ? 1 : 0; |
3831 | SDValue InVec = N->getOperand(Num: OpNo); |
3832 | EVT InVT = InVec->getValueType(ResNo: 0); |
3833 | EVT OutVT = N->getValueType(ResNo: 0); |
3834 | ElementCount NumElements = OutVT.getVectorElementCount(); |
3835 | bool IsFloat = OutVT.isFloatingPoint(); |
3836 | |
3837 | unsigned InElementSize = InVT.getScalarSizeInBits(); |
3838 | unsigned OutElementSize = OutVT.getScalarSizeInBits(); |
3839 | |
3840 | // Determine the split output VT. If its legal we can just split dirctly. |
3841 | EVT LoOutVT, HiOutVT; |
3842 | std::tie(args&: LoOutVT, args&: HiOutVT) = DAG.GetSplitDestVTs(VT: OutVT); |
3843 | assert(LoOutVT == HiOutVT && "Unequal split?" ); |
3844 | |
3845 | // If the input elements are only 1/2 the width of the result elements, |
3846 | // just use the normal splitting. Our trick only work if there's room |
3847 | // to split more than once. |
3848 | if (isTypeLegal(VT: LoOutVT) || |
3849 | InElementSize <= OutElementSize * 2) |
3850 | return SplitVecOp_UnaryOp(N); |
3851 | SDLoc DL(N); |
3852 | |
3853 | // Don't touch if this will be scalarized. |
3854 | EVT FinalVT = InVT; |
3855 | while (getTypeAction(VT: FinalVT) == TargetLowering::TypeSplitVector) |
3856 | FinalVT = FinalVT.getHalfNumVectorElementsVT(Context&: *DAG.getContext()); |
3857 | |
3858 | if (getTypeAction(VT: FinalVT) == TargetLowering::TypeScalarizeVector) |
3859 | return SplitVecOp_UnaryOp(N); |
3860 | |
3861 | // Get the split input vector. |
3862 | SDValue InLoVec, InHiVec; |
3863 | GetSplitVector(Op: InVec, Lo&: InLoVec, Hi&: InHiVec); |
3864 | |
3865 | // Truncate them to 1/2 the element size. |
3866 | // |
3867 | // This assumes the number of elements is a power of two; any vector that |
3868 | // isn't should be widened, not split. |
3869 | EVT HalfElementVT = IsFloat ? |
3870 | EVT::getFloatingPointVT(BitWidth: InElementSize/2) : |
3871 | EVT::getIntegerVT(Context&: *DAG.getContext(), BitWidth: InElementSize/2); |
3872 | EVT HalfVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: HalfElementVT, |
3873 | EC: NumElements.divideCoefficientBy(RHS: 2)); |
3874 | |
3875 | SDValue HalfLo; |
3876 | SDValue HalfHi; |
3877 | SDValue Chain; |
3878 | if (N->isStrictFPOpcode()) { |
3879 | HalfLo = DAG.getNode(N->getOpcode(), DL, {HalfVT, MVT::Other}, |
3880 | {N->getOperand(0), InLoVec}); |
3881 | HalfHi = DAG.getNode(N->getOpcode(), DL, {HalfVT, MVT::Other}, |
3882 | {N->getOperand(0), InHiVec}); |
3883 | // Legalize the chain result - switch anything that used the old chain to |
3884 | // use the new one. |
3885 | Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, HalfLo.getValue(R: 1), |
3886 | HalfHi.getValue(R: 1)); |
3887 | } else { |
3888 | HalfLo = DAG.getNode(Opcode: N->getOpcode(), DL, VT: HalfVT, Operand: InLoVec); |
3889 | HalfHi = DAG.getNode(Opcode: N->getOpcode(), DL, VT: HalfVT, Operand: InHiVec); |
3890 | } |
3891 | |
3892 | // Concatenate them to get the full intermediate truncation result. |
3893 | EVT InterVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: HalfElementVT, EC: NumElements); |
3894 | SDValue InterVec = DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL, VT: InterVT, N1: HalfLo, |
3895 | N2: HalfHi); |
3896 | // Now finish up by truncating all the way down to the original result |
3897 | // type. This should normally be something that ends up being legal directly, |
3898 | // but in theory if a target has very wide vectors and an annoyingly |
3899 | // restricted set of legal types, this split can chain to build things up. |
3900 | |
3901 | if (N->isStrictFPOpcode()) { |
3902 | SDValue Res = DAG.getNode( |
3903 | ISD::STRICT_FP_ROUND, DL, {OutVT, MVT::Other}, |
3904 | {Chain, InterVec, |
3905 | DAG.getTargetConstant(0, DL, TLI.getPointerTy(DAG.getDataLayout()))}); |
3906 | // Relink the chain |
3907 | ReplaceValueWith(From: SDValue(N, 1), To: SDValue(Res.getNode(), 1)); |
3908 | return Res; |
3909 | } |
3910 | |
3911 | return IsFloat |
3912 | ? DAG.getNode(Opcode: ISD::FP_ROUND, DL, VT: OutVT, N1: InterVec, |
3913 | N2: DAG.getTargetConstant( |
3914 | Val: 0, DL, VT: TLI.getPointerTy(DL: DAG.getDataLayout()))) |
3915 | : DAG.getNode(Opcode: ISD::TRUNCATE, DL, VT: OutVT, Operand: InterVec); |
3916 | } |
3917 | |
3918 | SDValue DAGTypeLegalizer::SplitVecOp_VSETCC(SDNode *N) { |
3919 | assert(N->getValueType(0).isVector() && |
3920 | N->getOperand(0).getValueType().isVector() && |
3921 | "Operand types must be vectors" ); |
3922 | // The result has a legal vector type, but the input needs splitting. |
3923 | SDValue Lo0, Hi0, Lo1, Hi1, LoRes, HiRes; |
3924 | SDLoc DL(N); |
3925 | GetSplitVector(Op: N->getOperand(Num: 0), Lo&: Lo0, Hi&: Hi0); |
3926 | GetSplitVector(Op: N->getOperand(Num: 1), Lo&: Lo1, Hi&: Hi1); |
3927 | auto PartEltCnt = Lo0.getValueType().getVectorElementCount(); |
3928 | |
3929 | LLVMContext &Context = *DAG.getContext(); |
3930 | EVT PartResVT = EVT::getVectorVT(Context, MVT::i1, PartEltCnt); |
3931 | EVT WideResVT = EVT::getVectorVT(Context, MVT::i1, PartEltCnt*2); |
3932 | |
3933 | if (N->getOpcode() == ISD::SETCC) { |
3934 | LoRes = DAG.getNode(Opcode: ISD::SETCC, DL, VT: PartResVT, N1: Lo0, N2: Lo1, N3: N->getOperand(Num: 2)); |
3935 | HiRes = DAG.getNode(Opcode: ISD::SETCC, DL, VT: PartResVT, N1: Hi0, N2: Hi1, N3: N->getOperand(Num: 2)); |
3936 | } else { |
3937 | assert(N->getOpcode() == ISD::VP_SETCC && "Expected VP_SETCC opcode" ); |
3938 | SDValue MaskLo, MaskHi, EVLLo, EVLHi; |
3939 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: N->getOperand(Num: 3)); |
3940 | std::tie(args&: EVLLo, args&: EVLHi) = |
3941 | DAG.SplitEVL(N: N->getOperand(Num: 4), VecVT: N->getValueType(ResNo: 0), DL); |
3942 | LoRes = DAG.getNode(Opcode: ISD::VP_SETCC, DL, VT: PartResVT, N1: Lo0, N2: Lo1, |
3943 | N3: N->getOperand(Num: 2), N4: MaskLo, N5: EVLLo); |
3944 | HiRes = DAG.getNode(Opcode: ISD::VP_SETCC, DL, VT: PartResVT, N1: Hi0, N2: Hi1, |
3945 | N3: N->getOperand(Num: 2), N4: MaskHi, N5: EVLHi); |
3946 | } |
3947 | SDValue Con = DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL, VT: WideResVT, N1: LoRes, N2: HiRes); |
3948 | |
3949 | EVT OpVT = N->getOperand(Num: 0).getValueType(); |
3950 | ISD::NodeType ExtendCode = |
3951 | TargetLowering::getExtendForContent(Content: TLI.getBooleanContents(Type: OpVT)); |
3952 | return DAG.getNode(Opcode: ExtendCode, DL, VT: N->getValueType(ResNo: 0), Operand: Con); |
3953 | } |
3954 | |
3955 | |
3956 | SDValue DAGTypeLegalizer::SplitVecOp_FP_ROUND(SDNode *N) { |
3957 | // The result has a legal vector type, but the input needs splitting. |
3958 | EVT ResVT = N->getValueType(ResNo: 0); |
3959 | SDValue Lo, Hi; |
3960 | SDLoc DL(N); |
3961 | GetSplitVector(Op: N->getOperand(Num: N->isStrictFPOpcode() ? 1 : 0), Lo, Hi); |
3962 | EVT InVT = Lo.getValueType(); |
3963 | |
3964 | EVT OutVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: ResVT.getVectorElementType(), |
3965 | EC: InVT.getVectorElementCount()); |
3966 | |
3967 | if (N->isStrictFPOpcode()) { |
3968 | Lo = DAG.getNode(N->getOpcode(), DL, { OutVT, MVT::Other }, |
3969 | { N->getOperand(0), Lo, N->getOperand(2) }); |
3970 | Hi = DAG.getNode(N->getOpcode(), DL, { OutVT, MVT::Other }, |
3971 | { N->getOperand(0), Hi, N->getOperand(2) }); |
3972 | // Legalize the chain result - switch anything that used the old chain to |
3973 | // use the new one. |
3974 | SDValue NewChain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, |
3975 | Lo.getValue(1), Hi.getValue(1)); |
3976 | ReplaceValueWith(From: SDValue(N, 1), To: NewChain); |
3977 | } else if (N->getOpcode() == ISD::VP_FP_ROUND) { |
3978 | SDValue MaskLo, MaskHi, EVLLo, EVLHi; |
3979 | std::tie(args&: MaskLo, args&: MaskHi) = SplitMask(Mask: N->getOperand(Num: 1)); |
3980 | std::tie(args&: EVLLo, args&: EVLHi) = |
3981 | DAG.SplitEVL(N: N->getOperand(Num: 2), VecVT: N->getValueType(ResNo: 0), DL); |
3982 | Lo = DAG.getNode(Opcode: ISD::VP_FP_ROUND, DL, VT: OutVT, N1: Lo, N2: MaskLo, N3: EVLLo); |
3983 | Hi = DAG.getNode(Opcode: ISD::VP_FP_ROUND, DL, VT: OutVT, N1: Hi, N2: MaskHi, N3: EVLHi); |
3984 | } else { |
3985 | Lo = DAG.getNode(Opcode: ISD::FP_ROUND, DL, VT: OutVT, N1: Lo, N2: N->getOperand(Num: 1)); |
3986 | Hi = DAG.getNode(Opcode: ISD::FP_ROUND, DL, VT: OutVT, N1: Hi, N2: N->getOperand(Num: 1)); |
3987 | } |
3988 | |
3989 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL, VT: ResVT, N1: Lo, N2: Hi); |
3990 | } |
3991 | |
3992 | // Split a vector type in an FP binary operation where the second operand has a |
3993 | // different type from the first. |
3994 | // |
3995 | // The result (and the first input) has a legal vector type, but the second |
3996 | // input needs splitting. |
3997 | SDValue DAGTypeLegalizer::SplitVecOp_FPOpDifferentTypes(SDNode *N) { |
3998 | SDLoc DL(N); |
3999 | |
4000 | EVT LHSLoVT, LHSHiVT; |
4001 | std::tie(args&: LHSLoVT, args&: LHSHiVT) = DAG.GetSplitDestVTs(VT: N->getValueType(ResNo: 0)); |
4002 | |
4003 | if (!isTypeLegal(VT: LHSLoVT) || !isTypeLegal(VT: LHSHiVT)) |
4004 | return DAG.UnrollVectorOp(N, ResNE: N->getValueType(ResNo: 0).getVectorNumElements()); |
4005 | |
4006 | SDValue LHSLo, LHSHi; |
4007 | std::tie(args&: LHSLo, args&: LHSHi) = |
4008 | DAG.SplitVector(N: N->getOperand(Num: 0), DL, LoVT: LHSLoVT, HiVT: LHSHiVT); |
4009 | |
4010 | SDValue RHSLo, RHSHi; |
4011 | std::tie(args&: RHSLo, args&: RHSHi) = DAG.SplitVector(N: N->getOperand(Num: 1), DL); |
4012 | |
4013 | SDValue Lo = DAG.getNode(Opcode: N->getOpcode(), DL, VT: LHSLoVT, N1: LHSLo, N2: RHSLo); |
4014 | SDValue Hi = DAG.getNode(Opcode: N->getOpcode(), DL, VT: LHSHiVT, N1: LHSHi, N2: RHSHi); |
4015 | |
4016 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL, VT: N->getValueType(ResNo: 0), N1: Lo, N2: Hi); |
4017 | } |
4018 | |
4019 | SDValue DAGTypeLegalizer::SplitVecOp_FP_TO_XINT_SAT(SDNode *N) { |
4020 | EVT ResVT = N->getValueType(ResNo: 0); |
4021 | SDValue Lo, Hi; |
4022 | SDLoc dl(N); |
4023 | GetSplitVector(Op: N->getOperand(Num: 0), Lo, Hi); |
4024 | EVT InVT = Lo.getValueType(); |
4025 | |
4026 | EVT NewResVT = |
4027 | EVT::getVectorVT(Context&: *DAG.getContext(), VT: ResVT.getVectorElementType(), |
4028 | EC: InVT.getVectorElementCount()); |
4029 | |
4030 | Lo = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: NewResVT, N1: Lo, N2: N->getOperand(Num: 1)); |
4031 | Hi = DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: NewResVT, N1: Hi, N2: N->getOperand(Num: 1)); |
4032 | |
4033 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: ResVT, N1: Lo, N2: Hi); |
4034 | } |
4035 | |
4036 | //===----------------------------------------------------------------------===// |
4037 | // Result Vector Widening |
4038 | //===----------------------------------------------------------------------===// |
4039 | |
4040 | void DAGTypeLegalizer::WidenVectorResult(SDNode *N, unsigned ResNo) { |
4041 | LLVM_DEBUG(dbgs() << "Widen node result " << ResNo << ": " ; N->dump(&DAG)); |
4042 | |
4043 | // See if the target wants to custom widen this node. |
4044 | if (CustomWidenLowerNode(N, VT: N->getValueType(ResNo))) |
4045 | return; |
4046 | |
4047 | SDValue Res = SDValue(); |
4048 | |
4049 | auto unrollExpandedOp = [&]() { |
4050 | // We're going to widen this vector op to a legal type by padding with undef |
4051 | // elements. If the wide vector op is eventually going to be expanded to |
4052 | // scalar libcalls, then unroll into scalar ops now to avoid unnecessary |
4053 | // libcalls on the undef elements. |
4054 | EVT VT = N->getValueType(ResNo: 0); |
4055 | EVT WideVecVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT); |
4056 | if (!TLI.isOperationLegalOrCustom(Op: N->getOpcode(), VT: WideVecVT) && |
4057 | TLI.isOperationExpand(Op: N->getOpcode(), VT: VT.getScalarType())) { |
4058 | Res = DAG.UnrollVectorOp(N, ResNE: WideVecVT.getVectorNumElements()); |
4059 | return true; |
4060 | } |
4061 | return false; |
4062 | }; |
4063 | |
4064 | switch (N->getOpcode()) { |
4065 | default: |
4066 | #ifndef NDEBUG |
4067 | dbgs() << "WidenVectorResult #" << ResNo << ": " ; |
4068 | N->dump(G: &DAG); |
4069 | dbgs() << "\n" ; |
4070 | #endif |
4071 | report_fatal_error(reason: "Do not know how to widen the result of this operator!" ); |
4072 | |
4073 | case ISD::MERGE_VALUES: Res = WidenVecRes_MERGE_VALUES(N, ResNo); break; |
4074 | case ISD::AssertZext: Res = WidenVecRes_AssertZext(N); break; |
4075 | case ISD::BITCAST: Res = WidenVecRes_BITCAST(N); break; |
4076 | case ISD::BUILD_VECTOR: Res = WidenVecRes_BUILD_VECTOR(N); break; |
4077 | case ISD::CONCAT_VECTORS: Res = WidenVecRes_CONCAT_VECTORS(N); break; |
4078 | case ISD::INSERT_SUBVECTOR: |
4079 | Res = WidenVecRes_INSERT_SUBVECTOR(N); |
4080 | break; |
4081 | case ISD::EXTRACT_SUBVECTOR: Res = WidenVecRes_EXTRACT_SUBVECTOR(N); break; |
4082 | case ISD::INSERT_VECTOR_ELT: Res = WidenVecRes_INSERT_VECTOR_ELT(N); break; |
4083 | case ISD::LOAD: Res = WidenVecRes_LOAD(N); break; |
4084 | case ISD::STEP_VECTOR: |
4085 | case ISD::SPLAT_VECTOR: |
4086 | case ISD::SCALAR_TO_VECTOR: |
4087 | Res = WidenVecRes_ScalarOp(N); |
4088 | break; |
4089 | case ISD::SIGN_EXTEND_INREG: Res = WidenVecRes_InregOp(N); break; |
4090 | case ISD::VSELECT: |
4091 | case ISD::SELECT: |
4092 | case ISD::VP_SELECT: |
4093 | case ISD::VP_MERGE: |
4094 | Res = WidenVecRes_Select(N); |
4095 | break; |
4096 | case ISD::SELECT_CC: Res = WidenVecRes_SELECT_CC(N); break; |
4097 | case ISD::VP_SETCC: |
4098 | case ISD::SETCC: Res = WidenVecRes_SETCC(N); break; |
4099 | case ISD::UNDEF: Res = WidenVecRes_UNDEF(N); break; |
4100 | case ISD::VECTOR_SHUFFLE: |
4101 | Res = WidenVecRes_VECTOR_SHUFFLE(N: cast<ShuffleVectorSDNode>(Val: N)); |
4102 | break; |
4103 | case ISD::VP_LOAD: |
4104 | Res = WidenVecRes_VP_LOAD(N: cast<VPLoadSDNode>(Val: N)); |
4105 | break; |
4106 | case ISD::EXPERIMENTAL_VP_STRIDED_LOAD: |
4107 | Res = WidenVecRes_VP_STRIDED_LOAD(N: cast<VPStridedLoadSDNode>(Val: N)); |
4108 | break; |
4109 | case ISD::MLOAD: |
4110 | Res = WidenVecRes_MLOAD(N: cast<MaskedLoadSDNode>(Val: N)); |
4111 | break; |
4112 | case ISD::MGATHER: |
4113 | Res = WidenVecRes_MGATHER(N: cast<MaskedGatherSDNode>(Val: N)); |
4114 | break; |
4115 | case ISD::VP_GATHER: |
4116 | Res = WidenVecRes_VP_GATHER(N: cast<VPGatherSDNode>(Val: N)); |
4117 | break; |
4118 | case ISD::VECTOR_REVERSE: |
4119 | Res = WidenVecRes_VECTOR_REVERSE(N); |
4120 | break; |
4121 | |
4122 | case ISD::ADD: case ISD::VP_ADD: |
4123 | case ISD::AND: case ISD::VP_AND: |
4124 | case ISD::MUL: case ISD::VP_MUL: |
4125 | case ISD::MULHS: |
4126 | case ISD::MULHU: |
4127 | case ISD::OR: case ISD::VP_OR: |
4128 | case ISD::SUB: case ISD::VP_SUB: |
4129 | case ISD::XOR: case ISD::VP_XOR: |
4130 | case ISD::SHL: case ISD::VP_SHL: |
4131 | case ISD::SRA: case ISD::VP_ASHR: |
4132 | case ISD::SRL: case ISD::VP_LSHR: |
4133 | case ISD::FMINNUM: case ISD::VP_FMINNUM: |
4134 | case ISD::FMAXNUM: case ISD::VP_FMAXNUM: |
4135 | case ISD::FMINIMUM: |
4136 | case ISD::VP_FMINIMUM: |
4137 | case ISD::FMAXIMUM: |
4138 | case ISD::VP_FMAXIMUM: |
4139 | case ISD::SMIN: case ISD::VP_SMIN: |
4140 | case ISD::SMAX: case ISD::VP_SMAX: |
4141 | case ISD::UMIN: case ISD::VP_UMIN: |
4142 | case ISD::UMAX: case ISD::VP_UMAX: |
4143 | case ISD::UADDSAT: |
4144 | case ISD::SADDSAT: |
4145 | case ISD::USUBSAT: |
4146 | case ISD::SSUBSAT: |
4147 | case ISD::SSHLSAT: |
4148 | case ISD::USHLSAT: |
4149 | case ISD::ROTL: |
4150 | case ISD::ROTR: |
4151 | case ISD::AVGFLOORS: |
4152 | case ISD::AVGFLOORU: |
4153 | case ISD::AVGCEILS: |
4154 | case ISD::AVGCEILU: |
4155 | // Vector-predicated binary op widening. Note that -- unlike the |
4156 | // unpredicated versions -- we don't have to worry about trapping on |
4157 | // operations like UDIV, FADD, etc., as we pass on the original vector |
4158 | // length parameter. This means the widened elements containing garbage |
4159 | // aren't active. |
4160 | case ISD::VP_SDIV: |
4161 | case ISD::VP_UDIV: |
4162 | case ISD::VP_SREM: |
4163 | case ISD::VP_UREM: |
4164 | case ISD::VP_FADD: |
4165 | case ISD::VP_FSUB: |
4166 | case ISD::VP_FMUL: |
4167 | case ISD::VP_FDIV: |
4168 | case ISD::VP_FREM: |
4169 | case ISD::VP_FCOPYSIGN: |
4170 | Res = WidenVecRes_Binary(N); |
4171 | break; |
4172 | |
4173 | case ISD::FPOW: |
4174 | case ISD::FREM: |
4175 | if (unrollExpandedOp()) |
4176 | break; |
4177 | // If the target has custom/legal support for the scalar FP intrinsic ops |
4178 | // (they are probably not destined to become libcalls), then widen those |
4179 | // like any other binary ops. |
4180 | [[fallthrough]]; |
4181 | |
4182 | case ISD::FADD: |
4183 | case ISD::FMUL: |
4184 | case ISD::FSUB: |
4185 | case ISD::FDIV: |
4186 | case ISD::SDIV: |
4187 | case ISD::UDIV: |
4188 | case ISD::SREM: |
4189 | case ISD::UREM: |
4190 | Res = WidenVecRes_BinaryCanTrap(N); |
4191 | break; |
4192 | |
4193 | case ISD::SMULFIX: |
4194 | case ISD::SMULFIXSAT: |
4195 | case ISD::UMULFIX: |
4196 | case ISD::UMULFIXSAT: |
4197 | // These are binary operations, but with an extra operand that shouldn't |
4198 | // be widened (the scale). |
4199 | Res = WidenVecRes_BinaryWithExtraScalarOp(N); |
4200 | break; |
4201 | |
4202 | #define DAG_INSTRUCTION(NAME, NARG, ROUND_MODE, INTRINSIC, DAGN) \ |
4203 | case ISD::STRICT_##DAGN: |
4204 | #include "llvm/IR/ConstrainedOps.def" |
4205 | Res = WidenVecRes_StrictFP(N); |
4206 | break; |
4207 | |
4208 | case ISD::UADDO: |
4209 | case ISD::SADDO: |
4210 | case ISD::USUBO: |
4211 | case ISD::SSUBO: |
4212 | case ISD::UMULO: |
4213 | case ISD::SMULO: |
4214 | Res = WidenVecRes_OverflowOp(N, ResNo); |
4215 | break; |
4216 | |
4217 | case ISD::FCOPYSIGN: |
4218 | Res = WidenVecRes_FCOPYSIGN(N); |
4219 | break; |
4220 | |
4221 | case ISD::IS_FPCLASS: |
4222 | Res = WidenVecRes_IS_FPCLASS(N); |
4223 | break; |
4224 | |
4225 | case ISD::FLDEXP: |
4226 | case ISD::FPOWI: |
4227 | if (!unrollExpandedOp()) |
4228 | Res = WidenVecRes_ExpOp(N); |
4229 | break; |
4230 | |
4231 | case ISD::ANY_EXTEND_VECTOR_INREG: |
4232 | case ISD::SIGN_EXTEND_VECTOR_INREG: |
4233 | case ISD::ZERO_EXTEND_VECTOR_INREG: |
4234 | Res = WidenVecRes_EXTEND_VECTOR_INREG(N); |
4235 | break; |
4236 | |
4237 | case ISD::ANY_EXTEND: |
4238 | case ISD::FP_EXTEND: |
4239 | case ISD::VP_FP_EXTEND: |
4240 | case ISD::FP_ROUND: |
4241 | case ISD::VP_FP_ROUND: |
4242 | case ISD::FP_TO_SINT: |
4243 | case ISD::VP_FP_TO_SINT: |
4244 | case ISD::FP_TO_UINT: |
4245 | case ISD::VP_FP_TO_UINT: |
4246 | case ISD::SIGN_EXTEND: |
4247 | case ISD::VP_SIGN_EXTEND: |
4248 | case ISD::SINT_TO_FP: |
4249 | case ISD::VP_SINT_TO_FP: |
4250 | case ISD::VP_TRUNCATE: |
4251 | case ISD::TRUNCATE: |
4252 | case ISD::UINT_TO_FP: |
4253 | case ISD::VP_UINT_TO_FP: |
4254 | case ISD::ZERO_EXTEND: |
4255 | case ISD::VP_ZERO_EXTEND: |
4256 | Res = WidenVecRes_Convert(N); |
4257 | break; |
4258 | |
4259 | case ISD::FP_TO_SINT_SAT: |
4260 | case ISD::FP_TO_UINT_SAT: |
4261 | Res = WidenVecRes_FP_TO_XINT_SAT(N); |
4262 | break; |
4263 | |
4264 | case ISD::LRINT: |
4265 | case ISD::LLRINT: |
4266 | Res = WidenVecRes_XRINT(N); |
4267 | break; |
4268 | |
4269 | case ISD::FABS: |
4270 | case ISD::FCEIL: |
4271 | case ISD::FCOS: |
4272 | case ISD::FEXP: |
4273 | case ISD::FEXP2: |
4274 | case ISD::FEXP10: |
4275 | case ISD::FFLOOR: |
4276 | case ISD::FLOG: |
4277 | case ISD::FLOG10: |
4278 | case ISD::FLOG2: |
4279 | case ISD::FNEARBYINT: |
4280 | case ISD::FRINT: |
4281 | case ISD::FROUND: |
4282 | case ISD::FROUNDEVEN: |
4283 | case ISD::FSIN: |
4284 | case ISD::FSQRT: |
4285 | case ISD::FTRUNC: |
4286 | if (unrollExpandedOp()) |
4287 | break; |
4288 | // If the target has custom/legal support for the scalar FP intrinsic ops |
4289 | // (they are probably not destined to become libcalls), then widen those |
4290 | // like any other unary ops. |
4291 | [[fallthrough]]; |
4292 | |
4293 | case ISD::ABS: |
4294 | case ISD::VP_ABS: |
4295 | case ISD::BITREVERSE: |
4296 | case ISD::VP_BITREVERSE: |
4297 | case ISD::BSWAP: |
4298 | case ISD::VP_BSWAP: |
4299 | case ISD::CTLZ: |
4300 | case ISD::VP_CTLZ: |
4301 | case ISD::CTLZ_ZERO_UNDEF: |
4302 | case ISD::VP_CTLZ_ZERO_UNDEF: |
4303 | case ISD::CTPOP: |
4304 | case ISD::VP_CTPOP: |
4305 | case ISD::CTTZ: |
4306 | case ISD::VP_CTTZ: |
4307 | case ISD::CTTZ_ZERO_UNDEF: |
4308 | case ISD::VP_CTTZ_ZERO_UNDEF: |
4309 | case ISD::FNEG: case ISD::VP_FNEG: |
4310 | case ISD::VP_FABS: |
4311 | case ISD::VP_SQRT: |
4312 | case ISD::VP_FCEIL: |
4313 | case ISD::VP_FFLOOR: |
4314 | case ISD::VP_FRINT: |
4315 | case ISD::VP_FNEARBYINT: |
4316 | case ISD::VP_FROUND: |
4317 | case ISD::VP_FROUNDEVEN: |
4318 | case ISD::VP_FROUNDTOZERO: |
4319 | case ISD::FREEZE: |
4320 | case ISD::ARITH_FENCE: |
4321 | case ISD::FCANONICALIZE: |
4322 | Res = WidenVecRes_Unary(N); |
4323 | break; |
4324 | case ISD::FMA: case ISD::VP_FMA: |
4325 | case ISD::FSHL: |
4326 | case ISD::VP_FSHL: |
4327 | case ISD::FSHR: |
4328 | case ISD::VP_FSHR: |
4329 | Res = WidenVecRes_Ternary(N); |
4330 | break; |
4331 | } |
4332 | |
4333 | // If Res is null, the sub-method took care of registering the result. |
4334 | if (Res.getNode()) |
4335 | SetWidenedVector(Op: SDValue(N, ResNo), Result: Res); |
4336 | } |
4337 | |
4338 | SDValue DAGTypeLegalizer::WidenVecRes_Ternary(SDNode *N) { |
4339 | // Ternary op widening. |
4340 | SDLoc dl(N); |
4341 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4342 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 0)); |
4343 | SDValue InOp2 = GetWidenedVector(Op: N->getOperand(Num: 1)); |
4344 | SDValue InOp3 = GetWidenedVector(Op: N->getOperand(Num: 2)); |
4345 | if (N->getNumOperands() == 3) |
4346 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: WidenVT, N1: InOp1, N2: InOp2, N3: InOp3); |
4347 | |
4348 | assert(N->getNumOperands() == 5 && "Unexpected number of operands!" ); |
4349 | assert(N->isVPOpcode() && "Expected VP opcode" ); |
4350 | |
4351 | SDValue Mask = |
4352 | GetWidenedMask(Mask: N->getOperand(Num: 3), EC: WidenVT.getVectorElementCount()); |
4353 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: WidenVT, |
4354 | Ops: {InOp1, InOp2, InOp3, Mask, N->getOperand(Num: 4)}); |
4355 | } |
4356 | |
4357 | SDValue DAGTypeLegalizer::WidenVecRes_Binary(SDNode *N) { |
4358 | // Binary op widening. |
4359 | SDLoc dl(N); |
4360 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4361 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 0)); |
4362 | SDValue InOp2 = GetWidenedVector(Op: N->getOperand(Num: 1)); |
4363 | if (N->getNumOperands() == 2) |
4364 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: WidenVT, N1: InOp1, N2: InOp2, |
4365 | Flags: N->getFlags()); |
4366 | |
4367 | assert(N->getNumOperands() == 4 && "Unexpected number of operands!" ); |
4368 | assert(N->isVPOpcode() && "Expected VP opcode" ); |
4369 | |
4370 | SDValue Mask = |
4371 | GetWidenedMask(Mask: N->getOperand(Num: 2), EC: WidenVT.getVectorElementCount()); |
4372 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: WidenVT, |
4373 | Ops: {InOp1, InOp2, Mask, N->getOperand(Num: 3)}, Flags: N->getFlags()); |
4374 | } |
4375 | |
4376 | SDValue DAGTypeLegalizer::(SDNode *N) { |
4377 | // Binary op widening, but with an extra operand that shouldn't be widened. |
4378 | SDLoc dl(N); |
4379 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4380 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 0)); |
4381 | SDValue InOp2 = GetWidenedVector(Op: N->getOperand(Num: 1)); |
4382 | SDValue InOp3 = N->getOperand(Num: 2); |
4383 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: WidenVT, N1: InOp1, N2: InOp2, N3: InOp3, |
4384 | Flags: N->getFlags()); |
4385 | } |
4386 | |
4387 | // Given a vector of operations that have been broken up to widen, see |
4388 | // if we can collect them together into the next widest legal VT. This |
4389 | // implementation is trap-safe. |
4390 | static SDValue CollectOpsToWiden(SelectionDAG &DAG, const TargetLowering &TLI, |
4391 | SmallVectorImpl<SDValue> &ConcatOps, |
4392 | unsigned ConcatEnd, EVT VT, EVT MaxVT, |
4393 | EVT WidenVT) { |
4394 | // Check to see if we have a single operation with the widen type. |
4395 | if (ConcatEnd == 1) { |
4396 | VT = ConcatOps[0].getValueType(); |
4397 | if (VT == WidenVT) |
4398 | return ConcatOps[0]; |
4399 | } |
4400 | |
4401 | SDLoc dl(ConcatOps[0]); |
4402 | EVT WidenEltVT = WidenVT.getVectorElementType(); |
4403 | |
4404 | // while (Some element of ConcatOps is not of type MaxVT) { |
4405 | // From the end of ConcatOps, collect elements of the same type and put |
4406 | // them into an op of the next larger supported type |
4407 | // } |
4408 | while (ConcatOps[ConcatEnd-1].getValueType() != MaxVT) { |
4409 | int Idx = ConcatEnd - 1; |
4410 | VT = ConcatOps[Idx--].getValueType(); |
4411 | while (Idx >= 0 && ConcatOps[Idx].getValueType() == VT) |
4412 | Idx--; |
4413 | |
4414 | int NextSize = VT.isVector() ? VT.getVectorNumElements() : 1; |
4415 | EVT NextVT; |
4416 | do { |
4417 | NextSize *= 2; |
4418 | NextVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: WidenEltVT, NumElements: NextSize); |
4419 | } while (!TLI.isTypeLegal(VT: NextVT)); |
4420 | |
4421 | if (!VT.isVector()) { |
4422 | // Scalar type, create an INSERT_VECTOR_ELEMENT of type NextVT |
4423 | SDValue VecOp = DAG.getUNDEF(VT: NextVT); |
4424 | unsigned NumToInsert = ConcatEnd - Idx - 1; |
4425 | for (unsigned i = 0, OpIdx = Idx+1; i < NumToInsert; i++, OpIdx++) { |
4426 | VecOp = DAG.getNode(Opcode: ISD::INSERT_VECTOR_ELT, DL: dl, VT: NextVT, N1: VecOp, |
4427 | N2: ConcatOps[OpIdx], N3: DAG.getVectorIdxConstant(Val: i, DL: dl)); |
4428 | } |
4429 | ConcatOps[Idx+1] = VecOp; |
4430 | ConcatEnd = Idx + 2; |
4431 | } else { |
4432 | // Vector type, create a CONCAT_VECTORS of type NextVT |
4433 | SDValue undefVec = DAG.getUNDEF(VT); |
4434 | unsigned OpsToConcat = NextSize/VT.getVectorNumElements(); |
4435 | SmallVector<SDValue, 16> SubConcatOps(OpsToConcat); |
4436 | unsigned RealVals = ConcatEnd - Idx - 1; |
4437 | unsigned SubConcatEnd = 0; |
4438 | unsigned SubConcatIdx = Idx + 1; |
4439 | while (SubConcatEnd < RealVals) |
4440 | SubConcatOps[SubConcatEnd++] = ConcatOps[++Idx]; |
4441 | while (SubConcatEnd < OpsToConcat) |
4442 | SubConcatOps[SubConcatEnd++] = undefVec; |
4443 | ConcatOps[SubConcatIdx] = DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, |
4444 | VT: NextVT, Ops: SubConcatOps); |
4445 | ConcatEnd = SubConcatIdx + 1; |
4446 | } |
4447 | } |
4448 | |
4449 | // Check to see if we have a single operation with the widen type. |
4450 | if (ConcatEnd == 1) { |
4451 | VT = ConcatOps[0].getValueType(); |
4452 | if (VT == WidenVT) |
4453 | return ConcatOps[0]; |
4454 | } |
4455 | |
4456 | // add undefs of size MaxVT until ConcatOps grows to length of WidenVT |
4457 | unsigned NumOps = WidenVT.getVectorNumElements()/MaxVT.getVectorNumElements(); |
4458 | if (NumOps != ConcatEnd ) { |
4459 | SDValue UndefVal = DAG.getUNDEF(VT: MaxVT); |
4460 | for (unsigned j = ConcatEnd; j < NumOps; ++j) |
4461 | ConcatOps[j] = UndefVal; |
4462 | } |
4463 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: WidenVT, |
4464 | Ops: ArrayRef(ConcatOps.data(), NumOps)); |
4465 | } |
4466 | |
4467 | SDValue DAGTypeLegalizer::WidenVecRes_BinaryCanTrap(SDNode *N) { |
4468 | // Binary op widening for operations that can trap. |
4469 | unsigned Opcode = N->getOpcode(); |
4470 | SDLoc dl(N); |
4471 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4472 | EVT WidenEltVT = WidenVT.getVectorElementType(); |
4473 | EVT VT = WidenVT; |
4474 | unsigned NumElts = VT.getVectorMinNumElements(); |
4475 | const SDNodeFlags Flags = N->getFlags(); |
4476 | while (!TLI.isTypeLegal(VT) && NumElts != 1) { |
4477 | NumElts = NumElts / 2; |
4478 | VT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: WidenEltVT, NumElements: NumElts); |
4479 | } |
4480 | |
4481 | if (NumElts != 1 && !TLI.canOpTrap(Op: N->getOpcode(), VT)) { |
4482 | // Operation doesn't trap so just widen as normal. |
4483 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 0)); |
4484 | SDValue InOp2 = GetWidenedVector(Op: N->getOperand(Num: 1)); |
4485 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: WidenVT, N1: InOp1, N2: InOp2, Flags); |
4486 | } |
4487 | |
4488 | // FIXME: Improve support for scalable vectors. |
4489 | assert(!VT.isScalableVector() && "Scalable vectors not handled yet." ); |
4490 | |
4491 | // No legal vector version so unroll the vector operation and then widen. |
4492 | if (NumElts == 1) |
4493 | return DAG.UnrollVectorOp(N, ResNE: WidenVT.getVectorNumElements()); |
4494 | |
4495 | // Since the operation can trap, apply operation on the original vector. |
4496 | EVT MaxVT = VT; |
4497 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 0)); |
4498 | SDValue InOp2 = GetWidenedVector(Op: N->getOperand(Num: 1)); |
4499 | unsigned CurNumElts = N->getValueType(ResNo: 0).getVectorNumElements(); |
4500 | |
4501 | SmallVector<SDValue, 16> ConcatOps(CurNumElts); |
4502 | unsigned ConcatEnd = 0; // Current ConcatOps index. |
4503 | int Idx = 0; // Current Idx into input vectors. |
4504 | |
4505 | // NumElts := greatest legal vector size (at most WidenVT) |
4506 | // while (orig. vector has unhandled elements) { |
4507 | // take munches of size NumElts from the beginning and add to ConcatOps |
4508 | // NumElts := next smaller supported vector size or 1 |
4509 | // } |
4510 | while (CurNumElts != 0) { |
4511 | while (CurNumElts >= NumElts) { |
4512 | SDValue EOp1 = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT, N1: InOp1, |
4513 | N2: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
4514 | SDValue EOp2 = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT, N1: InOp2, |
4515 | N2: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
4516 | ConcatOps[ConcatEnd++] = DAG.getNode(Opcode, DL: dl, VT, N1: EOp1, N2: EOp2, Flags); |
4517 | Idx += NumElts; |
4518 | CurNumElts -= NumElts; |
4519 | } |
4520 | do { |
4521 | NumElts = NumElts / 2; |
4522 | VT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: WidenEltVT, NumElements: NumElts); |
4523 | } while (!TLI.isTypeLegal(VT) && NumElts != 1); |
4524 | |
4525 | if (NumElts == 1) { |
4526 | for (unsigned i = 0; i != CurNumElts; ++i, ++Idx) { |
4527 | SDValue EOp1 = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: WidenEltVT, |
4528 | N1: InOp1, N2: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
4529 | SDValue EOp2 = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: WidenEltVT, |
4530 | N1: InOp2, N2: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
4531 | ConcatOps[ConcatEnd++] = DAG.getNode(Opcode, DL: dl, VT: WidenEltVT, |
4532 | N1: EOp1, N2: EOp2, Flags); |
4533 | } |
4534 | CurNumElts = 0; |
4535 | } |
4536 | } |
4537 | |
4538 | return CollectOpsToWiden(DAG, TLI, ConcatOps, ConcatEnd, VT, MaxVT, WidenVT); |
4539 | } |
4540 | |
4541 | SDValue DAGTypeLegalizer::WidenVecRes_StrictFP(SDNode *N) { |
4542 | switch (N->getOpcode()) { |
4543 | case ISD::STRICT_FSETCC: |
4544 | case ISD::STRICT_FSETCCS: |
4545 | return WidenVecRes_STRICT_FSETCC(N); |
4546 | case ISD::STRICT_FP_EXTEND: |
4547 | case ISD::STRICT_FP_ROUND: |
4548 | case ISD::STRICT_FP_TO_SINT: |
4549 | case ISD::STRICT_FP_TO_UINT: |
4550 | case ISD::STRICT_SINT_TO_FP: |
4551 | case ISD::STRICT_UINT_TO_FP: |
4552 | return WidenVecRes_Convert_StrictFP(N); |
4553 | default: |
4554 | break; |
4555 | } |
4556 | |
4557 | // StrictFP op widening for operations that can trap. |
4558 | unsigned NumOpers = N->getNumOperands(); |
4559 | unsigned Opcode = N->getOpcode(); |
4560 | SDLoc dl(N); |
4561 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4562 | EVT WidenEltVT = WidenVT.getVectorElementType(); |
4563 | EVT VT = WidenVT; |
4564 | unsigned NumElts = VT.getVectorNumElements(); |
4565 | while (!TLI.isTypeLegal(VT) && NumElts != 1) { |
4566 | NumElts = NumElts / 2; |
4567 | VT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: WidenEltVT, NumElements: NumElts); |
4568 | } |
4569 | |
4570 | // No legal vector version so unroll the vector operation and then widen. |
4571 | if (NumElts == 1) |
4572 | return UnrollVectorOp_StrictFP(N, ResNE: WidenVT.getVectorNumElements()); |
4573 | |
4574 | // Since the operation can trap, apply operation on the original vector. |
4575 | EVT MaxVT = VT; |
4576 | SmallVector<SDValue, 4> InOps; |
4577 | unsigned CurNumElts = N->getValueType(ResNo: 0).getVectorNumElements(); |
4578 | |
4579 | SmallVector<SDValue, 16> ConcatOps(CurNumElts); |
4580 | SmallVector<SDValue, 16> Chains; |
4581 | unsigned ConcatEnd = 0; // Current ConcatOps index. |
4582 | int Idx = 0; // Current Idx into input vectors. |
4583 | |
4584 | // The Chain is the first operand. |
4585 | InOps.push_back(Elt: N->getOperand(Num: 0)); |
4586 | |
4587 | // Now process the remaining operands. |
4588 | for (unsigned i = 1; i < NumOpers; ++i) { |
4589 | SDValue Oper = N->getOperand(Num: i); |
4590 | |
4591 | EVT OpVT = Oper.getValueType(); |
4592 | if (OpVT.isVector()) { |
4593 | if (getTypeAction(VT: OpVT) == TargetLowering::TypeWidenVector) |
4594 | Oper = GetWidenedVector(Op: Oper); |
4595 | else { |
4596 | EVT WideOpVT = |
4597 | EVT::getVectorVT(Context&: *DAG.getContext(), VT: OpVT.getVectorElementType(), |
4598 | EC: WidenVT.getVectorElementCount()); |
4599 | Oper = DAG.getNode(Opcode: ISD::INSERT_SUBVECTOR, DL: dl, VT: WideOpVT, |
4600 | N1: DAG.getUNDEF(VT: WideOpVT), N2: Oper, |
4601 | N3: DAG.getVectorIdxConstant(Val: 0, DL: dl)); |
4602 | } |
4603 | } |
4604 | |
4605 | InOps.push_back(Elt: Oper); |
4606 | } |
4607 | |
4608 | // NumElts := greatest legal vector size (at most WidenVT) |
4609 | // while (orig. vector has unhandled elements) { |
4610 | // take munches of size NumElts from the beginning and add to ConcatOps |
4611 | // NumElts := next smaller supported vector size or 1 |
4612 | // } |
4613 | while (CurNumElts != 0) { |
4614 | while (CurNumElts >= NumElts) { |
4615 | SmallVector<SDValue, 4> EOps; |
4616 | |
4617 | for (unsigned i = 0; i < NumOpers; ++i) { |
4618 | SDValue Op = InOps[i]; |
4619 | |
4620 | EVT OpVT = Op.getValueType(); |
4621 | if (OpVT.isVector()) { |
4622 | EVT = |
4623 | EVT::getVectorVT(Context&: *DAG.getContext(), VT: OpVT.getVectorElementType(), |
4624 | EC: VT.getVectorElementCount()); |
4625 | Op = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: OpExtractVT, N1: Op, |
4626 | N2: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
4627 | } |
4628 | |
4629 | EOps.push_back(Elt: Op); |
4630 | } |
4631 | |
4632 | EVT OperVT[] = {VT, MVT::Other}; |
4633 | SDValue Oper = DAG.getNode(Opcode, dl, OperVT, EOps); |
4634 | ConcatOps[ConcatEnd++] = Oper; |
4635 | Chains.push_back(Elt: Oper.getValue(R: 1)); |
4636 | Idx += NumElts; |
4637 | CurNumElts -= NumElts; |
4638 | } |
4639 | do { |
4640 | NumElts = NumElts / 2; |
4641 | VT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: WidenEltVT, NumElements: NumElts); |
4642 | } while (!TLI.isTypeLegal(VT) && NumElts != 1); |
4643 | |
4644 | if (NumElts == 1) { |
4645 | for (unsigned i = 0; i != CurNumElts; ++i, ++Idx) { |
4646 | SmallVector<SDValue, 4> EOps; |
4647 | |
4648 | for (unsigned i = 0; i < NumOpers; ++i) { |
4649 | SDValue Op = InOps[i]; |
4650 | |
4651 | EVT OpVT = Op.getValueType(); |
4652 | if (OpVT.isVector()) |
4653 | Op = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, |
4654 | VT: OpVT.getVectorElementType(), N1: Op, |
4655 | N2: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
4656 | |
4657 | EOps.push_back(Elt: Op); |
4658 | } |
4659 | |
4660 | EVT WidenVT[] = {WidenEltVT, MVT::Other}; |
4661 | SDValue Oper = DAG.getNode(Opcode, dl, WidenVT, EOps); |
4662 | ConcatOps[ConcatEnd++] = Oper; |
4663 | Chains.push_back(Elt: Oper.getValue(R: 1)); |
4664 | } |
4665 | CurNumElts = 0; |
4666 | } |
4667 | } |
4668 | |
4669 | // Build a factor node to remember all the Ops that have been created. |
4670 | SDValue NewChain; |
4671 | if (Chains.size() == 1) |
4672 | NewChain = Chains[0]; |
4673 | else |
4674 | NewChain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Chains); |
4675 | ReplaceValueWith(From: SDValue(N, 1), To: NewChain); |
4676 | |
4677 | return CollectOpsToWiden(DAG, TLI, ConcatOps, ConcatEnd, VT, MaxVT, WidenVT); |
4678 | } |
4679 | |
4680 | SDValue DAGTypeLegalizer::WidenVecRes_OverflowOp(SDNode *N, unsigned ResNo) { |
4681 | SDLoc DL(N); |
4682 | EVT ResVT = N->getValueType(ResNo: 0); |
4683 | EVT OvVT = N->getValueType(ResNo: 1); |
4684 | EVT WideResVT, WideOvVT; |
4685 | SDValue WideLHS, WideRHS; |
4686 | |
4687 | // TODO: This might result in a widen/split loop. |
4688 | if (ResNo == 0) { |
4689 | WideResVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: ResVT); |
4690 | WideOvVT = EVT::getVectorVT( |
4691 | Context&: *DAG.getContext(), VT: OvVT.getVectorElementType(), |
4692 | NumElements: WideResVT.getVectorNumElements()); |
4693 | |
4694 | WideLHS = GetWidenedVector(Op: N->getOperand(Num: 0)); |
4695 | WideRHS = GetWidenedVector(Op: N->getOperand(Num: 1)); |
4696 | } else { |
4697 | WideOvVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: OvVT); |
4698 | WideResVT = EVT::getVectorVT( |
4699 | Context&: *DAG.getContext(), VT: ResVT.getVectorElementType(), |
4700 | NumElements: WideOvVT.getVectorNumElements()); |
4701 | |
4702 | SDValue Zero = DAG.getVectorIdxConstant(Val: 0, DL); |
4703 | WideLHS = DAG.getNode( |
4704 | Opcode: ISD::INSERT_SUBVECTOR, DL, VT: WideResVT, N1: DAG.getUNDEF(VT: WideResVT), |
4705 | N2: N->getOperand(Num: 0), N3: Zero); |
4706 | WideRHS = DAG.getNode( |
4707 | Opcode: ISD::INSERT_SUBVECTOR, DL, VT: WideResVT, N1: DAG.getUNDEF(VT: WideResVT), |
4708 | N2: N->getOperand(Num: 1), N3: Zero); |
4709 | } |
4710 | |
4711 | SDVTList WideVTs = DAG.getVTList(VT1: WideResVT, VT2: WideOvVT); |
4712 | SDNode *WideNode = DAG.getNode( |
4713 | Opcode: N->getOpcode(), DL, VTList: WideVTs, N1: WideLHS, N2: WideRHS).getNode(); |
4714 | |
4715 | // Replace the other vector result not being explicitly widened here. |
4716 | unsigned OtherNo = 1 - ResNo; |
4717 | EVT OtherVT = N->getValueType(ResNo: OtherNo); |
4718 | if (getTypeAction(VT: OtherVT) == TargetLowering::TypeWidenVector) { |
4719 | SetWidenedVector(Op: SDValue(N, OtherNo), Result: SDValue(WideNode, OtherNo)); |
4720 | } else { |
4721 | SDValue Zero = DAG.getVectorIdxConstant(Val: 0, DL); |
4722 | SDValue OtherVal = DAG.getNode( |
4723 | Opcode: ISD::EXTRACT_SUBVECTOR, DL, VT: OtherVT, N1: SDValue(WideNode, OtherNo), N2: Zero); |
4724 | ReplaceValueWith(From: SDValue(N, OtherNo), To: OtherVal); |
4725 | } |
4726 | |
4727 | return SDValue(WideNode, ResNo); |
4728 | } |
4729 | |
4730 | SDValue DAGTypeLegalizer::WidenVecRes_Convert(SDNode *N) { |
4731 | LLVMContext &Ctx = *DAG.getContext(); |
4732 | SDValue InOp = N->getOperand(Num: 0); |
4733 | SDLoc DL(N); |
4734 | |
4735 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: Ctx, VT: N->getValueType(ResNo: 0)); |
4736 | ElementCount WidenEC = WidenVT.getVectorElementCount(); |
4737 | |
4738 | EVT InVT = InOp.getValueType(); |
4739 | |
4740 | unsigned Opcode = N->getOpcode(); |
4741 | const SDNodeFlags Flags = N->getFlags(); |
4742 | |
4743 | // Handle the case of ZERO_EXTEND where the promoted InVT element size does |
4744 | // not equal that of WidenVT. |
4745 | if (N->getOpcode() == ISD::ZERO_EXTEND && |
4746 | getTypeAction(VT: InVT) == TargetLowering::TypePromoteInteger && |
4747 | TLI.getTypeToTransformTo(Context&: Ctx, VT: InVT).getScalarSizeInBits() != |
4748 | WidenVT.getScalarSizeInBits()) { |
4749 | InOp = ZExtPromotedInteger(Op: InOp); |
4750 | InVT = InOp.getValueType(); |
4751 | if (WidenVT.getScalarSizeInBits() < InVT.getScalarSizeInBits()) |
4752 | Opcode = ISD::TRUNCATE; |
4753 | } |
4754 | |
4755 | EVT InEltVT = InVT.getVectorElementType(); |
4756 | EVT InWidenVT = EVT::getVectorVT(Context&: Ctx, VT: InEltVT, EC: WidenEC); |
4757 | ElementCount InVTEC = InVT.getVectorElementCount(); |
4758 | |
4759 | if (getTypeAction(VT: InVT) == TargetLowering::TypeWidenVector) { |
4760 | InOp = GetWidenedVector(Op: N->getOperand(Num: 0)); |
4761 | InVT = InOp.getValueType(); |
4762 | InVTEC = InVT.getVectorElementCount(); |
4763 | if (InVTEC == WidenEC) { |
4764 | if (N->getNumOperands() == 1) |
4765 | return DAG.getNode(Opcode, DL, VT: WidenVT, Operand: InOp); |
4766 | if (N->getNumOperands() == 3) { |
4767 | assert(N->isVPOpcode() && "Expected VP opcode" ); |
4768 | SDValue Mask = |
4769 | GetWidenedMask(Mask: N->getOperand(Num: 1), EC: WidenVT.getVectorElementCount()); |
4770 | return DAG.getNode(Opcode, DL, VT: WidenVT, N1: InOp, N2: Mask, N3: N->getOperand(Num: 2)); |
4771 | } |
4772 | return DAG.getNode(Opcode, DL, VT: WidenVT, N1: InOp, N2: N->getOperand(Num: 1), Flags); |
4773 | } |
4774 | if (WidenVT.getSizeInBits() == InVT.getSizeInBits()) { |
4775 | // If both input and result vector types are of same width, extend |
4776 | // operations should be done with SIGN/ZERO_EXTEND_VECTOR_INREG, which |
4777 | // accepts fewer elements in the result than in the input. |
4778 | if (Opcode == ISD::ANY_EXTEND) |
4779 | return DAG.getNode(Opcode: ISD::ANY_EXTEND_VECTOR_INREG, DL, VT: WidenVT, Operand: InOp); |
4780 | if (Opcode == ISD::SIGN_EXTEND) |
4781 | return DAG.getNode(Opcode: ISD::SIGN_EXTEND_VECTOR_INREG, DL, VT: WidenVT, Operand: InOp); |
4782 | if (Opcode == ISD::ZERO_EXTEND) |
4783 | return DAG.getNode(Opcode: ISD::ZERO_EXTEND_VECTOR_INREG, DL, VT: WidenVT, Operand: InOp); |
4784 | } |
4785 | } |
4786 | |
4787 | if (TLI.isTypeLegal(VT: InWidenVT)) { |
4788 | // Because the result and the input are different vector types, widening |
4789 | // the result could create a legal type but widening the input might make |
4790 | // it an illegal type that might lead to repeatedly splitting the input |
4791 | // and then widening it. To avoid this, we widen the input only if |
4792 | // it results in a legal type. |
4793 | if (WidenEC.isKnownMultipleOf(RHS: InVTEC.getKnownMinValue())) { |
4794 | // Widen the input and call convert on the widened input vector. |
4795 | unsigned NumConcat = |
4796 | WidenEC.getKnownMinValue() / InVTEC.getKnownMinValue(); |
4797 | SmallVector<SDValue, 16> Ops(NumConcat, DAG.getUNDEF(VT: InVT)); |
4798 | Ops[0] = InOp; |
4799 | SDValue InVec = DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL, VT: InWidenVT, Ops); |
4800 | if (N->getNumOperands() == 1) |
4801 | return DAG.getNode(Opcode, DL, VT: WidenVT, Operand: InVec); |
4802 | return DAG.getNode(Opcode, DL, VT: WidenVT, N1: InVec, N2: N->getOperand(Num: 1), Flags); |
4803 | } |
4804 | |
4805 | if (InVTEC.isKnownMultipleOf(RHS: WidenEC.getKnownMinValue())) { |
4806 | SDValue InVal = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL, VT: InWidenVT, N1: InOp, |
4807 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
4808 | // Extract the input and convert the shorten input vector. |
4809 | if (N->getNumOperands() == 1) |
4810 | return DAG.getNode(Opcode, DL, VT: WidenVT, Operand: InVal); |
4811 | return DAG.getNode(Opcode, DL, VT: WidenVT, N1: InVal, N2: N->getOperand(Num: 1), Flags); |
4812 | } |
4813 | } |
4814 | |
4815 | // Otherwise unroll into some nasty scalar code and rebuild the vector. |
4816 | EVT EltVT = WidenVT.getVectorElementType(); |
4817 | SmallVector<SDValue, 16> Ops(WidenEC.getFixedValue(), DAG.getUNDEF(VT: EltVT)); |
4818 | // Use the original element count so we don't do more scalar opts than |
4819 | // necessary. |
4820 | unsigned MinElts = N->getValueType(ResNo: 0).getVectorNumElements(); |
4821 | for (unsigned i=0; i < MinElts; ++i) { |
4822 | SDValue Val = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT: InEltVT, N1: InOp, |
4823 | N2: DAG.getVectorIdxConstant(Val: i, DL)); |
4824 | if (N->getNumOperands() == 1) |
4825 | Ops[i] = DAG.getNode(Opcode, DL, VT: EltVT, Operand: Val); |
4826 | else |
4827 | Ops[i] = DAG.getNode(Opcode, DL, VT: EltVT, N1: Val, N2: N->getOperand(Num: 1), Flags); |
4828 | } |
4829 | |
4830 | return DAG.getBuildVector(VT: WidenVT, DL, Ops); |
4831 | } |
4832 | |
4833 | SDValue DAGTypeLegalizer::WidenVecRes_FP_TO_XINT_SAT(SDNode *N) { |
4834 | SDLoc dl(N); |
4835 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4836 | ElementCount WidenNumElts = WidenVT.getVectorElementCount(); |
4837 | |
4838 | SDValue Src = N->getOperand(Num: 0); |
4839 | EVT SrcVT = Src.getValueType(); |
4840 | |
4841 | // Also widen the input. |
4842 | if (getTypeAction(VT: SrcVT) == TargetLowering::TypeWidenVector) { |
4843 | Src = GetWidenedVector(Op: Src); |
4844 | SrcVT = Src.getValueType(); |
4845 | } |
4846 | |
4847 | // Input and output not widened to the same size, give up. |
4848 | if (WidenNumElts != SrcVT.getVectorElementCount()) |
4849 | return DAG.UnrollVectorOp(N, ResNE: WidenNumElts.getKnownMinValue()); |
4850 | |
4851 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: WidenVT, N1: Src, N2: N->getOperand(Num: 1)); |
4852 | } |
4853 | |
4854 | SDValue DAGTypeLegalizer::WidenVecRes_XRINT(SDNode *N) { |
4855 | SDLoc dl(N); |
4856 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4857 | ElementCount WidenNumElts = WidenVT.getVectorElementCount(); |
4858 | |
4859 | SDValue Src = N->getOperand(Num: 0); |
4860 | EVT SrcVT = Src.getValueType(); |
4861 | |
4862 | // Also widen the input. |
4863 | if (getTypeAction(VT: SrcVT) == TargetLowering::TypeWidenVector) { |
4864 | Src = GetWidenedVector(Op: Src); |
4865 | SrcVT = Src.getValueType(); |
4866 | } |
4867 | |
4868 | // Input and output not widened to the same size, give up. |
4869 | if (WidenNumElts != SrcVT.getVectorElementCount()) |
4870 | return DAG.UnrollVectorOp(N, ResNE: WidenNumElts.getKnownMinValue()); |
4871 | |
4872 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: WidenVT, Operand: Src); |
4873 | } |
4874 | |
4875 | SDValue DAGTypeLegalizer::WidenVecRes_Convert_StrictFP(SDNode *N) { |
4876 | SDValue InOp = N->getOperand(Num: 1); |
4877 | SDLoc DL(N); |
4878 | SmallVector<SDValue, 4> NewOps(N->op_begin(), N->op_end()); |
4879 | |
4880 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4881 | unsigned WidenNumElts = WidenVT.getVectorNumElements(); |
4882 | |
4883 | EVT InVT = InOp.getValueType(); |
4884 | EVT InEltVT = InVT.getVectorElementType(); |
4885 | |
4886 | unsigned Opcode = N->getOpcode(); |
4887 | |
4888 | // FIXME: Optimizations need to be implemented here. |
4889 | |
4890 | // Otherwise unroll into some nasty scalar code and rebuild the vector. |
4891 | EVT EltVT = WidenVT.getVectorElementType(); |
4892 | std::array<EVT, 2> EltVTs = {{EltVT, MVT::Other}}; |
4893 | SmallVector<SDValue, 16> Ops(WidenNumElts, DAG.getUNDEF(VT: EltVT)); |
4894 | SmallVector<SDValue, 32> OpChains; |
4895 | // Use the original element count so we don't do more scalar opts than |
4896 | // necessary. |
4897 | unsigned MinElts = N->getValueType(ResNo: 0).getVectorNumElements(); |
4898 | for (unsigned i=0; i < MinElts; ++i) { |
4899 | NewOps[1] = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT: InEltVT, N1: InOp, |
4900 | N2: DAG.getVectorIdxConstant(Val: i, DL)); |
4901 | Ops[i] = DAG.getNode(Opcode, DL, ResultTys: EltVTs, Ops: NewOps); |
4902 | OpChains.push_back(Elt: Ops[i].getValue(R: 1)); |
4903 | } |
4904 | SDValue NewChain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, OpChains); |
4905 | ReplaceValueWith(From: SDValue(N, 1), To: NewChain); |
4906 | |
4907 | return DAG.getBuildVector(VT: WidenVT, DL, Ops); |
4908 | } |
4909 | |
4910 | SDValue DAGTypeLegalizer::WidenVecRes_EXTEND_VECTOR_INREG(SDNode *N) { |
4911 | unsigned Opcode = N->getOpcode(); |
4912 | SDValue InOp = N->getOperand(Num: 0); |
4913 | SDLoc DL(N); |
4914 | |
4915 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4916 | EVT WidenSVT = WidenVT.getVectorElementType(); |
4917 | unsigned WidenNumElts = WidenVT.getVectorNumElements(); |
4918 | |
4919 | EVT InVT = InOp.getValueType(); |
4920 | EVT InSVT = InVT.getVectorElementType(); |
4921 | unsigned InVTNumElts = InVT.getVectorNumElements(); |
4922 | |
4923 | if (getTypeAction(VT: InVT) == TargetLowering::TypeWidenVector) { |
4924 | InOp = GetWidenedVector(Op: InOp); |
4925 | InVT = InOp.getValueType(); |
4926 | if (InVT.getSizeInBits() == WidenVT.getSizeInBits()) { |
4927 | switch (Opcode) { |
4928 | case ISD::ANY_EXTEND_VECTOR_INREG: |
4929 | case ISD::SIGN_EXTEND_VECTOR_INREG: |
4930 | case ISD::ZERO_EXTEND_VECTOR_INREG: |
4931 | return DAG.getNode(Opcode, DL, VT: WidenVT, Operand: InOp); |
4932 | } |
4933 | } |
4934 | } |
4935 | |
4936 | // Unroll, extend the scalars and rebuild the vector. |
4937 | SmallVector<SDValue, 16> Ops; |
4938 | for (unsigned i = 0, e = std::min(a: InVTNumElts, b: WidenNumElts); i != e; ++i) { |
4939 | SDValue Val = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL, VT: InSVT, N1: InOp, |
4940 | N2: DAG.getVectorIdxConstant(Val: i, DL)); |
4941 | switch (Opcode) { |
4942 | case ISD::ANY_EXTEND_VECTOR_INREG: |
4943 | Val = DAG.getNode(Opcode: ISD::ANY_EXTEND, DL, VT: WidenSVT, Operand: Val); |
4944 | break; |
4945 | case ISD::SIGN_EXTEND_VECTOR_INREG: |
4946 | Val = DAG.getNode(Opcode: ISD::SIGN_EXTEND, DL, VT: WidenSVT, Operand: Val); |
4947 | break; |
4948 | case ISD::ZERO_EXTEND_VECTOR_INREG: |
4949 | Val = DAG.getNode(Opcode: ISD::ZERO_EXTEND, DL, VT: WidenSVT, Operand: Val); |
4950 | break; |
4951 | default: |
4952 | llvm_unreachable("A *_EXTEND_VECTOR_INREG node was expected" ); |
4953 | } |
4954 | Ops.push_back(Elt: Val); |
4955 | } |
4956 | |
4957 | while (Ops.size() != WidenNumElts) |
4958 | Ops.push_back(Elt: DAG.getUNDEF(VT: WidenSVT)); |
4959 | |
4960 | return DAG.getBuildVector(VT: WidenVT, DL, Ops); |
4961 | } |
4962 | |
4963 | SDValue DAGTypeLegalizer::WidenVecRes_FCOPYSIGN(SDNode *N) { |
4964 | // If this is an FCOPYSIGN with same input types, we can treat it as a |
4965 | // normal (can trap) binary op. |
4966 | if (N->getOperand(Num: 0).getValueType() == N->getOperand(Num: 1).getValueType()) |
4967 | return WidenVecRes_BinaryCanTrap(N); |
4968 | |
4969 | // If the types are different, fall back to unrolling. |
4970 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4971 | return DAG.UnrollVectorOp(N, ResNE: WidenVT.getVectorNumElements()); |
4972 | } |
4973 | |
4974 | SDValue DAGTypeLegalizer::WidenVecRes_IS_FPCLASS(SDNode *N) { |
4975 | SDValue FpValue = N->getOperand(Num: 0); |
4976 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4977 | if (getTypeAction(VT: FpValue.getValueType()) != TargetLowering::TypeWidenVector) |
4978 | return DAG.UnrollVectorOp(N, ResNE: WidenVT.getVectorNumElements()); |
4979 | SDValue Arg = GetWidenedVector(Op: FpValue); |
4980 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: WidenVT, Ops: {Arg, N->getOperand(Num: 1)}, |
4981 | Flags: N->getFlags()); |
4982 | } |
4983 | |
4984 | SDValue DAGTypeLegalizer::WidenVecRes_ExpOp(SDNode *N) { |
4985 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4986 | SDValue InOp = GetWidenedVector(Op: N->getOperand(Num: 0)); |
4987 | SDValue RHS = N->getOperand(Num: 1); |
4988 | SDValue ExpOp = RHS.getValueType().isVector() ? GetWidenedVector(Op: RHS) : RHS; |
4989 | |
4990 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: WidenVT, N1: InOp, N2: ExpOp); |
4991 | } |
4992 | |
4993 | SDValue DAGTypeLegalizer::WidenVecRes_Unary(SDNode *N) { |
4994 | // Unary op widening. |
4995 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
4996 | SDValue InOp = GetWidenedVector(Op: N->getOperand(Num: 0)); |
4997 | if (N->getNumOperands() == 1) |
4998 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: WidenVT, Operand: InOp, Flags: N->getFlags()); |
4999 | |
5000 | assert(N->getNumOperands() == 3 && "Unexpected number of operands!" ); |
5001 | assert(N->isVPOpcode() && "Expected VP opcode" ); |
5002 | |
5003 | SDValue Mask = |
5004 | GetWidenedMask(Mask: N->getOperand(Num: 1), EC: WidenVT.getVectorElementCount()); |
5005 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: WidenVT, |
5006 | Ops: {InOp, Mask, N->getOperand(Num: 2)}); |
5007 | } |
5008 | |
5009 | SDValue DAGTypeLegalizer::WidenVecRes_InregOp(SDNode *N) { |
5010 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
5011 | EVT ExtVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
5012 | VT: cast<VTSDNode>(Val: N->getOperand(Num: 1))->getVT() |
5013 | .getVectorElementType(), |
5014 | NumElements: WidenVT.getVectorNumElements()); |
5015 | SDValue WidenLHS = GetWidenedVector(Op: N->getOperand(Num: 0)); |
5016 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), |
5017 | VT: WidenVT, N1: WidenLHS, N2: DAG.getValueType(ExtVT)); |
5018 | } |
5019 | |
5020 | SDValue DAGTypeLegalizer::WidenVecRes_MERGE_VALUES(SDNode *N, unsigned ResNo) { |
5021 | SDValue WidenVec = DisintegrateMERGE_VALUES(N, ResNo); |
5022 | return GetWidenedVector(Op: WidenVec); |
5023 | } |
5024 | |
5025 | SDValue DAGTypeLegalizer::WidenVecRes_BITCAST(SDNode *N) { |
5026 | SDValue InOp = N->getOperand(Num: 0); |
5027 | EVT InVT = InOp.getValueType(); |
5028 | EVT VT = N->getValueType(ResNo: 0); |
5029 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT); |
5030 | SDLoc dl(N); |
5031 | |
5032 | switch (getTypeAction(VT: InVT)) { |
5033 | case TargetLowering::TypeLegal: |
5034 | break; |
5035 | case TargetLowering::TypeScalarizeScalableVector: |
5036 | report_fatal_error(reason: "Scalarization of scalable vectors is not supported." ); |
5037 | case TargetLowering::TypePromoteInteger: { |
5038 | // If the incoming type is a vector that is being promoted, then |
5039 | // we know that the elements are arranged differently and that we |
5040 | // must perform the conversion using a stack slot. |
5041 | if (InVT.isVector()) |
5042 | break; |
5043 | |
5044 | // If the InOp is promoted to the same size, convert it. Otherwise, |
5045 | // fall out of the switch and widen the promoted input. |
5046 | SDValue NInOp = GetPromotedInteger(Op: InOp); |
5047 | EVT NInVT = NInOp.getValueType(); |
5048 | if (WidenVT.bitsEq(VT: NInVT)) { |
5049 | // For big endian targets we need to shift the input integer or the |
5050 | // interesting bits will end up at the wrong place. |
5051 | if (DAG.getDataLayout().isBigEndian()) { |
5052 | unsigned ShiftAmt = NInVT.getSizeInBits() - InVT.getSizeInBits(); |
5053 | EVT ShiftAmtTy = TLI.getShiftAmountTy(LHSTy: NInVT, DL: DAG.getDataLayout()); |
5054 | assert(ShiftAmt < WidenVT.getSizeInBits() && "Too large shift amount!" ); |
5055 | NInOp = DAG.getNode(Opcode: ISD::SHL, DL: dl, VT: NInVT, N1: NInOp, |
5056 | N2: DAG.getConstant(Val: ShiftAmt, DL: dl, VT: ShiftAmtTy)); |
5057 | } |
5058 | return DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: WidenVT, Operand: NInOp); |
5059 | } |
5060 | InOp = NInOp; |
5061 | InVT = NInVT; |
5062 | break; |
5063 | } |
5064 | case TargetLowering::TypeSoftenFloat: |
5065 | case TargetLowering::TypePromoteFloat: |
5066 | case TargetLowering::TypeSoftPromoteHalf: |
5067 | case TargetLowering::TypeExpandInteger: |
5068 | case TargetLowering::TypeExpandFloat: |
5069 | case TargetLowering::TypeScalarizeVector: |
5070 | case TargetLowering::TypeSplitVector: |
5071 | break; |
5072 | case TargetLowering::TypeWidenVector: |
5073 | // If the InOp is widened to the same size, convert it. Otherwise, fall |
5074 | // out of the switch and widen the widened input. |
5075 | InOp = GetWidenedVector(Op: InOp); |
5076 | InVT = InOp.getValueType(); |
5077 | if (WidenVT.bitsEq(VT: InVT)) |
5078 | // The input widens to the same size. Convert to the widen value. |
5079 | return DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: WidenVT, Operand: InOp); |
5080 | break; |
5081 | } |
5082 | |
5083 | unsigned WidenSize = WidenVT.getSizeInBits(); |
5084 | unsigned InSize = InVT.getSizeInBits(); |
5085 | unsigned InScalarSize = InVT.getScalarSizeInBits(); |
5086 | // x86mmx is not an acceptable vector element type, so don't try. |
5087 | if (WidenSize % InScalarSize == 0 && InVT != MVT::x86mmx) { |
5088 | // Determine new input vector type. The new input vector type will use |
5089 | // the same element type (if its a vector) or use the input type as a |
5090 | // vector. It is the same size as the type to widen to. |
5091 | EVT NewInVT; |
5092 | unsigned NewNumParts = WidenSize / InSize; |
5093 | if (InVT.isVector()) { |
5094 | EVT InEltVT = InVT.getVectorElementType(); |
5095 | NewInVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: InEltVT, |
5096 | NumElements: WidenSize / InEltVT.getSizeInBits()); |
5097 | } else { |
5098 | // For big endian systems, using the promoted input scalar type |
5099 | // to produce the scalar_to_vector would put the desired bits into |
5100 | // the least significant byte(s) of the wider element zero. This |
5101 | // will mean that the users of the result vector are using incorrect |
5102 | // bits. Use the original input type instead. Although either input |
5103 | // type can be used on little endian systems, for consistency we |
5104 | // use the original type there as well. |
5105 | EVT OrigInVT = N->getOperand(Num: 0).getValueType(); |
5106 | NewNumParts = WidenSize / OrigInVT.getSizeInBits(); |
5107 | NewInVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: OrigInVT, NumElements: NewNumParts); |
5108 | } |
5109 | |
5110 | if (TLI.isTypeLegal(VT: NewInVT)) { |
5111 | SDValue NewVec; |
5112 | if (InVT.isVector()) { |
5113 | // Because the result and the input are different vector types, widening |
5114 | // the result could create a legal type but widening the input might |
5115 | // make it an illegal type that might lead to repeatedly splitting the |
5116 | // input and then widening it. To avoid this, we widen the input only if |
5117 | // it results in a legal type. |
5118 | if (WidenSize % InSize == 0) { |
5119 | SmallVector<SDValue, 16> Ops(NewNumParts, DAG.getUNDEF(VT: InVT)); |
5120 | Ops[0] = InOp; |
5121 | |
5122 | NewVec = DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: NewInVT, Ops); |
5123 | } else { |
5124 | SmallVector<SDValue, 16> Ops; |
5125 | DAG.ExtractVectorElements(Op: InOp, Args&: Ops); |
5126 | Ops.append(NumInputs: WidenSize / InScalarSize - Ops.size(), |
5127 | Elt: DAG.getUNDEF(VT: InVT.getVectorElementType())); |
5128 | |
5129 | NewVec = DAG.getNode(Opcode: ISD::BUILD_VECTOR, DL: dl, VT: NewInVT, Ops); |
5130 | } |
5131 | } else { |
5132 | NewVec = DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL: dl, VT: NewInVT, Operand: InOp); |
5133 | } |
5134 | return DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: WidenVT, Operand: NewVec); |
5135 | } |
5136 | } |
5137 | |
5138 | return CreateStackStoreLoad(Op: InOp, DestVT: WidenVT); |
5139 | } |
5140 | |
5141 | SDValue DAGTypeLegalizer::WidenVecRes_BUILD_VECTOR(SDNode *N) { |
5142 | SDLoc dl(N); |
5143 | // Build a vector with undefined for the new nodes. |
5144 | EVT VT = N->getValueType(ResNo: 0); |
5145 | |
5146 | // Integer BUILD_VECTOR operands may be larger than the node's vector element |
5147 | // type. The UNDEFs need to have the same type as the existing operands. |
5148 | EVT EltVT = N->getOperand(Num: 0).getValueType(); |
5149 | unsigned NumElts = VT.getVectorNumElements(); |
5150 | |
5151 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT); |
5152 | unsigned WidenNumElts = WidenVT.getVectorNumElements(); |
5153 | |
5154 | SmallVector<SDValue, 16> NewOps(N->op_begin(), N->op_end()); |
5155 | assert(WidenNumElts >= NumElts && "Shrinking vector instead of widening!" ); |
5156 | NewOps.append(NumInputs: WidenNumElts - NumElts, Elt: DAG.getUNDEF(VT: EltVT)); |
5157 | |
5158 | return DAG.getBuildVector(VT: WidenVT, DL: dl, Ops: NewOps); |
5159 | } |
5160 | |
5161 | SDValue DAGTypeLegalizer::WidenVecRes_CONCAT_VECTORS(SDNode *N) { |
5162 | EVT InVT = N->getOperand(Num: 0).getValueType(); |
5163 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
5164 | SDLoc dl(N); |
5165 | unsigned NumOperands = N->getNumOperands(); |
5166 | |
5167 | bool InputWidened = false; // Indicates we need to widen the input. |
5168 | if (getTypeAction(VT: InVT) != TargetLowering::TypeWidenVector) { |
5169 | unsigned WidenNumElts = WidenVT.getVectorMinNumElements(); |
5170 | unsigned NumInElts = InVT.getVectorMinNumElements(); |
5171 | if (WidenNumElts % NumInElts == 0) { |
5172 | // Add undef vectors to widen to correct length. |
5173 | unsigned NumConcat = WidenNumElts / NumInElts; |
5174 | SDValue UndefVal = DAG.getUNDEF(VT: InVT); |
5175 | SmallVector<SDValue, 16> Ops(NumConcat); |
5176 | for (unsigned i=0; i < NumOperands; ++i) |
5177 | Ops[i] = N->getOperand(Num: i); |
5178 | for (unsigned i = NumOperands; i != NumConcat; ++i) |
5179 | Ops[i] = UndefVal; |
5180 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: WidenVT, Ops); |
5181 | } |
5182 | } else { |
5183 | InputWidened = true; |
5184 | if (WidenVT == TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: InVT)) { |
5185 | // The inputs and the result are widen to the same value. |
5186 | unsigned i; |
5187 | for (i=1; i < NumOperands; ++i) |
5188 | if (!N->getOperand(Num: i).isUndef()) |
5189 | break; |
5190 | |
5191 | if (i == NumOperands) |
5192 | // Everything but the first operand is an UNDEF so just return the |
5193 | // widened first operand. |
5194 | return GetWidenedVector(Op: N->getOperand(Num: 0)); |
5195 | |
5196 | if (NumOperands == 2) { |
5197 | assert(!WidenVT.isScalableVector() && |
5198 | "Cannot use vector shuffles to widen CONCAT_VECTOR result" ); |
5199 | unsigned WidenNumElts = WidenVT.getVectorNumElements(); |
5200 | unsigned NumInElts = InVT.getVectorNumElements(); |
5201 | |
5202 | // Replace concat of two operands with a shuffle. |
5203 | SmallVector<int, 16> MaskOps(WidenNumElts, -1); |
5204 | for (unsigned i = 0; i < NumInElts; ++i) { |
5205 | MaskOps[i] = i; |
5206 | MaskOps[i + NumInElts] = i + WidenNumElts; |
5207 | } |
5208 | return DAG.getVectorShuffle(VT: WidenVT, dl, |
5209 | N1: GetWidenedVector(Op: N->getOperand(Num: 0)), |
5210 | N2: GetWidenedVector(Op: N->getOperand(Num: 1)), |
5211 | Mask: MaskOps); |
5212 | } |
5213 | } |
5214 | } |
5215 | |
5216 | assert(!WidenVT.isScalableVector() && |
5217 | "Cannot use build vectors to widen CONCAT_VECTOR result" ); |
5218 | unsigned WidenNumElts = WidenVT.getVectorNumElements(); |
5219 | unsigned NumInElts = InVT.getVectorNumElements(); |
5220 | |
5221 | // Fall back to use extracts and build vector. |
5222 | EVT EltVT = WidenVT.getVectorElementType(); |
5223 | SmallVector<SDValue, 16> Ops(WidenNumElts); |
5224 | unsigned Idx = 0; |
5225 | for (unsigned i=0; i < NumOperands; ++i) { |
5226 | SDValue InOp = N->getOperand(Num: i); |
5227 | if (InputWidened) |
5228 | InOp = GetWidenedVector(Op: InOp); |
5229 | for (unsigned j = 0; j < NumInElts; ++j) |
5230 | Ops[Idx++] = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: EltVT, N1: InOp, |
5231 | N2: DAG.getVectorIdxConstant(Val: j, DL: dl)); |
5232 | } |
5233 | SDValue UndefVal = DAG.getUNDEF(VT: EltVT); |
5234 | for (; Idx < WidenNumElts; ++Idx) |
5235 | Ops[Idx] = UndefVal; |
5236 | return DAG.getBuildVector(VT: WidenVT, DL: dl, Ops); |
5237 | } |
5238 | |
5239 | SDValue DAGTypeLegalizer::WidenVecRes_INSERT_SUBVECTOR(SDNode *N) { |
5240 | EVT VT = N->getValueType(ResNo: 0); |
5241 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT); |
5242 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 0)); |
5243 | SDValue InOp2 = N->getOperand(Num: 1); |
5244 | SDValue Idx = N->getOperand(Num: 2); |
5245 | SDLoc dl(N); |
5246 | return DAG.getNode(Opcode: ISD::INSERT_SUBVECTOR, DL: dl, VT: WidenVT, N1: InOp1, N2: InOp2, N3: Idx); |
5247 | } |
5248 | |
5249 | SDValue DAGTypeLegalizer::(SDNode *N) { |
5250 | EVT VT = N->getValueType(ResNo: 0); |
5251 | EVT EltVT = VT.getVectorElementType(); |
5252 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT); |
5253 | SDValue InOp = N->getOperand(Num: 0); |
5254 | SDValue Idx = N->getOperand(Num: 1); |
5255 | SDLoc dl(N); |
5256 | |
5257 | auto InOpTypeAction = getTypeAction(VT: InOp.getValueType()); |
5258 | if (InOpTypeAction == TargetLowering::TypeWidenVector) |
5259 | InOp = GetWidenedVector(Op: InOp); |
5260 | |
5261 | EVT InVT = InOp.getValueType(); |
5262 | |
5263 | // Check if we can just return the input vector after widening. |
5264 | uint64_t IdxVal = Idx->getAsZExtVal(); |
5265 | if (IdxVal == 0 && InVT == WidenVT) |
5266 | return InOp; |
5267 | |
5268 | // Check if we can extract from the vector. |
5269 | unsigned WidenNumElts = WidenVT.getVectorMinNumElements(); |
5270 | unsigned InNumElts = InVT.getVectorMinNumElements(); |
5271 | unsigned VTNumElts = VT.getVectorMinNumElements(); |
5272 | assert(IdxVal % VTNumElts == 0 && |
5273 | "Expected Idx to be a multiple of subvector minimum vector length" ); |
5274 | if (IdxVal % WidenNumElts == 0 && IdxVal + WidenNumElts < InNumElts) |
5275 | return DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: WidenVT, N1: InOp, N2: Idx); |
5276 | |
5277 | if (VT.isScalableVector()) { |
5278 | // Try to split the operation up into smaller extracts and concat the |
5279 | // results together, e.g. |
5280 | // nxv6i64 extract_subvector(nxv12i64, 6) |
5281 | // <-> |
5282 | // nxv8i64 concat( |
5283 | // nxv2i64 extract_subvector(nxv16i64, 6) |
5284 | // nxv2i64 extract_subvector(nxv16i64, 8) |
5285 | // nxv2i64 extract_subvector(nxv16i64, 10) |
5286 | // undef) |
5287 | unsigned GCD = std::gcd(m: VTNumElts, n: WidenNumElts); |
5288 | assert((IdxVal % GCD) == 0 && "Expected Idx to be a multiple of the broken " |
5289 | "down type's element count" ); |
5290 | EVT PartVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: EltVT, |
5291 | EC: ElementCount::getScalable(MinVal: GCD)); |
5292 | // Avoid recursion around e.g. nxv1i8. |
5293 | if (getTypeAction(VT: PartVT) != TargetLowering::TypeWidenVector) { |
5294 | SmallVector<SDValue> Parts; |
5295 | unsigned I = 0; |
5296 | for (; I < VTNumElts / GCD; ++I) |
5297 | Parts.push_back( |
5298 | Elt: DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: PartVT, N1: InOp, |
5299 | N2: DAG.getVectorIdxConstant(Val: IdxVal + I * GCD, DL: dl))); |
5300 | for (; I < WidenNumElts / GCD; ++I) |
5301 | Parts.push_back(Elt: DAG.getUNDEF(VT: PartVT)); |
5302 | |
5303 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: WidenVT, Ops: Parts); |
5304 | } |
5305 | |
5306 | report_fatal_error(reason: "Don't know how to widen the result of " |
5307 | "EXTRACT_SUBVECTOR for scalable vectors" ); |
5308 | } |
5309 | |
5310 | // We could try widening the input to the right length but for now, extract |
5311 | // the original elements, fill the rest with undefs and build a vector. |
5312 | SmallVector<SDValue, 16> Ops(WidenNumElts); |
5313 | unsigned i; |
5314 | for (i = 0; i < VTNumElts; ++i) |
5315 | Ops[i] = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: EltVT, N1: InOp, |
5316 | N2: DAG.getVectorIdxConstant(Val: IdxVal + i, DL: dl)); |
5317 | |
5318 | SDValue UndefVal = DAG.getUNDEF(VT: EltVT); |
5319 | for (; i < WidenNumElts; ++i) |
5320 | Ops[i] = UndefVal; |
5321 | return DAG.getBuildVector(VT: WidenVT, DL: dl, Ops); |
5322 | } |
5323 | |
5324 | SDValue DAGTypeLegalizer::WidenVecRes_AssertZext(SDNode *N) { |
5325 | SDValue InOp = ModifyToType( |
5326 | InOp: N->getOperand(Num: 0), |
5327 | NVT: TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)), FillWithZeroes: true); |
5328 | return DAG.getNode(Opcode: ISD::AssertZext, DL: SDLoc(N), VT: InOp.getValueType(), N1: InOp, |
5329 | N2: N->getOperand(Num: 1)); |
5330 | } |
5331 | |
5332 | SDValue DAGTypeLegalizer::WidenVecRes_INSERT_VECTOR_ELT(SDNode *N) { |
5333 | SDValue InOp = GetWidenedVector(Op: N->getOperand(Num: 0)); |
5334 | return DAG.getNode(Opcode: ISD::INSERT_VECTOR_ELT, DL: SDLoc(N), |
5335 | VT: InOp.getValueType(), N1: InOp, |
5336 | N2: N->getOperand(Num: 1), N3: N->getOperand(Num: 2)); |
5337 | } |
5338 | |
5339 | SDValue DAGTypeLegalizer::WidenVecRes_LOAD(SDNode *N) { |
5340 | LoadSDNode *LD = cast<LoadSDNode>(Val: N); |
5341 | ISD::LoadExtType ExtType = LD->getExtensionType(); |
5342 | |
5343 | // A vector must always be stored in memory as-is, i.e. without any padding |
5344 | // between the elements, since various code depend on it, e.g. in the |
5345 | // handling of a bitcast of a vector type to int, which may be done with a |
5346 | // vector store followed by an integer load. A vector that does not have |
5347 | // elements that are byte-sized must therefore be stored as an integer |
5348 | // built out of the extracted vector elements. |
5349 | if (!LD->getMemoryVT().isByteSized()) { |
5350 | SDValue Value, NewChain; |
5351 | std::tie(args&: Value, args&: NewChain) = TLI.scalarizeVectorLoad(LD, DAG); |
5352 | ReplaceValueWith(From: SDValue(LD, 0), To: Value); |
5353 | ReplaceValueWith(From: SDValue(LD, 1), To: NewChain); |
5354 | return SDValue(); |
5355 | } |
5356 | |
5357 | // Generate a vector-predicated load if it is custom/legal on the target. To |
5358 | // avoid possible recursion, only do this if the widened mask type is legal. |
5359 | // FIXME: Not all targets may support EVL in VP_LOAD. These will have been |
5360 | // removed from the IR by the ExpandVectorPredication pass but we're |
5361 | // reintroducing them here. |
5362 | EVT LdVT = LD->getMemoryVT(); |
5363 | EVT WideVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: LdVT); |
5364 | EVT WideMaskVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1, |
5365 | WideVT.getVectorElementCount()); |
5366 | if (ExtType == ISD::NON_EXTLOAD && |
5367 | TLI.isOperationLegalOrCustom(Op: ISD::VP_LOAD, VT: WideVT) && |
5368 | TLI.isTypeLegal(VT: WideMaskVT)) { |
5369 | SDLoc DL(N); |
5370 | SDValue Mask = DAG.getAllOnesConstant(DL, VT: WideMaskVT); |
5371 | SDValue EVL = DAG.getElementCount(DL, VT: TLI.getVPExplicitVectorLengthTy(), |
5372 | EC: LdVT.getVectorElementCount()); |
5373 | const auto *MMO = LD->getMemOperand(); |
5374 | SDValue NewLoad = |
5375 | DAG.getLoadVP(VT: WideVT, dl: DL, Chain: LD->getChain(), Ptr: LD->getBasePtr(), Mask, EVL, |
5376 | PtrInfo: MMO->getPointerInfo(), Alignment: MMO->getAlign(), MMOFlags: MMO->getFlags(), |
5377 | AAInfo: MMO->getAAInfo()); |
5378 | |
5379 | // Modified the chain - switch anything that used the old chain to use |
5380 | // the new one. |
5381 | ReplaceValueWith(From: SDValue(N, 1), To: NewLoad.getValue(R: 1)); |
5382 | |
5383 | return NewLoad; |
5384 | } |
5385 | |
5386 | SDValue Result; |
5387 | SmallVector<SDValue, 16> LdChain; // Chain for the series of load |
5388 | if (ExtType != ISD::NON_EXTLOAD) |
5389 | Result = GenWidenVectorExtLoads(LdChain, LD, ExtType); |
5390 | else |
5391 | Result = GenWidenVectorLoads(LdChain, LD); |
5392 | |
5393 | if (Result) { |
5394 | // If we generate a single load, we can use that for the chain. Otherwise, |
5395 | // build a factor node to remember the multiple loads are independent and |
5396 | // chain to that. |
5397 | SDValue NewChain; |
5398 | if (LdChain.size() == 1) |
5399 | NewChain = LdChain[0]; |
5400 | else |
5401 | NewChain = DAG.getNode(ISD::TokenFactor, SDLoc(LD), MVT::Other, LdChain); |
5402 | |
5403 | // Modified the chain - switch anything that used the old chain to use |
5404 | // the new one. |
5405 | ReplaceValueWith(From: SDValue(N, 1), To: NewChain); |
5406 | |
5407 | return Result; |
5408 | } |
5409 | |
5410 | report_fatal_error(reason: "Unable to widen vector load" ); |
5411 | } |
5412 | |
5413 | SDValue DAGTypeLegalizer::WidenVecRes_VP_LOAD(VPLoadSDNode *N) { |
5414 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
5415 | SDValue Mask = N->getMask(); |
5416 | SDValue EVL = N->getVectorLength(); |
5417 | ISD::LoadExtType ExtType = N->getExtensionType(); |
5418 | SDLoc dl(N); |
5419 | |
5420 | // The mask should be widened as well |
5421 | assert(getTypeAction(Mask.getValueType()) == |
5422 | TargetLowering::TypeWidenVector && |
5423 | "Unable to widen binary VP op" ); |
5424 | Mask = GetWidenedVector(Op: Mask); |
5425 | assert(Mask.getValueType().getVectorElementCount() == |
5426 | TLI.getTypeToTransformTo(*DAG.getContext(), Mask.getValueType()) |
5427 | .getVectorElementCount() && |
5428 | "Unable to widen vector load" ); |
5429 | |
5430 | SDValue Res = |
5431 | DAG.getLoadVP(AM: N->getAddressingMode(), ExtType, VT: WidenVT, dl, Chain: N->getChain(), |
5432 | Ptr: N->getBasePtr(), Offset: N->getOffset(), Mask, EVL, |
5433 | MemVT: N->getMemoryVT(), MMO: N->getMemOperand(), IsExpanding: N->isExpandingLoad()); |
5434 | // Legalize the chain result - switch anything that used the old chain to |
5435 | // use the new one. |
5436 | ReplaceValueWith(From: SDValue(N, 1), To: Res.getValue(R: 1)); |
5437 | return Res; |
5438 | } |
5439 | |
5440 | SDValue DAGTypeLegalizer::WidenVecRes_VP_STRIDED_LOAD(VPStridedLoadSDNode *N) { |
5441 | SDLoc DL(N); |
5442 | |
5443 | // The mask should be widened as well |
5444 | SDValue Mask = N->getMask(); |
5445 | assert(getTypeAction(Mask.getValueType()) == |
5446 | TargetLowering::TypeWidenVector && |
5447 | "Unable to widen VP strided load" ); |
5448 | Mask = GetWidenedVector(Op: Mask); |
5449 | |
5450 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
5451 | assert(Mask.getValueType().getVectorElementCount() == |
5452 | WidenVT.getVectorElementCount() && |
5453 | "Data and mask vectors should have the same number of elements" ); |
5454 | |
5455 | SDValue Res = DAG.getStridedLoadVP( |
5456 | AM: N->getAddressingMode(), ExtType: N->getExtensionType(), VT: WidenVT, DL, Chain: N->getChain(), |
5457 | Ptr: N->getBasePtr(), Offset: N->getOffset(), Stride: N->getStride(), Mask, |
5458 | EVL: N->getVectorLength(), MemVT: N->getMemoryVT(), MMO: N->getMemOperand(), |
5459 | IsExpanding: N->isExpandingLoad()); |
5460 | |
5461 | // Legalize the chain result - switch anything that used the old chain to |
5462 | // use the new one. |
5463 | ReplaceValueWith(From: SDValue(N, 1), To: Res.getValue(R: 1)); |
5464 | return Res; |
5465 | } |
5466 | |
5467 | SDValue DAGTypeLegalizer::WidenVecRes_MLOAD(MaskedLoadSDNode *N) { |
5468 | |
5469 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(),VT: N->getValueType(ResNo: 0)); |
5470 | SDValue Mask = N->getMask(); |
5471 | EVT MaskVT = Mask.getValueType(); |
5472 | SDValue PassThru = GetWidenedVector(Op: N->getPassThru()); |
5473 | ISD::LoadExtType ExtType = N->getExtensionType(); |
5474 | SDLoc dl(N); |
5475 | |
5476 | // The mask should be widened as well |
5477 | EVT WideMaskVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
5478 | VT: MaskVT.getVectorElementType(), |
5479 | NumElements: WidenVT.getVectorNumElements()); |
5480 | Mask = ModifyToType(InOp: Mask, NVT: WideMaskVT, FillWithZeroes: true); |
5481 | |
5482 | SDValue Res = DAG.getMaskedLoad( |
5483 | VT: WidenVT, dl, Chain: N->getChain(), Base: N->getBasePtr(), Offset: N->getOffset(), Mask, |
5484 | Src0: PassThru, MemVT: N->getMemoryVT(), MMO: N->getMemOperand(), AM: N->getAddressingMode(), |
5485 | ExtType, IsExpanding: N->isExpandingLoad()); |
5486 | // Legalize the chain result - switch anything that used the old chain to |
5487 | // use the new one. |
5488 | ReplaceValueWith(From: SDValue(N, 1), To: Res.getValue(R: 1)); |
5489 | return Res; |
5490 | } |
5491 | |
5492 | SDValue DAGTypeLegalizer::WidenVecRes_MGATHER(MaskedGatherSDNode *N) { |
5493 | |
5494 | EVT WideVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
5495 | SDValue Mask = N->getMask(); |
5496 | EVT MaskVT = Mask.getValueType(); |
5497 | SDValue PassThru = GetWidenedVector(Op: N->getPassThru()); |
5498 | SDValue Scale = N->getScale(); |
5499 | unsigned NumElts = WideVT.getVectorNumElements(); |
5500 | SDLoc dl(N); |
5501 | |
5502 | // The mask should be widened as well |
5503 | EVT WideMaskVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
5504 | VT: MaskVT.getVectorElementType(), |
5505 | NumElements: WideVT.getVectorNumElements()); |
5506 | Mask = ModifyToType(InOp: Mask, NVT: WideMaskVT, FillWithZeroes: true); |
5507 | |
5508 | // Widen the Index operand |
5509 | SDValue Index = N->getIndex(); |
5510 | EVT WideIndexVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
5511 | VT: Index.getValueType().getScalarType(), |
5512 | NumElements: NumElts); |
5513 | Index = ModifyToType(InOp: Index, NVT: WideIndexVT); |
5514 | SDValue Ops[] = { N->getChain(), PassThru, Mask, N->getBasePtr(), Index, |
5515 | Scale }; |
5516 | |
5517 | // Widen the MemoryType |
5518 | EVT WideMemVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
5519 | VT: N->getMemoryVT().getScalarType(), NumElements: NumElts); |
5520 | SDValue Res = DAG.getMaskedGather(DAG.getVTList(WideVT, MVT::Other), |
5521 | WideMemVT, dl, Ops, N->getMemOperand(), |
5522 | N->getIndexType(), N->getExtensionType()); |
5523 | |
5524 | // Legalize the chain result - switch anything that used the old chain to |
5525 | // use the new one. |
5526 | ReplaceValueWith(From: SDValue(N, 1), To: Res.getValue(R: 1)); |
5527 | return Res; |
5528 | } |
5529 | |
5530 | SDValue DAGTypeLegalizer::WidenVecRes_VP_GATHER(VPGatherSDNode *N) { |
5531 | EVT WideVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
5532 | SDValue Mask = N->getMask(); |
5533 | SDValue Scale = N->getScale(); |
5534 | ElementCount WideEC = WideVT.getVectorElementCount(); |
5535 | SDLoc dl(N); |
5536 | |
5537 | SDValue Index = GetWidenedVector(Op: N->getIndex()); |
5538 | EVT WideMemVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
5539 | VT: N->getMemoryVT().getScalarType(), EC: WideEC); |
5540 | Mask = GetWidenedMask(Mask, EC: WideEC); |
5541 | |
5542 | SDValue Ops[] = {N->getChain(), N->getBasePtr(), Index, Scale, |
5543 | Mask, N->getVectorLength()}; |
5544 | SDValue Res = DAG.getGatherVP(DAG.getVTList(WideVT, MVT::Other), WideMemVT, |
5545 | dl, Ops, N->getMemOperand(), N->getIndexType()); |
5546 | |
5547 | // Legalize the chain result - switch anything that used the old chain to |
5548 | // use the new one. |
5549 | ReplaceValueWith(From: SDValue(N, 1), To: Res.getValue(R: 1)); |
5550 | return Res; |
5551 | } |
5552 | |
5553 | SDValue DAGTypeLegalizer::WidenVecRes_ScalarOp(SDNode *N) { |
5554 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
5555 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: WidenVT, Operand: N->getOperand(Num: 0)); |
5556 | } |
5557 | |
5558 | // Return true is this is a SETCC node or a strict version of it. |
5559 | static inline bool isSETCCOp(unsigned Opcode) { |
5560 | switch (Opcode) { |
5561 | case ISD::SETCC: |
5562 | case ISD::STRICT_FSETCC: |
5563 | case ISD::STRICT_FSETCCS: |
5564 | return true; |
5565 | } |
5566 | return false; |
5567 | } |
5568 | |
5569 | // Return true if this is a node that could have two SETCCs as operands. |
5570 | static inline bool isLogicalMaskOp(unsigned Opcode) { |
5571 | switch (Opcode) { |
5572 | case ISD::AND: |
5573 | case ISD::OR: |
5574 | case ISD::XOR: |
5575 | return true; |
5576 | } |
5577 | return false; |
5578 | } |
5579 | |
5580 | // If N is a SETCC or a strict variant of it, return the type |
5581 | // of the compare operands. |
5582 | static inline EVT getSETCCOperandType(SDValue N) { |
5583 | unsigned OpNo = N->isStrictFPOpcode() ? 1 : 0; |
5584 | return N->getOperand(Num: OpNo).getValueType(); |
5585 | } |
5586 | |
5587 | // This is used just for the assert in convertMask(). Check that this either |
5588 | // a SETCC or a previously handled SETCC by convertMask(). |
5589 | #ifndef NDEBUG |
5590 | static inline bool isSETCCorConvertedSETCC(SDValue N) { |
5591 | if (N.getOpcode() == ISD::EXTRACT_SUBVECTOR) |
5592 | N = N.getOperand(i: 0); |
5593 | else if (N.getOpcode() == ISD::CONCAT_VECTORS) { |
5594 | for (unsigned i = 1; i < N->getNumOperands(); ++i) |
5595 | if (!N->getOperand(Num: i)->isUndef()) |
5596 | return false; |
5597 | N = N.getOperand(i: 0); |
5598 | } |
5599 | |
5600 | if (N.getOpcode() == ISD::TRUNCATE) |
5601 | N = N.getOperand(i: 0); |
5602 | else if (N.getOpcode() == ISD::SIGN_EXTEND) |
5603 | N = N.getOperand(i: 0); |
5604 | |
5605 | if (isLogicalMaskOp(Opcode: N.getOpcode())) |
5606 | return isSETCCorConvertedSETCC(N: N.getOperand(i: 0)) && |
5607 | isSETCCorConvertedSETCC(N: N.getOperand(i: 1)); |
5608 | |
5609 | return (isSETCCOp(Opcode: N.getOpcode()) || |
5610 | ISD::isBuildVectorOfConstantSDNodes(N: N.getNode())); |
5611 | } |
5612 | #endif |
5613 | |
5614 | // Return a mask of vector type MaskVT to replace InMask. Also adjust MaskVT |
5615 | // to ToMaskVT if needed with vector extension or truncation. |
5616 | SDValue DAGTypeLegalizer::convertMask(SDValue InMask, EVT MaskVT, |
5617 | EVT ToMaskVT) { |
5618 | // Currently a SETCC or a AND/OR/XOR with two SETCCs are handled. |
5619 | // FIXME: This code seems to be too restrictive, we might consider |
5620 | // generalizing it or dropping it. |
5621 | assert(isSETCCorConvertedSETCC(InMask) && "Unexpected mask argument." ); |
5622 | |
5623 | // Make a new Mask node, with a legal result VT. |
5624 | SDValue Mask; |
5625 | SmallVector<SDValue, 4> Ops; |
5626 | for (unsigned i = 0, e = InMask->getNumOperands(); i < e; ++i) |
5627 | Ops.push_back(Elt: InMask->getOperand(Num: i)); |
5628 | if (InMask->isStrictFPOpcode()) { |
5629 | Mask = DAG.getNode(InMask->getOpcode(), SDLoc(InMask), |
5630 | { MaskVT, MVT::Other }, Ops); |
5631 | ReplaceValueWith(From: InMask.getValue(R: 1), To: Mask.getValue(R: 1)); |
5632 | } |
5633 | else |
5634 | Mask = DAG.getNode(Opcode: InMask->getOpcode(), DL: SDLoc(InMask), VT: MaskVT, Ops); |
5635 | |
5636 | // If MaskVT has smaller or bigger elements than ToMaskVT, a vector sign |
5637 | // extend or truncate is needed. |
5638 | LLVMContext &Ctx = *DAG.getContext(); |
5639 | unsigned MaskScalarBits = MaskVT.getScalarSizeInBits(); |
5640 | unsigned ToMaskScalBits = ToMaskVT.getScalarSizeInBits(); |
5641 | if (MaskScalarBits < ToMaskScalBits) { |
5642 | EVT ExtVT = EVT::getVectorVT(Context&: Ctx, VT: ToMaskVT.getVectorElementType(), |
5643 | NumElements: MaskVT.getVectorNumElements()); |
5644 | Mask = DAG.getNode(Opcode: ISD::SIGN_EXTEND, DL: SDLoc(Mask), VT: ExtVT, Operand: Mask); |
5645 | } else if (MaskScalarBits > ToMaskScalBits) { |
5646 | EVT TruncVT = EVT::getVectorVT(Context&: Ctx, VT: ToMaskVT.getVectorElementType(), |
5647 | NumElements: MaskVT.getVectorNumElements()); |
5648 | Mask = DAG.getNode(Opcode: ISD::TRUNCATE, DL: SDLoc(Mask), VT: TruncVT, Operand: Mask); |
5649 | } |
5650 | |
5651 | assert(Mask->getValueType(0).getScalarSizeInBits() == |
5652 | ToMaskVT.getScalarSizeInBits() && |
5653 | "Mask should have the right element size by now." ); |
5654 | |
5655 | // Adjust Mask to the right number of elements. |
5656 | unsigned CurrMaskNumEls = Mask->getValueType(ResNo: 0).getVectorNumElements(); |
5657 | if (CurrMaskNumEls > ToMaskVT.getVectorNumElements()) { |
5658 | SDValue ZeroIdx = DAG.getVectorIdxConstant(Val: 0, DL: SDLoc(Mask)); |
5659 | Mask = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: SDLoc(Mask), VT: ToMaskVT, N1: Mask, |
5660 | N2: ZeroIdx); |
5661 | } else if (CurrMaskNumEls < ToMaskVT.getVectorNumElements()) { |
5662 | unsigned NumSubVecs = (ToMaskVT.getVectorNumElements() / CurrMaskNumEls); |
5663 | EVT SubVT = Mask->getValueType(ResNo: 0); |
5664 | SmallVector<SDValue, 16> SubOps(NumSubVecs, DAG.getUNDEF(VT: SubVT)); |
5665 | SubOps[0] = Mask; |
5666 | Mask = DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: SDLoc(Mask), VT: ToMaskVT, Ops: SubOps); |
5667 | } |
5668 | |
5669 | assert((Mask->getValueType(0) == ToMaskVT) && |
5670 | "A mask of ToMaskVT should have been produced by now." ); |
5671 | |
5672 | return Mask; |
5673 | } |
5674 | |
5675 | // This method tries to handle some special cases for the vselect mask |
5676 | // and if needed adjusting the mask vector type to match that of the VSELECT. |
5677 | // Without it, many cases end up with scalarization of the SETCC, with many |
5678 | // unnecessary instructions. |
5679 | SDValue DAGTypeLegalizer::WidenVSELECTMask(SDNode *N) { |
5680 | LLVMContext &Ctx = *DAG.getContext(); |
5681 | SDValue Cond = N->getOperand(Num: 0); |
5682 | |
5683 | if (N->getOpcode() != ISD::VSELECT) |
5684 | return SDValue(); |
5685 | |
5686 | if (!isSETCCOp(Opcode: Cond->getOpcode()) && !isLogicalMaskOp(Opcode: Cond->getOpcode())) |
5687 | return SDValue(); |
5688 | |
5689 | // If this is a splitted VSELECT that was previously already handled, do |
5690 | // nothing. |
5691 | EVT CondVT = Cond->getValueType(ResNo: 0); |
5692 | if (CondVT.getScalarSizeInBits() != 1) |
5693 | return SDValue(); |
5694 | |
5695 | EVT VSelVT = N->getValueType(ResNo: 0); |
5696 | |
5697 | // This method can't handle scalable vector types. |
5698 | // FIXME: This support could be added in the future. |
5699 | if (VSelVT.isScalableVector()) |
5700 | return SDValue(); |
5701 | |
5702 | // Only handle vector types which are a power of 2. |
5703 | if (!isPowerOf2_64(Value: VSelVT.getSizeInBits())) |
5704 | return SDValue(); |
5705 | |
5706 | // Don't touch if this will be scalarized. |
5707 | EVT FinalVT = VSelVT; |
5708 | while (getTypeAction(VT: FinalVT) == TargetLowering::TypeSplitVector) |
5709 | FinalVT = FinalVT.getHalfNumVectorElementsVT(Context&: Ctx); |
5710 | |
5711 | if (FinalVT.getVectorNumElements() == 1) |
5712 | return SDValue(); |
5713 | |
5714 | // If there is support for an i1 vector mask, don't touch. |
5715 | if (isSETCCOp(Opcode: Cond.getOpcode())) { |
5716 | EVT SetCCOpVT = getSETCCOperandType(N: Cond); |
5717 | while (TLI.getTypeAction(Context&: Ctx, VT: SetCCOpVT) != TargetLowering::TypeLegal) |
5718 | SetCCOpVT = TLI.getTypeToTransformTo(Context&: Ctx, VT: SetCCOpVT); |
5719 | EVT SetCCResVT = getSetCCResultType(VT: SetCCOpVT); |
5720 | if (SetCCResVT.getScalarSizeInBits() == 1) |
5721 | return SDValue(); |
5722 | } else if (CondVT.getScalarType() == MVT::i1) { |
5723 | // If there is support for an i1 vector mask (or only scalar i1 conditions), |
5724 | // don't touch. |
5725 | while (TLI.getTypeAction(Context&: Ctx, VT: CondVT) != TargetLowering::TypeLegal) |
5726 | CondVT = TLI.getTypeToTransformTo(Context&: Ctx, VT: CondVT); |
5727 | |
5728 | if (CondVT.getScalarType() == MVT::i1) |
5729 | return SDValue(); |
5730 | } |
5731 | |
5732 | // Widen the vselect result type if needed. |
5733 | if (getTypeAction(VT: VSelVT) == TargetLowering::TypeWidenVector) |
5734 | VSelVT = TLI.getTypeToTransformTo(Context&: Ctx, VT: VSelVT); |
5735 | |
5736 | // The mask of the VSELECT should have integer elements. |
5737 | EVT ToMaskVT = VSelVT; |
5738 | if (!ToMaskVT.getScalarType().isInteger()) |
5739 | ToMaskVT = ToMaskVT.changeVectorElementTypeToInteger(); |
5740 | |
5741 | SDValue Mask; |
5742 | if (isSETCCOp(Opcode: Cond->getOpcode())) { |
5743 | EVT MaskVT = getSetCCResultType(VT: getSETCCOperandType(N: Cond)); |
5744 | Mask = convertMask(InMask: Cond, MaskVT, ToMaskVT); |
5745 | } else if (isLogicalMaskOp(Opcode: Cond->getOpcode()) && |
5746 | isSETCCOp(Opcode: Cond->getOperand(Num: 0).getOpcode()) && |
5747 | isSETCCOp(Opcode: Cond->getOperand(Num: 1).getOpcode())) { |
5748 | // Cond is (AND/OR/XOR (SETCC, SETCC)) |
5749 | SDValue SETCC0 = Cond->getOperand(Num: 0); |
5750 | SDValue SETCC1 = Cond->getOperand(Num: 1); |
5751 | EVT VT0 = getSetCCResultType(VT: getSETCCOperandType(N: SETCC0)); |
5752 | EVT VT1 = getSetCCResultType(VT: getSETCCOperandType(N: SETCC1)); |
5753 | unsigned ScalarBits0 = VT0.getScalarSizeInBits(); |
5754 | unsigned ScalarBits1 = VT1.getScalarSizeInBits(); |
5755 | unsigned ScalarBits_ToMask = ToMaskVT.getScalarSizeInBits(); |
5756 | EVT MaskVT; |
5757 | // If the two SETCCs have different VTs, either extend/truncate one of |
5758 | // them to the other "towards" ToMaskVT, or truncate one and extend the |
5759 | // other to ToMaskVT. |
5760 | if (ScalarBits0 != ScalarBits1) { |
5761 | EVT NarrowVT = ((ScalarBits0 < ScalarBits1) ? VT0 : VT1); |
5762 | EVT WideVT = ((NarrowVT == VT0) ? VT1 : VT0); |
5763 | if (ScalarBits_ToMask >= WideVT.getScalarSizeInBits()) |
5764 | MaskVT = WideVT; |
5765 | else if (ScalarBits_ToMask <= NarrowVT.getScalarSizeInBits()) |
5766 | MaskVT = NarrowVT; |
5767 | else |
5768 | MaskVT = ToMaskVT; |
5769 | } else |
5770 | // If the two SETCCs have the same VT, don't change it. |
5771 | MaskVT = VT0; |
5772 | |
5773 | // Make new SETCCs and logical nodes. |
5774 | SETCC0 = convertMask(InMask: SETCC0, MaskVT: VT0, ToMaskVT: MaskVT); |
5775 | SETCC1 = convertMask(InMask: SETCC1, MaskVT: VT1, ToMaskVT: MaskVT); |
5776 | Cond = DAG.getNode(Opcode: Cond->getOpcode(), DL: SDLoc(Cond), VT: MaskVT, N1: SETCC0, N2: SETCC1); |
5777 | |
5778 | // Convert the logical op for VSELECT if needed. |
5779 | Mask = convertMask(InMask: Cond, MaskVT, ToMaskVT); |
5780 | } else |
5781 | return SDValue(); |
5782 | |
5783 | return Mask; |
5784 | } |
5785 | |
5786 | SDValue DAGTypeLegalizer::WidenVecRes_Select(SDNode *N) { |
5787 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
5788 | ElementCount WidenEC = WidenVT.getVectorElementCount(); |
5789 | |
5790 | SDValue Cond1 = N->getOperand(Num: 0); |
5791 | EVT CondVT = Cond1.getValueType(); |
5792 | unsigned Opcode = N->getOpcode(); |
5793 | if (CondVT.isVector()) { |
5794 | if (SDValue WideCond = WidenVSELECTMask(N)) { |
5795 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 1)); |
5796 | SDValue InOp2 = GetWidenedVector(Op: N->getOperand(Num: 2)); |
5797 | assert(InOp1.getValueType() == WidenVT && InOp2.getValueType() == WidenVT); |
5798 | return DAG.getNode(Opcode, DL: SDLoc(N), VT: WidenVT, N1: WideCond, N2: InOp1, N3: InOp2); |
5799 | } |
5800 | |
5801 | EVT CondEltVT = CondVT.getVectorElementType(); |
5802 | EVT CondWidenVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: CondEltVT, EC: WidenEC); |
5803 | if (getTypeAction(VT: CondVT) == TargetLowering::TypeWidenVector) |
5804 | Cond1 = GetWidenedVector(Op: Cond1); |
5805 | |
5806 | // If we have to split the condition there is no point in widening the |
5807 | // select. This would result in an cycle of widening the select -> |
5808 | // widening the condition operand -> splitting the condition operand -> |
5809 | // splitting the select -> widening the select. Instead split this select |
5810 | // further and widen the resulting type. |
5811 | if (getTypeAction(VT: CondVT) == TargetLowering::TypeSplitVector) { |
5812 | SDValue SplitSelect = SplitVecOp_VSELECT(N, OpNo: 0); |
5813 | SDValue Res = ModifyToType(InOp: SplitSelect, NVT: WidenVT); |
5814 | return Res; |
5815 | } |
5816 | |
5817 | if (Cond1.getValueType() != CondWidenVT) |
5818 | Cond1 = ModifyToType(InOp: Cond1, NVT: CondWidenVT); |
5819 | } |
5820 | |
5821 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 1)); |
5822 | SDValue InOp2 = GetWidenedVector(Op: N->getOperand(Num: 2)); |
5823 | assert(InOp1.getValueType() == WidenVT && InOp2.getValueType() == WidenVT); |
5824 | if (Opcode == ISD::VP_SELECT || Opcode == ISD::VP_MERGE) |
5825 | return DAG.getNode(Opcode, DL: SDLoc(N), VT: WidenVT, N1: Cond1, N2: InOp1, N3: InOp2, |
5826 | N4: N->getOperand(Num: 3)); |
5827 | return DAG.getNode(Opcode, DL: SDLoc(N), VT: WidenVT, N1: Cond1, N2: InOp1, N3: InOp2); |
5828 | } |
5829 | |
5830 | SDValue DAGTypeLegalizer::WidenVecRes_SELECT_CC(SDNode *N) { |
5831 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 2)); |
5832 | SDValue InOp2 = GetWidenedVector(Op: N->getOperand(Num: 3)); |
5833 | return DAG.getNode(Opcode: ISD::SELECT_CC, DL: SDLoc(N), |
5834 | VT: InOp1.getValueType(), N1: N->getOperand(Num: 0), |
5835 | N2: N->getOperand(Num: 1), N3: InOp1, N4: InOp2, N5: N->getOperand(Num: 4)); |
5836 | } |
5837 | |
5838 | SDValue DAGTypeLegalizer::WidenVecRes_UNDEF(SDNode *N) { |
5839 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
5840 | return DAG.getUNDEF(VT: WidenVT); |
5841 | } |
5842 | |
5843 | SDValue DAGTypeLegalizer::WidenVecRes_VECTOR_SHUFFLE(ShuffleVectorSDNode *N) { |
5844 | EVT VT = N->getValueType(ResNo: 0); |
5845 | SDLoc dl(N); |
5846 | |
5847 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT); |
5848 | unsigned NumElts = VT.getVectorNumElements(); |
5849 | unsigned WidenNumElts = WidenVT.getVectorNumElements(); |
5850 | |
5851 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 0)); |
5852 | SDValue InOp2 = GetWidenedVector(Op: N->getOperand(Num: 1)); |
5853 | |
5854 | // Adjust mask based on new input vector length. |
5855 | SmallVector<int, 16> NewMask; |
5856 | for (unsigned i = 0; i != NumElts; ++i) { |
5857 | int Idx = N->getMaskElt(Idx: i); |
5858 | if (Idx < (int)NumElts) |
5859 | NewMask.push_back(Elt: Idx); |
5860 | else |
5861 | NewMask.push_back(Elt: Idx - NumElts + WidenNumElts); |
5862 | } |
5863 | for (unsigned i = NumElts; i != WidenNumElts; ++i) |
5864 | NewMask.push_back(Elt: -1); |
5865 | return DAG.getVectorShuffle(VT: WidenVT, dl, N1: InOp1, N2: InOp2, Mask: NewMask); |
5866 | } |
5867 | |
5868 | SDValue DAGTypeLegalizer::WidenVecRes_VECTOR_REVERSE(SDNode *N) { |
5869 | EVT VT = N->getValueType(ResNo: 0); |
5870 | EVT EltVT = VT.getVectorElementType(); |
5871 | SDLoc dl(N); |
5872 | |
5873 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT); |
5874 | SDValue OpValue = GetWidenedVector(Op: N->getOperand(Num: 0)); |
5875 | assert(WidenVT == OpValue.getValueType() && "Unexpected widened vector type" ); |
5876 | |
5877 | SDValue ReverseVal = DAG.getNode(Opcode: ISD::VECTOR_REVERSE, DL: dl, VT: WidenVT, Operand: OpValue); |
5878 | unsigned WidenNumElts = WidenVT.getVectorMinNumElements(); |
5879 | unsigned VTNumElts = VT.getVectorMinNumElements(); |
5880 | unsigned IdxVal = WidenNumElts - VTNumElts; |
5881 | |
5882 | if (VT.isScalableVector()) { |
5883 | // Try to split the 'Widen ReverseVal' into smaller extracts and concat the |
5884 | // results together, e.g.(nxv6i64 -> nxv8i64) |
5885 | // nxv8i64 vector_reverse |
5886 | // <-> |
5887 | // nxv8i64 concat( |
5888 | // nxv2i64 extract_subvector(nxv8i64, 2) |
5889 | // nxv2i64 extract_subvector(nxv8i64, 4) |
5890 | // nxv2i64 extract_subvector(nxv8i64, 6) |
5891 | // nxv2i64 undef) |
5892 | |
5893 | unsigned GCD = std::gcd(m: VTNumElts, n: WidenNumElts); |
5894 | EVT PartVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: EltVT, |
5895 | EC: ElementCount::getScalable(MinVal: GCD)); |
5896 | assert((IdxVal % GCD) == 0 && "Expected Idx to be a multiple of the broken " |
5897 | "down type's element count" ); |
5898 | SmallVector<SDValue> Parts; |
5899 | unsigned i = 0; |
5900 | for (; i < VTNumElts / GCD; ++i) |
5901 | Parts.push_back( |
5902 | Elt: DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: PartVT, N1: ReverseVal, |
5903 | N2: DAG.getVectorIdxConstant(Val: IdxVal + i * GCD, DL: dl))); |
5904 | for (; i < WidenNumElts / GCD; ++i) |
5905 | Parts.push_back(Elt: DAG.getUNDEF(VT: PartVT)); |
5906 | |
5907 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: WidenVT, Ops: Parts); |
5908 | } |
5909 | |
5910 | // Use VECTOR_SHUFFLE to combine new vector from 'ReverseVal' for |
5911 | // fixed-vectors. |
5912 | SmallVector<int, 16> Mask; |
5913 | for (unsigned i = 0; i != VTNumElts; ++i) { |
5914 | Mask.push_back(Elt: IdxVal + i); |
5915 | } |
5916 | for (unsigned i = VTNumElts; i != WidenNumElts; ++i) |
5917 | Mask.push_back(Elt: -1); |
5918 | |
5919 | return DAG.getVectorShuffle(VT: WidenVT, dl, N1: ReverseVal, N2: DAG.getUNDEF(VT: WidenVT), |
5920 | Mask); |
5921 | } |
5922 | |
5923 | SDValue DAGTypeLegalizer::WidenVecRes_SETCC(SDNode *N) { |
5924 | assert(N->getValueType(0).isVector() && |
5925 | N->getOperand(0).getValueType().isVector() && |
5926 | "Operands must be vectors" ); |
5927 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: N->getValueType(ResNo: 0)); |
5928 | ElementCount WidenEC = WidenVT.getVectorElementCount(); |
5929 | |
5930 | SDValue InOp1 = N->getOperand(Num: 0); |
5931 | EVT InVT = InOp1.getValueType(); |
5932 | assert(InVT.isVector() && "can not widen non-vector type" ); |
5933 | EVT WidenInVT = |
5934 | EVT::getVectorVT(Context&: *DAG.getContext(), VT: InVT.getVectorElementType(), EC: WidenEC); |
5935 | |
5936 | // The input and output types often differ here, and it could be that while |
5937 | // we'd prefer to widen the result type, the input operands have been split. |
5938 | // In this case, we also need to split the result of this node as well. |
5939 | if (getTypeAction(VT: InVT) == TargetLowering::TypeSplitVector) { |
5940 | SDValue SplitVSetCC = SplitVecOp_VSETCC(N); |
5941 | SDValue Res = ModifyToType(InOp: SplitVSetCC, NVT: WidenVT); |
5942 | return Res; |
5943 | } |
5944 | |
5945 | // If the inputs also widen, handle them directly. Otherwise widen by hand. |
5946 | SDValue InOp2 = N->getOperand(Num: 1); |
5947 | if (getTypeAction(VT: InVT) == TargetLowering::TypeWidenVector) { |
5948 | InOp1 = GetWidenedVector(Op: InOp1); |
5949 | InOp2 = GetWidenedVector(Op: InOp2); |
5950 | } else { |
5951 | InOp1 = DAG.WidenVector(N: InOp1, DL: SDLoc(N)); |
5952 | InOp2 = DAG.WidenVector(N: InOp2, DL: SDLoc(N)); |
5953 | } |
5954 | |
5955 | // Assume that the input and output will be widen appropriately. If not, |
5956 | // we will have to unroll it at some point. |
5957 | assert(InOp1.getValueType() == WidenInVT && |
5958 | InOp2.getValueType() == WidenInVT && |
5959 | "Input not widened to expected type!" ); |
5960 | (void)WidenInVT; |
5961 | if (N->getOpcode() == ISD::VP_SETCC) { |
5962 | SDValue Mask = |
5963 | GetWidenedMask(Mask: N->getOperand(Num: 3), EC: WidenVT.getVectorElementCount()); |
5964 | return DAG.getNode(Opcode: ISD::VP_SETCC, DL: SDLoc(N), VT: WidenVT, N1: InOp1, N2: InOp2, |
5965 | N3: N->getOperand(Num: 2), N4: Mask, N5: N->getOperand(Num: 4)); |
5966 | } |
5967 | return DAG.getNode(Opcode: ISD::SETCC, DL: SDLoc(N), VT: WidenVT, N1: InOp1, N2: InOp2, |
5968 | N3: N->getOperand(Num: 2)); |
5969 | } |
5970 | |
5971 | SDValue DAGTypeLegalizer::WidenVecRes_STRICT_FSETCC(SDNode *N) { |
5972 | assert(N->getValueType(0).isVector() && |
5973 | N->getOperand(1).getValueType().isVector() && |
5974 | "Operands must be vectors" ); |
5975 | EVT VT = N->getValueType(ResNo: 0); |
5976 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT); |
5977 | unsigned WidenNumElts = WidenVT.getVectorNumElements(); |
5978 | unsigned NumElts = VT.getVectorNumElements(); |
5979 | EVT EltVT = VT.getVectorElementType(); |
5980 | |
5981 | SDLoc dl(N); |
5982 | SDValue Chain = N->getOperand(Num: 0); |
5983 | SDValue LHS = N->getOperand(Num: 1); |
5984 | SDValue RHS = N->getOperand(Num: 2); |
5985 | SDValue CC = N->getOperand(Num: 3); |
5986 | EVT TmpEltVT = LHS.getValueType().getVectorElementType(); |
5987 | |
5988 | // Fully unroll and reassemble. |
5989 | SmallVector<SDValue, 8> Scalars(WidenNumElts, DAG.getUNDEF(VT: EltVT)); |
5990 | SmallVector<SDValue, 8> Chains(NumElts); |
5991 | for (unsigned i = 0; i != NumElts; ++i) { |
5992 | SDValue LHSElem = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: TmpEltVT, N1: LHS, |
5993 | N2: DAG.getVectorIdxConstant(Val: i, DL: dl)); |
5994 | SDValue RHSElem = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: TmpEltVT, N1: RHS, |
5995 | N2: DAG.getVectorIdxConstant(Val: i, DL: dl)); |
5996 | |
5997 | Scalars[i] = DAG.getNode(N->getOpcode(), dl, {MVT::i1, MVT::Other}, |
5998 | {Chain, LHSElem, RHSElem, CC}); |
5999 | Chains[i] = Scalars[i].getValue(R: 1); |
6000 | Scalars[i] = DAG.getSelect(DL: dl, VT: EltVT, Cond: Scalars[i], |
6001 | LHS: DAG.getBoolConstant(V: true, DL: dl, VT: EltVT, OpVT: VT), |
6002 | RHS: DAG.getBoolConstant(V: false, DL: dl, VT: EltVT, OpVT: VT)); |
6003 | } |
6004 | |
6005 | SDValue NewChain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Chains); |
6006 | ReplaceValueWith(From: SDValue(N, 1), To: NewChain); |
6007 | |
6008 | return DAG.getBuildVector(VT: WidenVT, DL: dl, Ops: Scalars); |
6009 | } |
6010 | |
6011 | //===----------------------------------------------------------------------===// |
6012 | // Widen Vector Operand |
6013 | //===----------------------------------------------------------------------===// |
6014 | bool DAGTypeLegalizer::WidenVectorOperand(SDNode *N, unsigned OpNo) { |
6015 | LLVM_DEBUG(dbgs() << "Widen node operand " << OpNo << ": " ; N->dump(&DAG)); |
6016 | SDValue Res = SDValue(); |
6017 | |
6018 | // See if the target wants to custom widen this node. |
6019 | if (CustomLowerNode(N, VT: N->getOperand(Num: OpNo).getValueType(), LegalizeResult: false)) |
6020 | return false; |
6021 | |
6022 | switch (N->getOpcode()) { |
6023 | default: |
6024 | #ifndef NDEBUG |
6025 | dbgs() << "WidenVectorOperand op #" << OpNo << ": " ; |
6026 | N->dump(G: &DAG); |
6027 | dbgs() << "\n" ; |
6028 | #endif |
6029 | report_fatal_error(reason: "Do not know how to widen this operator's operand!" ); |
6030 | |
6031 | case ISD::BITCAST: Res = WidenVecOp_BITCAST(N); break; |
6032 | case ISD::CONCAT_VECTORS: Res = WidenVecOp_CONCAT_VECTORS(N); break; |
6033 | case ISD::INSERT_SUBVECTOR: Res = WidenVecOp_INSERT_SUBVECTOR(N); break; |
6034 | case ISD::EXTRACT_SUBVECTOR: Res = WidenVecOp_EXTRACT_SUBVECTOR(N); break; |
6035 | case ISD::EXTRACT_VECTOR_ELT: Res = WidenVecOp_EXTRACT_VECTOR_ELT(N); break; |
6036 | case ISD::STORE: Res = WidenVecOp_STORE(N); break; |
6037 | case ISD::VP_STORE: Res = WidenVecOp_VP_STORE(N, OpNo); break; |
6038 | case ISD::EXPERIMENTAL_VP_STRIDED_STORE: |
6039 | Res = WidenVecOp_VP_STRIDED_STORE(N, OpNo); |
6040 | break; |
6041 | case ISD::ANY_EXTEND_VECTOR_INREG: |
6042 | case ISD::SIGN_EXTEND_VECTOR_INREG: |
6043 | case ISD::ZERO_EXTEND_VECTOR_INREG: |
6044 | Res = WidenVecOp_EXTEND_VECTOR_INREG(N); |
6045 | break; |
6046 | case ISD::MSTORE: Res = WidenVecOp_MSTORE(N, OpNo); break; |
6047 | case ISD::MGATHER: Res = WidenVecOp_MGATHER(N, OpNo); break; |
6048 | case ISD::MSCATTER: Res = WidenVecOp_MSCATTER(N, OpNo); break; |
6049 | case ISD::VP_SCATTER: Res = WidenVecOp_VP_SCATTER(N, OpNo); break; |
6050 | case ISD::SETCC: Res = WidenVecOp_SETCC(N); break; |
6051 | case ISD::STRICT_FSETCC: |
6052 | case ISD::STRICT_FSETCCS: Res = WidenVecOp_STRICT_FSETCC(N); break; |
6053 | case ISD::VSELECT: Res = WidenVecOp_VSELECT(N); break; |
6054 | case ISD::FLDEXP: |
6055 | case ISD::FCOPYSIGN: |
6056 | case ISD::LRINT: |
6057 | case ISD::LLRINT: |
6058 | Res = WidenVecOp_UnrollVectorOp(N); |
6059 | break; |
6060 | case ISD::IS_FPCLASS: Res = WidenVecOp_IS_FPCLASS(N); break; |
6061 | |
6062 | case ISD::ANY_EXTEND: |
6063 | case ISD::SIGN_EXTEND: |
6064 | case ISD::ZERO_EXTEND: |
6065 | Res = WidenVecOp_EXTEND(N); |
6066 | break; |
6067 | |
6068 | case ISD::FP_EXTEND: |
6069 | case ISD::STRICT_FP_EXTEND: |
6070 | case ISD::FP_ROUND: |
6071 | case ISD::STRICT_FP_ROUND: |
6072 | case ISD::FP_TO_SINT: |
6073 | case ISD::STRICT_FP_TO_SINT: |
6074 | case ISD::FP_TO_UINT: |
6075 | case ISD::STRICT_FP_TO_UINT: |
6076 | case ISD::SINT_TO_FP: |
6077 | case ISD::STRICT_SINT_TO_FP: |
6078 | case ISD::UINT_TO_FP: |
6079 | case ISD::STRICT_UINT_TO_FP: |
6080 | case ISD::TRUNCATE: |
6081 | Res = WidenVecOp_Convert(N); |
6082 | break; |
6083 | |
6084 | case ISD::FP_TO_SINT_SAT: |
6085 | case ISD::FP_TO_UINT_SAT: |
6086 | Res = WidenVecOp_FP_TO_XINT_SAT(N); |
6087 | break; |
6088 | |
6089 | case ISD::VECREDUCE_FADD: |
6090 | case ISD::VECREDUCE_FMUL: |
6091 | case ISD::VECREDUCE_ADD: |
6092 | case ISD::VECREDUCE_MUL: |
6093 | case ISD::VECREDUCE_AND: |
6094 | case ISD::VECREDUCE_OR: |
6095 | case ISD::VECREDUCE_XOR: |
6096 | case ISD::VECREDUCE_SMAX: |
6097 | case ISD::VECREDUCE_SMIN: |
6098 | case ISD::VECREDUCE_UMAX: |
6099 | case ISD::VECREDUCE_UMIN: |
6100 | case ISD::VECREDUCE_FMAX: |
6101 | case ISD::VECREDUCE_FMIN: |
6102 | case ISD::VECREDUCE_FMAXIMUM: |
6103 | case ISD::VECREDUCE_FMINIMUM: |
6104 | Res = WidenVecOp_VECREDUCE(N); |
6105 | break; |
6106 | case ISD::VECREDUCE_SEQ_FADD: |
6107 | case ISD::VECREDUCE_SEQ_FMUL: |
6108 | Res = WidenVecOp_VECREDUCE_SEQ(N); |
6109 | break; |
6110 | case ISD::VP_REDUCE_FADD: |
6111 | case ISD::VP_REDUCE_SEQ_FADD: |
6112 | case ISD::VP_REDUCE_FMUL: |
6113 | case ISD::VP_REDUCE_SEQ_FMUL: |
6114 | case ISD::VP_REDUCE_ADD: |
6115 | case ISD::VP_REDUCE_MUL: |
6116 | case ISD::VP_REDUCE_AND: |
6117 | case ISD::VP_REDUCE_OR: |
6118 | case ISD::VP_REDUCE_XOR: |
6119 | case ISD::VP_REDUCE_SMAX: |
6120 | case ISD::VP_REDUCE_SMIN: |
6121 | case ISD::VP_REDUCE_UMAX: |
6122 | case ISD::VP_REDUCE_UMIN: |
6123 | case ISD::VP_REDUCE_FMAX: |
6124 | case ISD::VP_REDUCE_FMIN: |
6125 | Res = WidenVecOp_VP_REDUCE(N); |
6126 | break; |
6127 | } |
6128 | |
6129 | // If Res is null, the sub-method took care of registering the result. |
6130 | if (!Res.getNode()) return false; |
6131 | |
6132 | // If the result is N, the sub-method updated N in place. Tell the legalizer |
6133 | // core about this. |
6134 | if (Res.getNode() == N) |
6135 | return true; |
6136 | |
6137 | |
6138 | if (N->isStrictFPOpcode()) |
6139 | assert(Res.getValueType() == N->getValueType(0) && N->getNumValues() == 2 && |
6140 | "Invalid operand expansion" ); |
6141 | else |
6142 | assert(Res.getValueType() == N->getValueType(0) && N->getNumValues() == 1 && |
6143 | "Invalid operand expansion" ); |
6144 | |
6145 | ReplaceValueWith(From: SDValue(N, 0), To: Res); |
6146 | return false; |
6147 | } |
6148 | |
6149 | SDValue DAGTypeLegalizer::WidenVecOp_EXTEND(SDNode *N) { |
6150 | SDLoc DL(N); |
6151 | EVT VT = N->getValueType(ResNo: 0); |
6152 | |
6153 | SDValue InOp = N->getOperand(Num: 0); |
6154 | assert(getTypeAction(InOp.getValueType()) == |
6155 | TargetLowering::TypeWidenVector && |
6156 | "Unexpected type action" ); |
6157 | InOp = GetWidenedVector(Op: InOp); |
6158 | assert(VT.getVectorNumElements() < |
6159 | InOp.getValueType().getVectorNumElements() && |
6160 | "Input wasn't widened!" ); |
6161 | |
6162 | // We may need to further widen the operand until it has the same total |
6163 | // vector size as the result. |
6164 | EVT InVT = InOp.getValueType(); |
6165 | if (InVT.getSizeInBits() != VT.getSizeInBits()) { |
6166 | EVT InEltVT = InVT.getVectorElementType(); |
6167 | for (EVT FixedVT : MVT::vector_valuetypes()) { |
6168 | EVT FixedEltVT = FixedVT.getVectorElementType(); |
6169 | if (TLI.isTypeLegal(FixedVT) && |
6170 | FixedVT.getSizeInBits() == VT.getSizeInBits() && |
6171 | FixedEltVT == InEltVT) { |
6172 | assert(FixedVT.getVectorNumElements() >= VT.getVectorNumElements() && |
6173 | "Not enough elements in the fixed type for the operand!" ); |
6174 | assert(FixedVT.getVectorNumElements() != InVT.getVectorNumElements() && |
6175 | "We can't have the same type as we started with!" ); |
6176 | if (FixedVT.getVectorNumElements() > InVT.getVectorNumElements()) |
6177 | InOp = DAG.getNode(ISD::INSERT_SUBVECTOR, DL, FixedVT, |
6178 | DAG.getUNDEF(FixedVT), InOp, |
6179 | DAG.getVectorIdxConstant(0, DL)); |
6180 | else |
6181 | InOp = DAG.getNode(ISD::EXTRACT_SUBVECTOR, DL, FixedVT, InOp, |
6182 | DAG.getVectorIdxConstant(0, DL)); |
6183 | break; |
6184 | } |
6185 | } |
6186 | InVT = InOp.getValueType(); |
6187 | if (InVT.getSizeInBits() != VT.getSizeInBits()) |
6188 | // We couldn't find a legal vector type that was a widening of the input |
6189 | // and could be extended in-register to the result type, so we have to |
6190 | // scalarize. |
6191 | return WidenVecOp_Convert(N); |
6192 | } |
6193 | |
6194 | // Use special DAG nodes to represent the operation of extending the |
6195 | // low lanes. |
6196 | switch (N->getOpcode()) { |
6197 | default: |
6198 | llvm_unreachable("Extend legalization on extend operation!" ); |
6199 | case ISD::ANY_EXTEND: |
6200 | return DAG.getNode(Opcode: ISD::ANY_EXTEND_VECTOR_INREG, DL, VT, Operand: InOp); |
6201 | case ISD::SIGN_EXTEND: |
6202 | return DAG.getNode(Opcode: ISD::SIGN_EXTEND_VECTOR_INREG, DL, VT, Operand: InOp); |
6203 | case ISD::ZERO_EXTEND: |
6204 | return DAG.getNode(Opcode: ISD::ZERO_EXTEND_VECTOR_INREG, DL, VT, Operand: InOp); |
6205 | } |
6206 | } |
6207 | |
6208 | SDValue DAGTypeLegalizer::WidenVecOp_UnrollVectorOp(SDNode *N) { |
6209 | // The result (and first input) is legal, but the second input is illegal. |
6210 | // We can't do much to fix that, so just unroll and let the extracts off of |
6211 | // the second input be widened as needed later. |
6212 | return DAG.UnrollVectorOp(N); |
6213 | } |
6214 | |
6215 | SDValue DAGTypeLegalizer::WidenVecOp_IS_FPCLASS(SDNode *N) { |
6216 | SDLoc DL(N); |
6217 | EVT ResultVT = N->getValueType(ResNo: 0); |
6218 | SDValue Test = N->getOperand(Num: 1); |
6219 | SDValue WideArg = GetWidenedVector(Op: N->getOperand(Num: 0)); |
6220 | |
6221 | // Process this node similarly to SETCC. |
6222 | EVT WideResultVT = getSetCCResultType(VT: WideArg.getValueType()); |
6223 | if (ResultVT.getScalarType() == MVT::i1) |
6224 | WideResultVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1, |
6225 | WideResultVT.getVectorNumElements()); |
6226 | |
6227 | SDValue WideNode = DAG.getNode(Opcode: ISD::IS_FPCLASS, DL, VT: WideResultVT, |
6228 | Ops: {WideArg, Test}, Flags: N->getFlags()); |
6229 | |
6230 | // Extract the needed results from the result vector. |
6231 | EVT ResVT = |
6232 | EVT::getVectorVT(Context&: *DAG.getContext(), VT: WideResultVT.getVectorElementType(), |
6233 | NumElements: ResultVT.getVectorNumElements()); |
6234 | SDValue CC = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL, VT: ResVT, N1: WideNode, |
6235 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
6236 | |
6237 | EVT OpVT = N->getOperand(Num: 0).getValueType(); |
6238 | ISD::NodeType ExtendCode = |
6239 | TargetLowering::getExtendForContent(Content: TLI.getBooleanContents(Type: OpVT)); |
6240 | return DAG.getNode(Opcode: ExtendCode, DL, VT: ResultVT, Operand: CC); |
6241 | } |
6242 | |
6243 | SDValue DAGTypeLegalizer::WidenVecOp_Convert(SDNode *N) { |
6244 | // Since the result is legal and the input is illegal. |
6245 | EVT VT = N->getValueType(ResNo: 0); |
6246 | EVT EltVT = VT.getVectorElementType(); |
6247 | SDLoc dl(N); |
6248 | SDValue InOp = N->getOperand(Num: N->isStrictFPOpcode() ? 1 : 0); |
6249 | assert(getTypeAction(InOp.getValueType()) == |
6250 | TargetLowering::TypeWidenVector && |
6251 | "Unexpected type action" ); |
6252 | InOp = GetWidenedVector(Op: InOp); |
6253 | EVT InVT = InOp.getValueType(); |
6254 | unsigned Opcode = N->getOpcode(); |
6255 | |
6256 | // See if a widened result type would be legal, if so widen the node. |
6257 | // FIXME: This isn't safe for StrictFP. Other optimization here is needed. |
6258 | EVT WideVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: EltVT, |
6259 | EC: InVT.getVectorElementCount()); |
6260 | if (TLI.isTypeLegal(VT: WideVT) && !N->isStrictFPOpcode()) { |
6261 | SDValue Res; |
6262 | if (N->isStrictFPOpcode()) { |
6263 | if (Opcode == ISD::STRICT_FP_ROUND) |
6264 | Res = DAG.getNode(Opcode, dl, { WideVT, MVT::Other }, |
6265 | { N->getOperand(0), InOp, N->getOperand(2) }); |
6266 | else |
6267 | Res = DAG.getNode(Opcode, dl, { WideVT, MVT::Other }, |
6268 | { N->getOperand(0), InOp }); |
6269 | // Legalize the chain result - switch anything that used the old chain to |
6270 | // use the new one. |
6271 | ReplaceValueWith(From: SDValue(N, 1), To: Res.getValue(R: 1)); |
6272 | } else { |
6273 | if (Opcode == ISD::FP_ROUND) |
6274 | Res = DAG.getNode(Opcode, DL: dl, VT: WideVT, N1: InOp, N2: N->getOperand(Num: 1)); |
6275 | else |
6276 | Res = DAG.getNode(Opcode, DL: dl, VT: WideVT, Operand: InOp); |
6277 | } |
6278 | return DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT, N1: Res, |
6279 | N2: DAG.getVectorIdxConstant(Val: 0, DL: dl)); |
6280 | } |
6281 | |
6282 | EVT InEltVT = InVT.getVectorElementType(); |
6283 | |
6284 | // Unroll the convert into some scalar code and create a nasty build vector. |
6285 | unsigned NumElts = VT.getVectorNumElements(); |
6286 | SmallVector<SDValue, 16> Ops(NumElts); |
6287 | if (N->isStrictFPOpcode()) { |
6288 | SmallVector<SDValue, 4> NewOps(N->op_begin(), N->op_end()); |
6289 | SmallVector<SDValue, 32> OpChains; |
6290 | for (unsigned i=0; i < NumElts; ++i) { |
6291 | NewOps[1] = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: InEltVT, N1: InOp, |
6292 | N2: DAG.getVectorIdxConstant(Val: i, DL: dl)); |
6293 | Ops[i] = DAG.getNode(Opcode, dl, { EltVT, MVT::Other }, NewOps); |
6294 | OpChains.push_back(Elt: Ops[i].getValue(R: 1)); |
6295 | } |
6296 | SDValue NewChain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, OpChains); |
6297 | ReplaceValueWith(From: SDValue(N, 1), To: NewChain); |
6298 | } else { |
6299 | for (unsigned i = 0; i < NumElts; ++i) |
6300 | Ops[i] = DAG.getNode(Opcode, DL: dl, VT: EltVT, |
6301 | Operand: DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: InEltVT, |
6302 | N1: InOp, N2: DAG.getVectorIdxConstant(Val: i, DL: dl))); |
6303 | } |
6304 | |
6305 | return DAG.getBuildVector(VT, DL: dl, Ops); |
6306 | } |
6307 | |
6308 | SDValue DAGTypeLegalizer::WidenVecOp_FP_TO_XINT_SAT(SDNode *N) { |
6309 | EVT DstVT = N->getValueType(ResNo: 0); |
6310 | SDValue Src = GetWidenedVector(Op: N->getOperand(Num: 0)); |
6311 | EVT SrcVT = Src.getValueType(); |
6312 | ElementCount WideNumElts = SrcVT.getVectorElementCount(); |
6313 | SDLoc dl(N); |
6314 | |
6315 | // See if a widened result type would be legal, if so widen the node. |
6316 | EVT WideDstVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
6317 | VT: DstVT.getVectorElementType(), EC: WideNumElts); |
6318 | if (TLI.isTypeLegal(VT: WideDstVT)) { |
6319 | SDValue Res = |
6320 | DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: WideDstVT, N1: Src, N2: N->getOperand(Num: 1)); |
6321 | return DAG.getNode( |
6322 | Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: DstVT, N1: Res, |
6323 | N2: DAG.getConstant(Val: 0, DL: dl, VT: TLI.getVectorIdxTy(DL: DAG.getDataLayout()))); |
6324 | } |
6325 | |
6326 | // Give up and unroll. |
6327 | return DAG.UnrollVectorOp(N); |
6328 | } |
6329 | |
6330 | SDValue DAGTypeLegalizer::WidenVecOp_BITCAST(SDNode *N) { |
6331 | EVT VT = N->getValueType(ResNo: 0); |
6332 | SDValue InOp = GetWidenedVector(Op: N->getOperand(Num: 0)); |
6333 | EVT InWidenVT = InOp.getValueType(); |
6334 | SDLoc dl(N); |
6335 | |
6336 | // Check if we can convert between two legal vector types and extract. |
6337 | TypeSize InWidenSize = InWidenVT.getSizeInBits(); |
6338 | TypeSize Size = VT.getSizeInBits(); |
6339 | // x86mmx is not an acceptable vector element type, so don't try. |
6340 | if (!VT.isVector() && VT != MVT::x86mmx && |
6341 | InWidenSize.hasKnownScalarFactor(Size)) { |
6342 | unsigned NewNumElts = InWidenSize.getKnownScalarFactor(RHS: Size); |
6343 | EVT NewVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT, NumElements: NewNumElts); |
6344 | if (TLI.isTypeLegal(VT: NewVT)) { |
6345 | SDValue BitOp = DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: NewVT, Operand: InOp); |
6346 | return DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT, N1: BitOp, |
6347 | N2: DAG.getVectorIdxConstant(Val: 0, DL: dl)); |
6348 | } |
6349 | } |
6350 | |
6351 | // Handle a case like bitcast v12i8 -> v3i32. Normally that would get widened |
6352 | // to v16i8 -> v4i32, but for a target where v3i32 is legal but v12i8 is not, |
6353 | // we end up here. Handling the case here with EXTRACT_SUBVECTOR avoids |
6354 | // having to copy via memory. |
6355 | if (VT.isVector()) { |
6356 | EVT EltVT = VT.getVectorElementType(); |
6357 | unsigned EltSize = EltVT.getFixedSizeInBits(); |
6358 | if (InWidenSize.isKnownMultipleOf(RHS: EltSize)) { |
6359 | ElementCount NewNumElts = |
6360 | (InWidenVT.getVectorElementCount() * InWidenVT.getScalarSizeInBits()) |
6361 | .divideCoefficientBy(RHS: EltSize); |
6362 | EVT NewVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: EltVT, EC: NewNumElts); |
6363 | if (TLI.isTypeLegal(VT: NewVT)) { |
6364 | SDValue BitOp = DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: NewVT, Operand: InOp); |
6365 | return DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT, N1: BitOp, |
6366 | N2: DAG.getVectorIdxConstant(Val: 0, DL: dl)); |
6367 | } |
6368 | } |
6369 | } |
6370 | |
6371 | return CreateStackStoreLoad(Op: InOp, DestVT: VT); |
6372 | } |
6373 | |
6374 | SDValue DAGTypeLegalizer::WidenVecOp_CONCAT_VECTORS(SDNode *N) { |
6375 | EVT VT = N->getValueType(ResNo: 0); |
6376 | EVT EltVT = VT.getVectorElementType(); |
6377 | EVT InVT = N->getOperand(Num: 0).getValueType(); |
6378 | SDLoc dl(N); |
6379 | |
6380 | // If the widen width for this operand is the same as the width of the concat |
6381 | // and all but the first operand is undef, just use the widened operand. |
6382 | unsigned NumOperands = N->getNumOperands(); |
6383 | if (VT == TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: InVT)) { |
6384 | unsigned i; |
6385 | for (i = 1; i < NumOperands; ++i) |
6386 | if (!N->getOperand(Num: i).isUndef()) |
6387 | break; |
6388 | |
6389 | if (i == NumOperands) |
6390 | return GetWidenedVector(Op: N->getOperand(Num: 0)); |
6391 | } |
6392 | |
6393 | // Otherwise, fall back to a nasty build vector. |
6394 | unsigned NumElts = VT.getVectorNumElements(); |
6395 | SmallVector<SDValue, 16> Ops(NumElts); |
6396 | |
6397 | unsigned NumInElts = InVT.getVectorNumElements(); |
6398 | |
6399 | unsigned Idx = 0; |
6400 | for (unsigned i=0; i < NumOperands; ++i) { |
6401 | SDValue InOp = N->getOperand(Num: i); |
6402 | assert(getTypeAction(InOp.getValueType()) == |
6403 | TargetLowering::TypeWidenVector && |
6404 | "Unexpected type action" ); |
6405 | InOp = GetWidenedVector(Op: InOp); |
6406 | for (unsigned j = 0; j < NumInElts; ++j) |
6407 | Ops[Idx++] = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: EltVT, N1: InOp, |
6408 | N2: DAG.getVectorIdxConstant(Val: j, DL: dl)); |
6409 | } |
6410 | return DAG.getBuildVector(VT, DL: dl, Ops); |
6411 | } |
6412 | |
6413 | SDValue DAGTypeLegalizer::WidenVecOp_INSERT_SUBVECTOR(SDNode *N) { |
6414 | EVT VT = N->getValueType(ResNo: 0); |
6415 | SDValue SubVec = N->getOperand(Num: 1); |
6416 | SDValue InVec = N->getOperand(Num: 0); |
6417 | |
6418 | if (getTypeAction(VT: SubVec.getValueType()) == TargetLowering::TypeWidenVector) |
6419 | SubVec = GetWidenedVector(Op: SubVec); |
6420 | |
6421 | EVT SubVT = SubVec.getValueType(); |
6422 | |
6423 | // Whether or not all the elements of the widened SubVec will be inserted into |
6424 | // valid indices of VT. |
6425 | bool IndicesValid = false; |
6426 | // If we statically know that VT can fit SubVT, the indices are valid. |
6427 | if (VT.knownBitsGE(VT: SubVT)) |
6428 | IndicesValid = true; |
6429 | else if (VT.isScalableVector() && SubVT.isFixedLengthVector()) { |
6430 | // Otherwise, if we're inserting a fixed vector into a scalable vector and |
6431 | // we know the minimum vscale we can work out if it's valid ourselves. |
6432 | Attribute Attr = DAG.getMachineFunction().getFunction().getFnAttribute( |
6433 | Attribute::VScaleRange); |
6434 | if (Attr.isValid()) { |
6435 | unsigned VScaleMin = Attr.getVScaleRangeMin(); |
6436 | if (VT.getSizeInBits().getKnownMinValue() * VScaleMin >= |
6437 | SubVT.getFixedSizeInBits()) |
6438 | IndicesValid = true; |
6439 | } |
6440 | } |
6441 | |
6442 | // We need to make sure that the indices are still valid, otherwise we might |
6443 | // widen what was previously well-defined to something undefined. |
6444 | if (IndicesValid && InVec.isUndef() && N->getConstantOperandVal(Num: 2) == 0) |
6445 | return DAG.getNode(Opcode: ISD::INSERT_SUBVECTOR, DL: SDLoc(N), VT, N1: InVec, N2: SubVec, |
6446 | N3: N->getOperand(Num: 2)); |
6447 | |
6448 | report_fatal_error(reason: "Don't know how to widen the operands for " |
6449 | "INSERT_SUBVECTOR" ); |
6450 | } |
6451 | |
6452 | SDValue DAGTypeLegalizer::(SDNode *N) { |
6453 | SDValue InOp = GetWidenedVector(Op: N->getOperand(Num: 0)); |
6454 | return DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: SDLoc(N), |
6455 | VT: N->getValueType(ResNo: 0), N1: InOp, N2: N->getOperand(Num: 1)); |
6456 | } |
6457 | |
6458 | SDValue DAGTypeLegalizer::(SDNode *N) { |
6459 | SDValue InOp = GetWidenedVector(Op: N->getOperand(Num: 0)); |
6460 | return DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: SDLoc(N), |
6461 | VT: N->getValueType(ResNo: 0), N1: InOp, N2: N->getOperand(Num: 1)); |
6462 | } |
6463 | |
6464 | SDValue DAGTypeLegalizer::WidenVecOp_EXTEND_VECTOR_INREG(SDNode *N) { |
6465 | SDValue InOp = GetWidenedVector(Op: N->getOperand(Num: 0)); |
6466 | return DAG.getNode(Opcode: N->getOpcode(), DL: SDLoc(N), VT: N->getValueType(ResNo: 0), Operand: InOp); |
6467 | } |
6468 | |
6469 | SDValue DAGTypeLegalizer::WidenVecOp_STORE(SDNode *N) { |
6470 | // We have to widen the value, but we want only to store the original |
6471 | // vector type. |
6472 | StoreSDNode *ST = cast<StoreSDNode>(Val: N); |
6473 | |
6474 | if (!ST->getMemoryVT().getScalarType().isByteSized()) |
6475 | return TLI.scalarizeVectorStore(ST, DAG); |
6476 | |
6477 | if (ST->isTruncatingStore()) |
6478 | return TLI.scalarizeVectorStore(ST, DAG); |
6479 | |
6480 | // Generate a vector-predicated store if it is custom/legal on the target. |
6481 | // To avoid possible recursion, only do this if the widened mask type is |
6482 | // legal. |
6483 | // FIXME: Not all targets may support EVL in VP_STORE. These will have been |
6484 | // removed from the IR by the ExpandVectorPredication pass but we're |
6485 | // reintroducing them here. |
6486 | SDValue StVal = ST->getValue(); |
6487 | EVT StVT = StVal.getValueType(); |
6488 | EVT WideVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: StVT); |
6489 | EVT WideMaskVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1, |
6490 | WideVT.getVectorElementCount()); |
6491 | |
6492 | if (TLI.isOperationLegalOrCustom(Op: ISD::VP_STORE, VT: WideVT) && |
6493 | TLI.isTypeLegal(VT: WideMaskVT)) { |
6494 | // Widen the value. |
6495 | SDLoc DL(N); |
6496 | StVal = GetWidenedVector(Op: StVal); |
6497 | SDValue Mask = DAG.getAllOnesConstant(DL, VT: WideMaskVT); |
6498 | SDValue EVL = DAG.getElementCount(DL, VT: TLI.getVPExplicitVectorLengthTy(), |
6499 | EC: StVT.getVectorElementCount()); |
6500 | return DAG.getStoreVP(Chain: ST->getChain(), dl: DL, Val: StVal, Ptr: ST->getBasePtr(), |
6501 | Offset: DAG.getUNDEF(VT: ST->getBasePtr().getValueType()), Mask, |
6502 | EVL, MemVT: StVT, MMO: ST->getMemOperand(), |
6503 | AM: ST->getAddressingMode()); |
6504 | } |
6505 | |
6506 | SmallVector<SDValue, 16> StChain; |
6507 | if (GenWidenVectorStores(StChain, ST)) { |
6508 | if (StChain.size() == 1) |
6509 | return StChain[0]; |
6510 | |
6511 | return DAG.getNode(ISD::TokenFactor, SDLoc(ST), MVT::Other, StChain); |
6512 | } |
6513 | |
6514 | report_fatal_error(reason: "Unable to widen vector store" ); |
6515 | } |
6516 | |
6517 | SDValue DAGTypeLegalizer::WidenVecOp_VP_STORE(SDNode *N, unsigned OpNo) { |
6518 | assert((OpNo == 1 || OpNo == 3) && |
6519 | "Can widen only data or mask operand of vp_store" ); |
6520 | VPStoreSDNode *ST = cast<VPStoreSDNode>(Val: N); |
6521 | SDValue Mask = ST->getMask(); |
6522 | SDValue StVal = ST->getValue(); |
6523 | SDLoc dl(N); |
6524 | |
6525 | if (OpNo == 1) { |
6526 | // Widen the value. |
6527 | StVal = GetWidenedVector(Op: StVal); |
6528 | |
6529 | // We only handle the case where the mask needs widening to an |
6530 | // identically-sized type as the vector inputs. |
6531 | assert(getTypeAction(Mask.getValueType()) == |
6532 | TargetLowering::TypeWidenVector && |
6533 | "Unable to widen VP store" ); |
6534 | Mask = GetWidenedVector(Op: Mask); |
6535 | } else { |
6536 | Mask = GetWidenedVector(Op: Mask); |
6537 | |
6538 | // We only handle the case where the stored value needs widening to an |
6539 | // identically-sized type as the mask. |
6540 | assert(getTypeAction(StVal.getValueType()) == |
6541 | TargetLowering::TypeWidenVector && |
6542 | "Unable to widen VP store" ); |
6543 | StVal = GetWidenedVector(Op: StVal); |
6544 | } |
6545 | |
6546 | assert(Mask.getValueType().getVectorElementCount() == |
6547 | StVal.getValueType().getVectorElementCount() && |
6548 | "Mask and data vectors should have the same number of elements" ); |
6549 | return DAG.getStoreVP(Chain: ST->getChain(), dl, Val: StVal, Ptr: ST->getBasePtr(), |
6550 | Offset: ST->getOffset(), Mask, EVL: ST->getVectorLength(), |
6551 | MemVT: ST->getMemoryVT(), MMO: ST->getMemOperand(), |
6552 | AM: ST->getAddressingMode(), IsTruncating: ST->isTruncatingStore(), |
6553 | IsCompressing: ST->isCompressingStore()); |
6554 | } |
6555 | |
6556 | SDValue DAGTypeLegalizer::WidenVecOp_VP_STRIDED_STORE(SDNode *N, |
6557 | unsigned OpNo) { |
6558 | assert((OpNo == 1 || OpNo == 4) && |
6559 | "Can widen only data or mask operand of vp_strided_store" ); |
6560 | VPStridedStoreSDNode *SST = cast<VPStridedStoreSDNode>(Val: N); |
6561 | SDValue Mask = SST->getMask(); |
6562 | SDValue StVal = SST->getValue(); |
6563 | SDLoc DL(N); |
6564 | |
6565 | if (OpNo == 1) |
6566 | assert(getTypeAction(Mask.getValueType()) == |
6567 | TargetLowering::TypeWidenVector && |
6568 | "Unable to widen VP strided store" ); |
6569 | else |
6570 | assert(getTypeAction(StVal.getValueType()) == |
6571 | TargetLowering::TypeWidenVector && |
6572 | "Unable to widen VP strided store" ); |
6573 | |
6574 | StVal = GetWidenedVector(Op: StVal); |
6575 | Mask = GetWidenedVector(Op: Mask); |
6576 | |
6577 | assert(StVal.getValueType().getVectorElementCount() == |
6578 | Mask.getValueType().getVectorElementCount() && |
6579 | "Data and mask vectors should have the same number of elements" ); |
6580 | |
6581 | return DAG.getStridedStoreVP( |
6582 | Chain: SST->getChain(), DL, Val: StVal, Ptr: SST->getBasePtr(), Offset: SST->getOffset(), |
6583 | Stride: SST->getStride(), Mask, EVL: SST->getVectorLength(), MemVT: SST->getMemoryVT(), |
6584 | MMO: SST->getMemOperand(), AM: SST->getAddressingMode(), IsTruncating: SST->isTruncatingStore(), |
6585 | IsCompressing: SST->isCompressingStore()); |
6586 | } |
6587 | |
6588 | SDValue DAGTypeLegalizer::WidenVecOp_MSTORE(SDNode *N, unsigned OpNo) { |
6589 | assert((OpNo == 1 || OpNo == 4) && |
6590 | "Can widen only data or mask operand of mstore" ); |
6591 | MaskedStoreSDNode *MST = cast<MaskedStoreSDNode>(Val: N); |
6592 | SDValue Mask = MST->getMask(); |
6593 | EVT MaskVT = Mask.getValueType(); |
6594 | SDValue StVal = MST->getValue(); |
6595 | SDLoc dl(N); |
6596 | |
6597 | if (OpNo == 1) { |
6598 | // Widen the value. |
6599 | StVal = GetWidenedVector(Op: StVal); |
6600 | |
6601 | // The mask should be widened as well. |
6602 | EVT WideVT = StVal.getValueType(); |
6603 | EVT WideMaskVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
6604 | VT: MaskVT.getVectorElementType(), |
6605 | NumElements: WideVT.getVectorNumElements()); |
6606 | Mask = ModifyToType(InOp: Mask, NVT: WideMaskVT, FillWithZeroes: true); |
6607 | } else { |
6608 | // Widen the mask. |
6609 | EVT WideMaskVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(), VT: MaskVT); |
6610 | Mask = ModifyToType(InOp: Mask, NVT: WideMaskVT, FillWithZeroes: true); |
6611 | |
6612 | EVT ValueVT = StVal.getValueType(); |
6613 | EVT WideVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
6614 | VT: ValueVT.getVectorElementType(), |
6615 | NumElements: WideMaskVT.getVectorNumElements()); |
6616 | StVal = ModifyToType(InOp: StVal, NVT: WideVT); |
6617 | } |
6618 | |
6619 | assert(Mask.getValueType().getVectorNumElements() == |
6620 | StVal.getValueType().getVectorNumElements() && |
6621 | "Mask and data vectors should have the same number of elements" ); |
6622 | return DAG.getMaskedStore(Chain: MST->getChain(), dl, Val: StVal, Base: MST->getBasePtr(), |
6623 | Offset: MST->getOffset(), Mask, MemVT: MST->getMemoryVT(), |
6624 | MMO: MST->getMemOperand(), AM: MST->getAddressingMode(), |
6625 | IsTruncating: false, IsCompressing: MST->isCompressingStore()); |
6626 | } |
6627 | |
6628 | SDValue DAGTypeLegalizer::WidenVecOp_MGATHER(SDNode *N, unsigned OpNo) { |
6629 | assert(OpNo == 4 && "Can widen only the index of mgather" ); |
6630 | auto *MG = cast<MaskedGatherSDNode>(Val: N); |
6631 | SDValue DataOp = MG->getPassThru(); |
6632 | SDValue Mask = MG->getMask(); |
6633 | SDValue Scale = MG->getScale(); |
6634 | |
6635 | // Just widen the index. It's allowed to have extra elements. |
6636 | SDValue Index = GetWidenedVector(Op: MG->getIndex()); |
6637 | |
6638 | SDLoc dl(N); |
6639 | SDValue Ops[] = {MG->getChain(), DataOp, Mask, MG->getBasePtr(), Index, |
6640 | Scale}; |
6641 | SDValue Res = DAG.getMaskedGather(VTs: MG->getVTList(), MemVT: MG->getMemoryVT(), dl, Ops, |
6642 | MMO: MG->getMemOperand(), IndexType: MG->getIndexType(), |
6643 | ExtTy: MG->getExtensionType()); |
6644 | ReplaceValueWith(From: SDValue(N, 1), To: Res.getValue(R: 1)); |
6645 | ReplaceValueWith(From: SDValue(N, 0), To: Res.getValue(R: 0)); |
6646 | return SDValue(); |
6647 | } |
6648 | |
6649 | SDValue DAGTypeLegalizer::WidenVecOp_MSCATTER(SDNode *N, unsigned OpNo) { |
6650 | MaskedScatterSDNode *MSC = cast<MaskedScatterSDNode>(Val: N); |
6651 | SDValue DataOp = MSC->getValue(); |
6652 | SDValue Mask = MSC->getMask(); |
6653 | SDValue Index = MSC->getIndex(); |
6654 | SDValue Scale = MSC->getScale(); |
6655 | EVT WideMemVT = MSC->getMemoryVT(); |
6656 | |
6657 | if (OpNo == 1) { |
6658 | DataOp = GetWidenedVector(Op: DataOp); |
6659 | unsigned NumElts = DataOp.getValueType().getVectorNumElements(); |
6660 | |
6661 | // Widen index. |
6662 | EVT IndexVT = Index.getValueType(); |
6663 | EVT WideIndexVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
6664 | VT: IndexVT.getVectorElementType(), NumElements: NumElts); |
6665 | Index = ModifyToType(InOp: Index, NVT: WideIndexVT); |
6666 | |
6667 | // The mask should be widened as well. |
6668 | EVT MaskVT = Mask.getValueType(); |
6669 | EVT WideMaskVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
6670 | VT: MaskVT.getVectorElementType(), NumElements: NumElts); |
6671 | Mask = ModifyToType(InOp: Mask, NVT: WideMaskVT, FillWithZeroes: true); |
6672 | |
6673 | // Widen the MemoryType |
6674 | WideMemVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
6675 | VT: MSC->getMemoryVT().getScalarType(), NumElements: NumElts); |
6676 | } else if (OpNo == 4) { |
6677 | // Just widen the index. It's allowed to have extra elements. |
6678 | Index = GetWidenedVector(Op: Index); |
6679 | } else |
6680 | llvm_unreachable("Can't widen this operand of mscatter" ); |
6681 | |
6682 | SDValue Ops[] = {MSC->getChain(), DataOp, Mask, MSC->getBasePtr(), Index, |
6683 | Scale}; |
6684 | return DAG.getMaskedScatter(DAG.getVTList(MVT::Other), WideMemVT, SDLoc(N), |
6685 | Ops, MSC->getMemOperand(), MSC->getIndexType(), |
6686 | MSC->isTruncatingStore()); |
6687 | } |
6688 | |
6689 | SDValue DAGTypeLegalizer::WidenVecOp_VP_SCATTER(SDNode *N, unsigned OpNo) { |
6690 | VPScatterSDNode *VPSC = cast<VPScatterSDNode>(Val: N); |
6691 | SDValue DataOp = VPSC->getValue(); |
6692 | SDValue Mask = VPSC->getMask(); |
6693 | SDValue Index = VPSC->getIndex(); |
6694 | SDValue Scale = VPSC->getScale(); |
6695 | EVT WideMemVT = VPSC->getMemoryVT(); |
6696 | |
6697 | if (OpNo == 1) { |
6698 | DataOp = GetWidenedVector(Op: DataOp); |
6699 | Index = GetWidenedVector(Op: Index); |
6700 | const auto WideEC = DataOp.getValueType().getVectorElementCount(); |
6701 | Mask = GetWidenedMask(Mask, EC: WideEC); |
6702 | WideMemVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
6703 | VT: VPSC->getMemoryVT().getScalarType(), EC: WideEC); |
6704 | } else if (OpNo == 3) { |
6705 | // Just widen the index. It's allowed to have extra elements. |
6706 | Index = GetWidenedVector(Op: Index); |
6707 | } else |
6708 | llvm_unreachable("Can't widen this operand of VP_SCATTER" ); |
6709 | |
6710 | SDValue Ops[] = { |
6711 | VPSC->getChain(), DataOp, VPSC->getBasePtr(), Index, Scale, Mask, |
6712 | VPSC->getVectorLength()}; |
6713 | return DAG.getScatterVP(DAG.getVTList(MVT::Other), WideMemVT, SDLoc(N), Ops, |
6714 | VPSC->getMemOperand(), VPSC->getIndexType()); |
6715 | } |
6716 | |
6717 | SDValue DAGTypeLegalizer::WidenVecOp_SETCC(SDNode *N) { |
6718 | SDValue InOp0 = GetWidenedVector(Op: N->getOperand(Num: 0)); |
6719 | SDValue InOp1 = GetWidenedVector(Op: N->getOperand(Num: 1)); |
6720 | SDLoc dl(N); |
6721 | EVT VT = N->getValueType(ResNo: 0); |
6722 | |
6723 | // WARNING: In this code we widen the compare instruction with garbage. |
6724 | // This garbage may contain denormal floats which may be slow. Is this a real |
6725 | // concern ? Should we zero the unused lanes if this is a float compare ? |
6726 | |
6727 | // Get a new SETCC node to compare the newly widened operands. |
6728 | // Only some of the compared elements are legal. |
6729 | EVT SVT = getSetCCResultType(VT: InOp0.getValueType()); |
6730 | // The result type is legal, if its vXi1, keep vXi1 for the new SETCC. |
6731 | if (VT.getScalarType() == MVT::i1) |
6732 | SVT = EVT::getVectorVT(*DAG.getContext(), MVT::i1, |
6733 | SVT.getVectorElementCount()); |
6734 | |
6735 | SDValue WideSETCC = DAG.getNode(Opcode: ISD::SETCC, DL: SDLoc(N), |
6736 | VT: SVT, N1: InOp0, N2: InOp1, N3: N->getOperand(Num: 2)); |
6737 | |
6738 | // Extract the needed results from the result vector. |
6739 | EVT ResVT = EVT::getVectorVT(Context&: *DAG.getContext(), |
6740 | VT: SVT.getVectorElementType(), |
6741 | EC: VT.getVectorElementCount()); |
6742 | SDValue CC = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: ResVT, N1: WideSETCC, |
6743 | N2: DAG.getVectorIdxConstant(Val: 0, DL: dl)); |
6744 | |
6745 | EVT OpVT = N->getOperand(Num: 0).getValueType(); |
6746 | ISD::NodeType ExtendCode = |
6747 | TargetLowering::getExtendForContent(Content: TLI.getBooleanContents(Type: OpVT)); |
6748 | return DAG.getNode(Opcode: ExtendCode, DL: dl, VT, Operand: CC); |
6749 | } |
6750 | |
6751 | SDValue DAGTypeLegalizer::WidenVecOp_STRICT_FSETCC(SDNode *N) { |
6752 | SDValue Chain = N->getOperand(Num: 0); |
6753 | SDValue LHS = GetWidenedVector(Op: N->getOperand(Num: 1)); |
6754 | SDValue RHS = GetWidenedVector(Op: N->getOperand(Num: 2)); |
6755 | SDValue CC = N->getOperand(Num: 3); |
6756 | SDLoc dl(N); |
6757 | |
6758 | EVT VT = N->getValueType(ResNo: 0); |
6759 | EVT EltVT = VT.getVectorElementType(); |
6760 | EVT TmpEltVT = LHS.getValueType().getVectorElementType(); |
6761 | unsigned NumElts = VT.getVectorNumElements(); |
6762 | |
6763 | // Unroll into a build vector. |
6764 | SmallVector<SDValue, 8> Scalars(NumElts); |
6765 | SmallVector<SDValue, 8> Chains(NumElts); |
6766 | |
6767 | for (unsigned i = 0; i != NumElts; ++i) { |
6768 | SDValue LHSElem = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: TmpEltVT, N1: LHS, |
6769 | N2: DAG.getVectorIdxConstant(Val: i, DL: dl)); |
6770 | SDValue RHSElem = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: TmpEltVT, N1: RHS, |
6771 | N2: DAG.getVectorIdxConstant(Val: i, DL: dl)); |
6772 | |
6773 | Scalars[i] = DAG.getNode(N->getOpcode(), dl, {MVT::i1, MVT::Other}, |
6774 | {Chain, LHSElem, RHSElem, CC}); |
6775 | Chains[i] = Scalars[i].getValue(R: 1); |
6776 | Scalars[i] = DAG.getSelect(DL: dl, VT: EltVT, Cond: Scalars[i], |
6777 | LHS: DAG.getBoolConstant(V: true, DL: dl, VT: EltVT, OpVT: VT), |
6778 | RHS: DAG.getBoolConstant(V: false, DL: dl, VT: EltVT, OpVT: VT)); |
6779 | } |
6780 | |
6781 | SDValue NewChain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Chains); |
6782 | ReplaceValueWith(From: SDValue(N, 1), To: NewChain); |
6783 | |
6784 | return DAG.getBuildVector(VT, DL: dl, Ops: Scalars); |
6785 | } |
6786 | |
6787 | SDValue DAGTypeLegalizer::WidenVecOp_VECREDUCE(SDNode *N) { |
6788 | SDLoc dl(N); |
6789 | SDValue Op = GetWidenedVector(Op: N->getOperand(Num: 0)); |
6790 | EVT OrigVT = N->getOperand(Num: 0).getValueType(); |
6791 | EVT WideVT = Op.getValueType(); |
6792 | EVT ElemVT = OrigVT.getVectorElementType(); |
6793 | SDNodeFlags Flags = N->getFlags(); |
6794 | |
6795 | unsigned Opc = N->getOpcode(); |
6796 | unsigned BaseOpc = ISD::getVecReduceBaseOpcode(VecReduceOpcode: Opc); |
6797 | SDValue NeutralElem = DAG.getNeutralElement(Opcode: BaseOpc, DL: dl, VT: ElemVT, Flags); |
6798 | assert(NeutralElem && "Neutral element must exist" ); |
6799 | |
6800 | // Pad the vector with the neutral element. |
6801 | unsigned OrigElts = OrigVT.getVectorMinNumElements(); |
6802 | unsigned WideElts = WideVT.getVectorMinNumElements(); |
6803 | |
6804 | if (WideVT.isScalableVector()) { |
6805 | unsigned GCD = std::gcd(m: OrigElts, n: WideElts); |
6806 | EVT SplatVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: ElemVT, |
6807 | EC: ElementCount::getScalable(MinVal: GCD)); |
6808 | SDValue SplatNeutral = DAG.getSplatVector(VT: SplatVT, DL: dl, Op: NeutralElem); |
6809 | for (unsigned Idx = OrigElts; Idx < WideElts; Idx = Idx + GCD) |
6810 | Op = DAG.getNode(Opcode: ISD::INSERT_SUBVECTOR, DL: dl, VT: WideVT, N1: Op, N2: SplatNeutral, |
6811 | N3: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
6812 | return DAG.getNode(Opcode: Opc, DL: dl, VT: N->getValueType(ResNo: 0), Operand: Op, Flags); |
6813 | } |
6814 | |
6815 | for (unsigned Idx = OrigElts; Idx < WideElts; Idx++) |
6816 | Op = DAG.getNode(Opcode: ISD::INSERT_VECTOR_ELT, DL: dl, VT: WideVT, N1: Op, N2: NeutralElem, |
6817 | N3: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
6818 | |
6819 | return DAG.getNode(Opcode: Opc, DL: dl, VT: N->getValueType(ResNo: 0), Operand: Op, Flags); |
6820 | } |
6821 | |
6822 | SDValue DAGTypeLegalizer::WidenVecOp_VECREDUCE_SEQ(SDNode *N) { |
6823 | SDLoc dl(N); |
6824 | SDValue AccOp = N->getOperand(Num: 0); |
6825 | SDValue VecOp = N->getOperand(Num: 1); |
6826 | SDValue Op = GetWidenedVector(Op: VecOp); |
6827 | |
6828 | EVT OrigVT = VecOp.getValueType(); |
6829 | EVT WideVT = Op.getValueType(); |
6830 | EVT ElemVT = OrigVT.getVectorElementType(); |
6831 | SDNodeFlags Flags = N->getFlags(); |
6832 | |
6833 | unsigned Opc = N->getOpcode(); |
6834 | unsigned BaseOpc = ISD::getVecReduceBaseOpcode(VecReduceOpcode: Opc); |
6835 | SDValue NeutralElem = DAG.getNeutralElement(Opcode: BaseOpc, DL: dl, VT: ElemVT, Flags); |
6836 | |
6837 | // Pad the vector with the neutral element. |
6838 | unsigned OrigElts = OrigVT.getVectorMinNumElements(); |
6839 | unsigned WideElts = WideVT.getVectorMinNumElements(); |
6840 | |
6841 | if (WideVT.isScalableVector()) { |
6842 | unsigned GCD = std::gcd(m: OrigElts, n: WideElts); |
6843 | EVT SplatVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: ElemVT, |
6844 | EC: ElementCount::getScalable(MinVal: GCD)); |
6845 | SDValue SplatNeutral = DAG.getSplatVector(VT: SplatVT, DL: dl, Op: NeutralElem); |
6846 | for (unsigned Idx = OrigElts; Idx < WideElts; Idx = Idx + GCD) |
6847 | Op = DAG.getNode(Opcode: ISD::INSERT_SUBVECTOR, DL: dl, VT: WideVT, N1: Op, N2: SplatNeutral, |
6848 | N3: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
6849 | return DAG.getNode(Opcode: Opc, DL: dl, VT: N->getValueType(ResNo: 0), N1: AccOp, N2: Op, Flags); |
6850 | } |
6851 | |
6852 | for (unsigned Idx = OrigElts; Idx < WideElts; Idx++) |
6853 | Op = DAG.getNode(Opcode: ISD::INSERT_VECTOR_ELT, DL: dl, VT: WideVT, N1: Op, N2: NeutralElem, |
6854 | N3: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
6855 | |
6856 | return DAG.getNode(Opcode: Opc, DL: dl, VT: N->getValueType(ResNo: 0), N1: AccOp, N2: Op, Flags); |
6857 | } |
6858 | |
6859 | SDValue DAGTypeLegalizer::WidenVecOp_VP_REDUCE(SDNode *N) { |
6860 | assert(N->isVPOpcode() && "Expected VP opcode" ); |
6861 | |
6862 | SDLoc dl(N); |
6863 | SDValue Op = GetWidenedVector(Op: N->getOperand(Num: 1)); |
6864 | SDValue Mask = GetWidenedMask(Mask: N->getOperand(Num: 2), |
6865 | EC: Op.getValueType().getVectorElementCount()); |
6866 | |
6867 | return DAG.getNode(Opcode: N->getOpcode(), DL: dl, VT: N->getValueType(ResNo: 0), |
6868 | Ops: {N->getOperand(Num: 0), Op, Mask, N->getOperand(Num: 3)}, |
6869 | Flags: N->getFlags()); |
6870 | } |
6871 | |
6872 | SDValue DAGTypeLegalizer::WidenVecOp_VSELECT(SDNode *N) { |
6873 | // This only gets called in the case that the left and right inputs and |
6874 | // result are of a legal odd vector type, and the condition is illegal i1 of |
6875 | // the same odd width that needs widening. |
6876 | EVT VT = N->getValueType(ResNo: 0); |
6877 | assert(VT.isVector() && !VT.isPow2VectorType() && isTypeLegal(VT)); |
6878 | |
6879 | SDValue Cond = GetWidenedVector(Op: N->getOperand(Num: 0)); |
6880 | SDValue LeftIn = DAG.WidenVector(N: N->getOperand(Num: 1), DL: SDLoc(N)); |
6881 | SDValue RightIn = DAG.WidenVector(N: N->getOperand(Num: 2), DL: SDLoc(N)); |
6882 | SDLoc DL(N); |
6883 | |
6884 | SDValue Select = DAG.getNode(Opcode: N->getOpcode(), DL, VT: LeftIn.getValueType(), N1: Cond, |
6885 | N2: LeftIn, N3: RightIn); |
6886 | return DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL, VT, N1: Select, |
6887 | N2: DAG.getVectorIdxConstant(Val: 0, DL)); |
6888 | } |
6889 | |
6890 | //===----------------------------------------------------------------------===// |
6891 | // Vector Widening Utilities |
6892 | //===----------------------------------------------------------------------===// |
6893 | |
6894 | // Utility function to find the type to chop up a widen vector for load/store |
6895 | // TLI: Target lowering used to determine legal types. |
6896 | // Width: Width left need to load/store. |
6897 | // WidenVT: The widen vector type to load to/store from |
6898 | // Align: If 0, don't allow use of a wider type |
6899 | // WidenEx: If Align is not 0, the amount additional we can load/store from. |
6900 | |
6901 | static std::optional<EVT> findMemType(SelectionDAG &DAG, |
6902 | const TargetLowering &TLI, unsigned Width, |
6903 | EVT WidenVT, unsigned Align = 0, |
6904 | unsigned WidenEx = 0) { |
6905 | EVT WidenEltVT = WidenVT.getVectorElementType(); |
6906 | const bool Scalable = WidenVT.isScalableVector(); |
6907 | unsigned WidenWidth = WidenVT.getSizeInBits().getKnownMinValue(); |
6908 | unsigned WidenEltWidth = WidenEltVT.getSizeInBits(); |
6909 | unsigned AlignInBits = Align*8; |
6910 | |
6911 | // If we have one element to load/store, return it. |
6912 | EVT RetVT = WidenEltVT; |
6913 | if (!Scalable && Width == WidenEltWidth) |
6914 | return RetVT; |
6915 | |
6916 | // Don't bother looking for an integer type if the vector is scalable, skip |
6917 | // to vector types. |
6918 | if (!Scalable) { |
6919 | // See if there is larger legal integer than the element type to load/store. |
6920 | for (EVT MemVT : reverse(MVT::integer_valuetypes())) { |
6921 | unsigned MemVTWidth = MemVT.getSizeInBits(); |
6922 | if (MemVT.getSizeInBits() <= WidenEltWidth) |
6923 | break; |
6924 | auto Action = TLI.getTypeAction(*DAG.getContext(), MemVT); |
6925 | if ((Action == TargetLowering::TypeLegal || |
6926 | Action == TargetLowering::TypePromoteInteger) && |
6927 | (WidenWidth % MemVTWidth) == 0 && |
6928 | isPowerOf2_32(WidenWidth / MemVTWidth) && |
6929 | (MemVTWidth <= Width || |
6930 | (Align!=0 && MemVTWidth<=AlignInBits && MemVTWidth<=Width+WidenEx))) { |
6931 | if (MemVTWidth == WidenWidth) |
6932 | return MemVT; |
6933 | RetVT = MemVT; |
6934 | break; |
6935 | } |
6936 | } |
6937 | } |
6938 | |
6939 | // See if there is a larger vector type to load/store that has the same vector |
6940 | // element type and is evenly divisible with the WidenVT. |
6941 | for (EVT MemVT : reverse(MVT::vector_valuetypes())) { |
6942 | // Skip vector MVTs which don't match the scalable property of WidenVT. |
6943 | if (Scalable != MemVT.isScalableVector()) |
6944 | continue; |
6945 | unsigned MemVTWidth = MemVT.getSizeInBits().getKnownMinValue(); |
6946 | auto Action = TLI.getTypeAction(*DAG.getContext(), MemVT); |
6947 | if ((Action == TargetLowering::TypeLegal || |
6948 | Action == TargetLowering::TypePromoteInteger) && |
6949 | WidenEltVT == MemVT.getVectorElementType() && |
6950 | (WidenWidth % MemVTWidth) == 0 && |
6951 | isPowerOf2_32(WidenWidth / MemVTWidth) && |
6952 | (MemVTWidth <= Width || |
6953 | (Align!=0 && MemVTWidth<=AlignInBits && MemVTWidth<=Width+WidenEx))) { |
6954 | if (RetVT.getFixedSizeInBits() < MemVTWidth || MemVT == WidenVT) |
6955 | return MemVT; |
6956 | } |
6957 | } |
6958 | |
6959 | // Using element-wise loads and stores for widening operations is not |
6960 | // supported for scalable vectors |
6961 | if (Scalable) |
6962 | return std::nullopt; |
6963 | |
6964 | return RetVT; |
6965 | } |
6966 | |
6967 | // Builds a vector type from scalar loads |
6968 | // VecTy: Resulting Vector type |
6969 | // LDOps: Load operators to build a vector type |
6970 | // [Start,End) the list of loads to use. |
6971 | static SDValue BuildVectorFromScalar(SelectionDAG& DAG, EVT VecTy, |
6972 | SmallVectorImpl<SDValue> &LdOps, |
6973 | unsigned Start, unsigned End) { |
6974 | SDLoc dl(LdOps[Start]); |
6975 | EVT LdTy = LdOps[Start].getValueType(); |
6976 | unsigned Width = VecTy.getSizeInBits(); |
6977 | unsigned NumElts = Width / LdTy.getSizeInBits(); |
6978 | EVT NewVecVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: LdTy, NumElements: NumElts); |
6979 | |
6980 | unsigned Idx = 1; |
6981 | SDValue VecOp = DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL: dl, VT: NewVecVT,Operand: LdOps[Start]); |
6982 | |
6983 | for (unsigned i = Start + 1; i != End; ++i) { |
6984 | EVT NewLdTy = LdOps[i].getValueType(); |
6985 | if (NewLdTy != LdTy) { |
6986 | NumElts = Width / NewLdTy.getSizeInBits(); |
6987 | NewVecVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: NewLdTy, NumElements: NumElts); |
6988 | VecOp = DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: NewVecVT, Operand: VecOp); |
6989 | // Readjust position and vector position based on new load type. |
6990 | Idx = Idx * LdTy.getSizeInBits() / NewLdTy.getSizeInBits(); |
6991 | LdTy = NewLdTy; |
6992 | } |
6993 | VecOp = DAG.getNode(Opcode: ISD::INSERT_VECTOR_ELT, DL: dl, VT: NewVecVT, N1: VecOp, N2: LdOps[i], |
6994 | N3: DAG.getVectorIdxConstant(Val: Idx++, DL: dl)); |
6995 | } |
6996 | return DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: VecTy, Operand: VecOp); |
6997 | } |
6998 | |
6999 | SDValue DAGTypeLegalizer::GenWidenVectorLoads(SmallVectorImpl<SDValue> &LdChain, |
7000 | LoadSDNode *LD) { |
7001 | // The strategy assumes that we can efficiently load power-of-two widths. |
7002 | // The routine chops the vector into the largest vector loads with the same |
7003 | // element type or scalar loads and then recombines it to the widen vector |
7004 | // type. |
7005 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(),VT: LD->getValueType(ResNo: 0)); |
7006 | EVT LdVT = LD->getMemoryVT(); |
7007 | SDLoc dl(LD); |
7008 | assert(LdVT.isVector() && WidenVT.isVector()); |
7009 | assert(LdVT.isScalableVector() == WidenVT.isScalableVector()); |
7010 | assert(LdVT.getVectorElementType() == WidenVT.getVectorElementType()); |
7011 | |
7012 | // Load information |
7013 | SDValue Chain = LD->getChain(); |
7014 | SDValue BasePtr = LD->getBasePtr(); |
7015 | MachineMemOperand::Flags MMOFlags = LD->getMemOperand()->getFlags(); |
7016 | AAMDNodes AAInfo = LD->getAAInfo(); |
7017 | |
7018 | TypeSize LdWidth = LdVT.getSizeInBits(); |
7019 | TypeSize WidenWidth = WidenVT.getSizeInBits(); |
7020 | TypeSize WidthDiff = WidenWidth - LdWidth; |
7021 | // Allow wider loads if they are sufficiently aligned to avoid memory faults |
7022 | // and if the original load is simple. |
7023 | unsigned LdAlign = |
7024 | (!LD->isSimple() || LdVT.isScalableVector()) ? 0 : LD->getAlign().value(); |
7025 | |
7026 | // Find the vector type that can load from. |
7027 | std::optional<EVT> FirstVT = |
7028 | findMemType(DAG, TLI, Width: LdWidth.getKnownMinValue(), WidenVT, Align: LdAlign, |
7029 | WidenEx: WidthDiff.getKnownMinValue()); |
7030 | |
7031 | if (!FirstVT) |
7032 | return SDValue(); |
7033 | |
7034 | SmallVector<EVT, 8> MemVTs; |
7035 | TypeSize FirstVTWidth = FirstVT->getSizeInBits(); |
7036 | |
7037 | // Unless we're able to load in one instruction we must work out how to load |
7038 | // the remainder. |
7039 | if (!TypeSize::isKnownLE(LHS: LdWidth, RHS: FirstVTWidth)) { |
7040 | std::optional<EVT> NewVT = FirstVT; |
7041 | TypeSize RemainingWidth = LdWidth; |
7042 | TypeSize NewVTWidth = FirstVTWidth; |
7043 | do { |
7044 | RemainingWidth -= NewVTWidth; |
7045 | if (TypeSize::isKnownLT(LHS: RemainingWidth, RHS: NewVTWidth)) { |
7046 | // The current type we are using is too large. Find a better size. |
7047 | NewVT = findMemType(DAG, TLI, Width: RemainingWidth.getKnownMinValue(), |
7048 | WidenVT, Align: LdAlign, WidenEx: WidthDiff.getKnownMinValue()); |
7049 | if (!NewVT) |
7050 | return SDValue(); |
7051 | NewVTWidth = NewVT->getSizeInBits(); |
7052 | } |
7053 | MemVTs.push_back(Elt: *NewVT); |
7054 | } while (TypeSize::isKnownGT(LHS: RemainingWidth, RHS: NewVTWidth)); |
7055 | } |
7056 | |
7057 | SDValue LdOp = DAG.getLoad(VT: *FirstVT, dl, Chain, Ptr: BasePtr, PtrInfo: LD->getPointerInfo(), |
7058 | Alignment: LD->getOriginalAlign(), MMOFlags, AAInfo); |
7059 | LdChain.push_back(Elt: LdOp.getValue(R: 1)); |
7060 | |
7061 | // Check if we can load the element with one instruction. |
7062 | if (MemVTs.empty()) { |
7063 | assert(TypeSize::isKnownLE(LdWidth, FirstVTWidth)); |
7064 | if (!FirstVT->isVector()) { |
7065 | unsigned NumElts = |
7066 | WidenWidth.getFixedValue() / FirstVTWidth.getFixedValue(); |
7067 | EVT NewVecVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: *FirstVT, NumElements: NumElts); |
7068 | SDValue VecOp = DAG.getNode(Opcode: ISD::SCALAR_TO_VECTOR, DL: dl, VT: NewVecVT, Operand: LdOp); |
7069 | return DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: WidenVT, Operand: VecOp); |
7070 | } |
7071 | if (FirstVT == WidenVT) |
7072 | return LdOp; |
7073 | |
7074 | // TODO: We don't currently have any tests that exercise this code path. |
7075 | assert(WidenWidth.getFixedValue() % FirstVTWidth.getFixedValue() == 0); |
7076 | unsigned NumConcat = |
7077 | WidenWidth.getFixedValue() / FirstVTWidth.getFixedValue(); |
7078 | SmallVector<SDValue, 16> ConcatOps(NumConcat); |
7079 | SDValue UndefVal = DAG.getUNDEF(VT: *FirstVT); |
7080 | ConcatOps[0] = LdOp; |
7081 | for (unsigned i = 1; i != NumConcat; ++i) |
7082 | ConcatOps[i] = UndefVal; |
7083 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: WidenVT, Ops: ConcatOps); |
7084 | } |
7085 | |
7086 | // Load vector by using multiple loads from largest vector to scalar. |
7087 | SmallVector<SDValue, 16> LdOps; |
7088 | LdOps.push_back(Elt: LdOp); |
7089 | |
7090 | uint64_t ScaledOffset = 0; |
7091 | MachinePointerInfo MPI = LD->getPointerInfo(); |
7092 | |
7093 | // First incremement past the first load. |
7094 | IncrementPointer(N: cast<LoadSDNode>(Val&: LdOp), MemVT: *FirstVT, MPI, Ptr&: BasePtr, |
7095 | ScaledOffset: &ScaledOffset); |
7096 | |
7097 | for (EVT MemVT : MemVTs) { |
7098 | Align NewAlign = ScaledOffset == 0 |
7099 | ? LD->getOriginalAlign() |
7100 | : commonAlignment(A: LD->getAlign(), Offset: ScaledOffset); |
7101 | SDValue L = |
7102 | DAG.getLoad(VT: MemVT, dl, Chain, Ptr: BasePtr, PtrInfo: MPI, Alignment: NewAlign, MMOFlags, AAInfo); |
7103 | |
7104 | LdOps.push_back(Elt: L); |
7105 | LdChain.push_back(Elt: L.getValue(R: 1)); |
7106 | IncrementPointer(N: cast<LoadSDNode>(Val&: L), MemVT, MPI, Ptr&: BasePtr, ScaledOffset: &ScaledOffset); |
7107 | } |
7108 | |
7109 | // Build the vector from the load operations. |
7110 | unsigned End = LdOps.size(); |
7111 | if (!LdOps[0].getValueType().isVector()) |
7112 | // All the loads are scalar loads. |
7113 | return BuildVectorFromScalar(DAG, VecTy: WidenVT, LdOps, Start: 0, End); |
7114 | |
7115 | // If the load contains vectors, build the vector using concat vector. |
7116 | // All of the vectors used to load are power-of-2, and the scalar loads can be |
7117 | // combined to make a power-of-2 vector. |
7118 | SmallVector<SDValue, 16> ConcatOps(End); |
7119 | int i = End - 1; |
7120 | int Idx = End; |
7121 | EVT LdTy = LdOps[i].getValueType(); |
7122 | // First, combine the scalar loads to a vector. |
7123 | if (!LdTy.isVector()) { |
7124 | for (--i; i >= 0; --i) { |
7125 | LdTy = LdOps[i].getValueType(); |
7126 | if (LdTy.isVector()) |
7127 | break; |
7128 | } |
7129 | ConcatOps[--Idx] = BuildVectorFromScalar(DAG, VecTy: LdTy, LdOps, Start: i + 1, End); |
7130 | } |
7131 | |
7132 | ConcatOps[--Idx] = LdOps[i]; |
7133 | for (--i; i >= 0; --i) { |
7134 | EVT NewLdTy = LdOps[i].getValueType(); |
7135 | if (NewLdTy != LdTy) { |
7136 | // Create a larger vector. |
7137 | TypeSize LdTySize = LdTy.getSizeInBits(); |
7138 | TypeSize NewLdTySize = NewLdTy.getSizeInBits(); |
7139 | assert(NewLdTySize.isScalable() == LdTySize.isScalable() && |
7140 | NewLdTySize.isKnownMultipleOf(LdTySize.getKnownMinValue())); |
7141 | unsigned NumOps = |
7142 | NewLdTySize.getKnownMinValue() / LdTySize.getKnownMinValue(); |
7143 | SmallVector<SDValue, 16> WidenOps(NumOps); |
7144 | unsigned j = 0; |
7145 | for (; j != End-Idx; ++j) |
7146 | WidenOps[j] = ConcatOps[Idx+j]; |
7147 | for (; j != NumOps; ++j) |
7148 | WidenOps[j] = DAG.getUNDEF(VT: LdTy); |
7149 | |
7150 | ConcatOps[End-1] = DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: NewLdTy, |
7151 | Ops: WidenOps); |
7152 | Idx = End - 1; |
7153 | LdTy = NewLdTy; |
7154 | } |
7155 | ConcatOps[--Idx] = LdOps[i]; |
7156 | } |
7157 | |
7158 | if (WidenWidth == LdTy.getSizeInBits() * (End - Idx)) |
7159 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: WidenVT, |
7160 | Ops: ArrayRef(&ConcatOps[Idx], End - Idx)); |
7161 | |
7162 | // We need to fill the rest with undefs to build the vector. |
7163 | unsigned NumOps = |
7164 | WidenWidth.getKnownMinValue() / LdTy.getSizeInBits().getKnownMinValue(); |
7165 | SmallVector<SDValue, 16> WidenOps(NumOps); |
7166 | SDValue UndefVal = DAG.getUNDEF(VT: LdTy); |
7167 | { |
7168 | unsigned i = 0; |
7169 | for (; i != End-Idx; ++i) |
7170 | WidenOps[i] = ConcatOps[Idx+i]; |
7171 | for (; i != NumOps; ++i) |
7172 | WidenOps[i] = UndefVal; |
7173 | } |
7174 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: WidenVT, Ops: WidenOps); |
7175 | } |
7176 | |
7177 | SDValue |
7178 | DAGTypeLegalizer::GenWidenVectorExtLoads(SmallVectorImpl<SDValue> &LdChain, |
7179 | LoadSDNode *LD, |
7180 | ISD::LoadExtType ExtType) { |
7181 | // For extension loads, it may not be more efficient to chop up the vector |
7182 | // and then extend it. Instead, we unroll the load and build a new vector. |
7183 | EVT WidenVT = TLI.getTypeToTransformTo(Context&: *DAG.getContext(),VT: LD->getValueType(ResNo: 0)); |
7184 | EVT LdVT = LD->getMemoryVT(); |
7185 | SDLoc dl(LD); |
7186 | assert(LdVT.isVector() && WidenVT.isVector()); |
7187 | assert(LdVT.isScalableVector() == WidenVT.isScalableVector()); |
7188 | |
7189 | // Load information |
7190 | SDValue Chain = LD->getChain(); |
7191 | SDValue BasePtr = LD->getBasePtr(); |
7192 | MachineMemOperand::Flags MMOFlags = LD->getMemOperand()->getFlags(); |
7193 | AAMDNodes AAInfo = LD->getAAInfo(); |
7194 | |
7195 | if (LdVT.isScalableVector()) |
7196 | report_fatal_error(reason: "Generating widen scalable extending vector loads is " |
7197 | "not yet supported" ); |
7198 | |
7199 | EVT EltVT = WidenVT.getVectorElementType(); |
7200 | EVT LdEltVT = LdVT.getVectorElementType(); |
7201 | unsigned NumElts = LdVT.getVectorNumElements(); |
7202 | |
7203 | // Load each element and widen. |
7204 | unsigned WidenNumElts = WidenVT.getVectorNumElements(); |
7205 | SmallVector<SDValue, 16> Ops(WidenNumElts); |
7206 | unsigned Increment = LdEltVT.getSizeInBits() / 8; |
7207 | Ops[0] = |
7208 | DAG.getExtLoad(ExtType, dl, VT: EltVT, Chain, Ptr: BasePtr, PtrInfo: LD->getPointerInfo(), |
7209 | MemVT: LdEltVT, Alignment: LD->getOriginalAlign(), MMOFlags, AAInfo); |
7210 | LdChain.push_back(Elt: Ops[0].getValue(R: 1)); |
7211 | unsigned i = 0, Offset = Increment; |
7212 | for (i=1; i < NumElts; ++i, Offset += Increment) { |
7213 | SDValue NewBasePtr = |
7214 | DAG.getObjectPtrOffset(SL: dl, Ptr: BasePtr, Offset: TypeSize::getFixed(ExactSize: Offset)); |
7215 | Ops[i] = DAG.getExtLoad(ExtType, dl, VT: EltVT, Chain, Ptr: NewBasePtr, |
7216 | PtrInfo: LD->getPointerInfo().getWithOffset(O: Offset), MemVT: LdEltVT, |
7217 | Alignment: LD->getOriginalAlign(), MMOFlags, AAInfo); |
7218 | LdChain.push_back(Elt: Ops[i].getValue(R: 1)); |
7219 | } |
7220 | |
7221 | // Fill the rest with undefs. |
7222 | SDValue UndefVal = DAG.getUNDEF(VT: EltVT); |
7223 | for (; i != WidenNumElts; ++i) |
7224 | Ops[i] = UndefVal; |
7225 | |
7226 | return DAG.getBuildVector(VT: WidenVT, DL: dl, Ops); |
7227 | } |
7228 | |
7229 | bool DAGTypeLegalizer::GenWidenVectorStores(SmallVectorImpl<SDValue> &StChain, |
7230 | StoreSDNode *ST) { |
7231 | // The strategy assumes that we can efficiently store power-of-two widths. |
7232 | // The routine chops the vector into the largest vector stores with the same |
7233 | // element type or scalar stores. |
7234 | SDValue Chain = ST->getChain(); |
7235 | SDValue BasePtr = ST->getBasePtr(); |
7236 | MachineMemOperand::Flags MMOFlags = ST->getMemOperand()->getFlags(); |
7237 | AAMDNodes AAInfo = ST->getAAInfo(); |
7238 | SDValue ValOp = GetWidenedVector(Op: ST->getValue()); |
7239 | SDLoc dl(ST); |
7240 | |
7241 | EVT StVT = ST->getMemoryVT(); |
7242 | TypeSize StWidth = StVT.getSizeInBits(); |
7243 | EVT ValVT = ValOp.getValueType(); |
7244 | TypeSize ValWidth = ValVT.getSizeInBits(); |
7245 | EVT ValEltVT = ValVT.getVectorElementType(); |
7246 | unsigned ValEltWidth = ValEltVT.getFixedSizeInBits(); |
7247 | assert(StVT.getVectorElementType() == ValEltVT); |
7248 | assert(StVT.isScalableVector() == ValVT.isScalableVector() && |
7249 | "Mismatch between store and value types" ); |
7250 | |
7251 | int Idx = 0; // current index to store |
7252 | |
7253 | MachinePointerInfo MPI = ST->getPointerInfo(); |
7254 | uint64_t ScaledOffset = 0; |
7255 | |
7256 | // A breakdown of how to widen this vector store. Each element of the vector |
7257 | // is a memory VT combined with the number of times it is to be stored to, |
7258 | // e,g., v5i32 -> {{v2i32,2},{i32,1}} |
7259 | SmallVector<std::pair<EVT, unsigned>, 4> MemVTs; |
7260 | |
7261 | while (StWidth.isNonZero()) { |
7262 | // Find the largest vector type we can store with. |
7263 | std::optional<EVT> NewVT = |
7264 | findMemType(DAG, TLI, Width: StWidth.getKnownMinValue(), WidenVT: ValVT); |
7265 | if (!NewVT) |
7266 | return false; |
7267 | MemVTs.push_back(Elt: {*NewVT, 0}); |
7268 | TypeSize NewVTWidth = NewVT->getSizeInBits(); |
7269 | |
7270 | do { |
7271 | StWidth -= NewVTWidth; |
7272 | MemVTs.back().second++; |
7273 | } while (StWidth.isNonZero() && TypeSize::isKnownGE(LHS: StWidth, RHS: NewVTWidth)); |
7274 | } |
7275 | |
7276 | for (const auto &Pair : MemVTs) { |
7277 | EVT NewVT = Pair.first; |
7278 | unsigned Count = Pair.second; |
7279 | TypeSize NewVTWidth = NewVT.getSizeInBits(); |
7280 | |
7281 | if (NewVT.isVector()) { |
7282 | unsigned NumVTElts = NewVT.getVectorMinNumElements(); |
7283 | do { |
7284 | Align NewAlign = ScaledOffset == 0 |
7285 | ? ST->getOriginalAlign() |
7286 | : commonAlignment(A: ST->getAlign(), Offset: ScaledOffset); |
7287 | SDValue EOp = DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: NewVT, N1: ValOp, |
7288 | N2: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
7289 | SDValue PartStore = DAG.getStore(Chain, dl, Val: EOp, Ptr: BasePtr, PtrInfo: MPI, Alignment: NewAlign, |
7290 | MMOFlags, AAInfo); |
7291 | StChain.push_back(Elt: PartStore); |
7292 | |
7293 | Idx += NumVTElts; |
7294 | IncrementPointer(N: cast<StoreSDNode>(Val&: PartStore), MemVT: NewVT, MPI, Ptr&: BasePtr, |
7295 | ScaledOffset: &ScaledOffset); |
7296 | } while (--Count); |
7297 | } else { |
7298 | // Cast the vector to the scalar type we can store. |
7299 | unsigned NumElts = ValWidth.getFixedValue() / NewVTWidth.getFixedValue(); |
7300 | EVT NewVecVT = EVT::getVectorVT(Context&: *DAG.getContext(), VT: NewVT, NumElements: NumElts); |
7301 | SDValue VecOp = DAG.getNode(Opcode: ISD::BITCAST, DL: dl, VT: NewVecVT, Operand: ValOp); |
7302 | // Readjust index position based on new vector type. |
7303 | Idx = Idx * ValEltWidth / NewVTWidth.getFixedValue(); |
7304 | do { |
7305 | SDValue EOp = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: NewVT, N1: VecOp, |
7306 | N2: DAG.getVectorIdxConstant(Val: Idx++, DL: dl)); |
7307 | SDValue PartStore = |
7308 | DAG.getStore(Chain, dl, Val: EOp, Ptr: BasePtr, PtrInfo: MPI, Alignment: ST->getOriginalAlign(), |
7309 | MMOFlags, AAInfo); |
7310 | StChain.push_back(Elt: PartStore); |
7311 | |
7312 | IncrementPointer(N: cast<StoreSDNode>(Val&: PartStore), MemVT: NewVT, MPI, Ptr&: BasePtr); |
7313 | } while (--Count); |
7314 | // Restore index back to be relative to the original widen element type. |
7315 | Idx = Idx * NewVTWidth.getFixedValue() / ValEltWidth; |
7316 | } |
7317 | } |
7318 | |
7319 | return true; |
7320 | } |
7321 | |
7322 | /// Modifies a vector input (widen or narrows) to a vector of NVT. The |
7323 | /// input vector must have the same element type as NVT. |
7324 | /// FillWithZeroes specifies that the vector should be widened with zeroes. |
7325 | SDValue DAGTypeLegalizer::ModifyToType(SDValue InOp, EVT NVT, |
7326 | bool FillWithZeroes) { |
7327 | // Note that InOp might have been widened so it might already have |
7328 | // the right width or it might need be narrowed. |
7329 | EVT InVT = InOp.getValueType(); |
7330 | assert(InVT.getVectorElementType() == NVT.getVectorElementType() && |
7331 | "input and widen element type must match" ); |
7332 | assert(InVT.isScalableVector() == NVT.isScalableVector() && |
7333 | "cannot modify scalable vectors in this way" ); |
7334 | SDLoc dl(InOp); |
7335 | |
7336 | // Check if InOp already has the right width. |
7337 | if (InVT == NVT) |
7338 | return InOp; |
7339 | |
7340 | ElementCount InEC = InVT.getVectorElementCount(); |
7341 | ElementCount WidenEC = NVT.getVectorElementCount(); |
7342 | if (WidenEC.hasKnownScalarFactor(RHS: InEC)) { |
7343 | unsigned NumConcat = WidenEC.getKnownScalarFactor(RHS: InEC); |
7344 | SmallVector<SDValue, 16> Ops(NumConcat); |
7345 | SDValue FillVal = FillWithZeroes ? DAG.getConstant(Val: 0, DL: dl, VT: InVT) : |
7346 | DAG.getUNDEF(VT: InVT); |
7347 | Ops[0] = InOp; |
7348 | for (unsigned i = 1; i != NumConcat; ++i) |
7349 | Ops[i] = FillVal; |
7350 | |
7351 | return DAG.getNode(Opcode: ISD::CONCAT_VECTORS, DL: dl, VT: NVT, Ops); |
7352 | } |
7353 | |
7354 | if (InEC.hasKnownScalarFactor(RHS: WidenEC)) |
7355 | return DAG.getNode(Opcode: ISD::EXTRACT_SUBVECTOR, DL: dl, VT: NVT, N1: InOp, |
7356 | N2: DAG.getVectorIdxConstant(Val: 0, DL: dl)); |
7357 | |
7358 | assert(!InVT.isScalableVector() && !NVT.isScalableVector() && |
7359 | "Scalable vectors should have been handled already." ); |
7360 | |
7361 | unsigned InNumElts = InEC.getFixedValue(); |
7362 | unsigned WidenNumElts = WidenEC.getFixedValue(); |
7363 | |
7364 | // Fall back to extract and build (+ mask, if padding with zeros). |
7365 | SmallVector<SDValue, 16> Ops(WidenNumElts); |
7366 | EVT EltVT = NVT.getVectorElementType(); |
7367 | unsigned MinNumElts = std::min(a: WidenNumElts, b: InNumElts); |
7368 | unsigned Idx; |
7369 | for (Idx = 0; Idx < MinNumElts; ++Idx) |
7370 | Ops[Idx] = DAG.getNode(Opcode: ISD::EXTRACT_VECTOR_ELT, DL: dl, VT: EltVT, N1: InOp, |
7371 | N2: DAG.getVectorIdxConstant(Val: Idx, DL: dl)); |
7372 | |
7373 | SDValue UndefVal = DAG.getUNDEF(VT: EltVT); |
7374 | for (; Idx < WidenNumElts; ++Idx) |
7375 | Ops[Idx] = UndefVal; |
7376 | |
7377 | SDValue Widened = DAG.getBuildVector(VT: NVT, DL: dl, Ops); |
7378 | if (!FillWithZeroes) |
7379 | return Widened; |
7380 | |
7381 | assert(NVT.isInteger() && |
7382 | "We expect to never want to FillWithZeroes for non-integral types." ); |
7383 | |
7384 | SmallVector<SDValue, 16> MaskOps; |
7385 | MaskOps.append(NumInputs: MinNumElts, Elt: DAG.getAllOnesConstant(DL: dl, VT: EltVT)); |
7386 | MaskOps.append(NumInputs: WidenNumElts - MinNumElts, Elt: DAG.getConstant(Val: 0, DL: dl, VT: EltVT)); |
7387 | |
7388 | return DAG.getNode(Opcode: ISD::AND, DL: dl, VT: NVT, N1: Widened, |
7389 | N2: DAG.getBuildVector(VT: NVT, DL: dl, Ops: MaskOps)); |
7390 | } |
7391 | |