xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/MCTargetDesc/AMDGPUInstPrinter.cpp (revision ca53e5aedfebcc1b4091b68e01b2d5cae923f85e)
1 //===-- AMDGPUInstPrinter.cpp - AMDGPU MC Inst -> ASM ---------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 // \file
8 //===----------------------------------------------------------------------===//
9 
10 #include "AMDGPUInstPrinter.h"
11 #include "MCTargetDesc/AMDGPUMCTargetDesc.h"
12 #include "SIDefines.h"
13 #include "Utils/AMDGPUAsmUtils.h"
14 #include "Utils/AMDGPUBaseInfo.h"
15 #include "llvm/MC/MCExpr.h"
16 #include "llvm/MC/MCInst.h"
17 #include "llvm/MC/MCInstrDesc.h"
18 #include "llvm/MC/MCInstrInfo.h"
19 #include "llvm/MC/MCRegisterInfo.h"
20 #include "llvm/MC/MCSubtargetInfo.h"
21 #include "llvm/Support/CommandLine.h"
22 #include "llvm/Support/ErrorHandling.h"
23 #include "llvm/Support/MathExtras.h"
24 #include "llvm/Support/raw_ostream.h"
25 #include <cassert>
26 
27 using namespace llvm;
28 using namespace llvm::AMDGPU;
29 
30 static cl::opt<bool> Keep16BitSuffixes(
31   "amdgpu-keep-16-bit-reg-suffixes",
32   cl::desc("Keep .l and .h suffixes in asm for debugging purposes"),
33   cl::init(false),
34   cl::ReallyHidden);
35 
36 void AMDGPUInstPrinter::printRegName(raw_ostream &OS, unsigned RegNo) const {
37   // FIXME: The current implementation of
38   // AsmParser::parseRegisterOrRegisterNumber in MC implies we either emit this
39   // as an integer or we provide a name which represents a physical register.
40   // For CFI instructions we really want to emit a name for the DWARF register
41   // instead, because there may be multiple DWARF registers corresponding to a
42   // single physical register. One case where this problem manifests is with
43   // wave32/wave64 where using the physical register name is ambiguous: if we
44   // write e.g. `.cfi_undefined v0` we lose information about the wavefront
45   // size which we need to encode the register in the final DWARF. Ideally we
46   // would extend MC to support parsing DWARF register names so we could do
47   // something like `.cfi_undefined dwarf_wave32_v0`. For now we just live with
48   // non-pretty DWARF register names in assembly text.
49   OS << RegNo;
50 }
51 
52 void AMDGPUInstPrinter::printInst(const MCInst *MI, uint64_t Address,
53                                   StringRef Annot, const MCSubtargetInfo &STI,
54                                   raw_ostream &OS) {
55   OS.flush();
56   printInstruction(MI, Address, STI, OS);
57   printAnnotation(OS, Annot);
58 }
59 
60 void AMDGPUInstPrinter::printU4ImmOperand(const MCInst *MI, unsigned OpNo,
61                                           const MCSubtargetInfo &STI,
62                                           raw_ostream &O) {
63   O << formatHex(MI->getOperand(OpNo).getImm() & 0xf);
64 }
65 
66 void AMDGPUInstPrinter::printU8ImmOperand(const MCInst *MI, unsigned OpNo,
67                                           raw_ostream &O) {
68   O << formatHex(MI->getOperand(OpNo).getImm() & 0xff);
69 }
70 
71 void AMDGPUInstPrinter::printU16ImmOperand(const MCInst *MI, unsigned OpNo,
72                                            const MCSubtargetInfo &STI,
73                                            raw_ostream &O) {
74   // It's possible to end up with a 32-bit literal used with a 16-bit operand
75   // with ignored high bits. Print as 32-bit anyway in that case.
76   int64_t Imm = MI->getOperand(OpNo).getImm();
77   if (isInt<16>(Imm) || isUInt<16>(Imm))
78     O << formatHex(static_cast<uint64_t>(Imm & 0xffff));
79   else
80     printU32ImmOperand(MI, OpNo, STI, O);
81 }
82 
83 void AMDGPUInstPrinter::printU4ImmDecOperand(const MCInst *MI, unsigned OpNo,
84                                              raw_ostream &O) {
85   O << formatDec(MI->getOperand(OpNo).getImm() & 0xf);
86 }
87 
88 void AMDGPUInstPrinter::printU8ImmDecOperand(const MCInst *MI, unsigned OpNo,
89                                              raw_ostream &O) {
90   O << formatDec(MI->getOperand(OpNo).getImm() & 0xff);
91 }
92 
93 void AMDGPUInstPrinter::printU16ImmDecOperand(const MCInst *MI, unsigned OpNo,
94                                               raw_ostream &O) {
95   O << formatDec(MI->getOperand(OpNo).getImm() & 0xffff);
96 }
97 
98 void AMDGPUInstPrinter::printU32ImmOperand(const MCInst *MI, unsigned OpNo,
99                                            const MCSubtargetInfo &STI,
100                                            raw_ostream &O) {
101   O << formatHex(MI->getOperand(OpNo).getImm() & 0xffffffff);
102 }
103 
104 void AMDGPUInstPrinter::printNamedBit(const MCInst *MI, unsigned OpNo,
105                                       raw_ostream &O, StringRef BitName) {
106   if (MI->getOperand(OpNo).getImm()) {
107     O << ' ' << BitName;
108   }
109 }
110 
111 void AMDGPUInstPrinter::printOffen(const MCInst *MI, unsigned OpNo,
112                                    raw_ostream &O) {
113   printNamedBit(MI, OpNo, O, "offen");
114 }
115 
116 void AMDGPUInstPrinter::printIdxen(const MCInst *MI, unsigned OpNo,
117                                    raw_ostream &O) {
118   printNamedBit(MI, OpNo, O, "idxen");
119 }
120 
121 void AMDGPUInstPrinter::printAddr64(const MCInst *MI, unsigned OpNo,
122                                     raw_ostream &O) {
123   printNamedBit(MI, OpNo, O, "addr64");
124 }
125 
126 void AMDGPUInstPrinter::printMBUFOffset(const MCInst *MI, unsigned OpNo,
127                                         raw_ostream &O) {
128   if (MI->getOperand(OpNo).getImm()) {
129     O << " offset:";
130     printU16ImmDecOperand(MI, OpNo, O);
131   }
132 }
133 
134 void AMDGPUInstPrinter::printOffset(const MCInst *MI, unsigned OpNo,
135                                     const MCSubtargetInfo &STI,
136                                     raw_ostream &O) {
137   uint16_t Imm = MI->getOperand(OpNo).getImm();
138   if (Imm != 0) {
139     O << ((OpNo == 0)? "offset:" : " offset:");
140     printU16ImmDecOperand(MI, OpNo, O);
141   }
142 }
143 
144 void AMDGPUInstPrinter::printFlatOffset(const MCInst *MI, unsigned OpNo,
145                                         const MCSubtargetInfo &STI,
146                                         raw_ostream &O) {
147   uint16_t Imm = MI->getOperand(OpNo).getImm();
148   if (Imm != 0) {
149     O << ((OpNo == 0)? "offset:" : " offset:");
150 
151     const MCInstrDesc &Desc = MII.get(MI->getOpcode());
152     bool IsFlatSeg = !(Desc.TSFlags & SIInstrFlags::IsNonFlatSeg);
153 
154     if (IsFlatSeg) { // Unsigned offset
155       printU16ImmDecOperand(MI, OpNo, O);
156     } else {         // Signed offset
157       if (AMDGPU::isGFX10(STI)) {
158         O << formatDec(SignExtend32<12>(MI->getOperand(OpNo).getImm()));
159       } else {
160         O << formatDec(SignExtend32<13>(MI->getOperand(OpNo).getImm()));
161       }
162     }
163   }
164 }
165 
166 void AMDGPUInstPrinter::printOffset0(const MCInst *MI, unsigned OpNo,
167                                      const MCSubtargetInfo &STI,
168                                      raw_ostream &O) {
169   if (MI->getOperand(OpNo).getImm()) {
170     O << " offset0:";
171     printU8ImmDecOperand(MI, OpNo, O);
172   }
173 }
174 
175 void AMDGPUInstPrinter::printOffset1(const MCInst *MI, unsigned OpNo,
176                                      const MCSubtargetInfo &STI,
177                                      raw_ostream &O) {
178   if (MI->getOperand(OpNo).getImm()) {
179     O << " offset1:";
180     printU8ImmDecOperand(MI, OpNo, O);
181   }
182 }
183 
184 void AMDGPUInstPrinter::printSMRDOffset8(const MCInst *MI, unsigned OpNo,
185                                         const MCSubtargetInfo &STI,
186                                         raw_ostream &O) {
187   printU32ImmOperand(MI, OpNo, STI, O);
188 }
189 
190 void AMDGPUInstPrinter::printSMEMOffset(const MCInst *MI, unsigned OpNo,
191                                         const MCSubtargetInfo &STI,
192                                         raw_ostream &O) {
193   O << formatHex(MI->getOperand(OpNo).getImm());
194 }
195 
196 void AMDGPUInstPrinter::printSMRDLiteralOffset(const MCInst *MI, unsigned OpNo,
197                                                const MCSubtargetInfo &STI,
198                                                raw_ostream &O) {
199   printU32ImmOperand(MI, OpNo, STI, O);
200 }
201 
202 void AMDGPUInstPrinter::printGDS(const MCInst *MI, unsigned OpNo,
203                                  const MCSubtargetInfo &STI, raw_ostream &O) {
204   printNamedBit(MI, OpNo, O, "gds");
205 }
206 
207 void AMDGPUInstPrinter::printDLC(const MCInst *MI, unsigned OpNo,
208                                  const MCSubtargetInfo &STI, raw_ostream &O) {
209   if (AMDGPU::isGFX10(STI))
210     printNamedBit(MI, OpNo, O, "dlc");
211 }
212 
213 void AMDGPUInstPrinter::printGLC(const MCInst *MI, unsigned OpNo,
214                                  const MCSubtargetInfo &STI, raw_ostream &O) {
215   printNamedBit(MI, OpNo, O, "glc");
216 }
217 
218 void AMDGPUInstPrinter::printSLC(const MCInst *MI, unsigned OpNo,
219                                  const MCSubtargetInfo &STI, raw_ostream &O) {
220   printNamedBit(MI, OpNo, O, "slc");
221 }
222 
223 void AMDGPUInstPrinter::printSWZ(const MCInst *MI, unsigned OpNo,
224                                  const MCSubtargetInfo &STI, raw_ostream &O) {
225 }
226 
227 void AMDGPUInstPrinter::printTFE(const MCInst *MI, unsigned OpNo,
228                                  const MCSubtargetInfo &STI, raw_ostream &O) {
229   printNamedBit(MI, OpNo, O, "tfe");
230 }
231 
232 void AMDGPUInstPrinter::printDMask(const MCInst *MI, unsigned OpNo,
233                                    const MCSubtargetInfo &STI, raw_ostream &O) {
234   if (MI->getOperand(OpNo).getImm()) {
235     O << " dmask:";
236     printU16ImmOperand(MI, OpNo, STI, O);
237   }
238 }
239 
240 void AMDGPUInstPrinter::printDim(const MCInst *MI, unsigned OpNo,
241                                  const MCSubtargetInfo &STI, raw_ostream &O) {
242   unsigned Dim = MI->getOperand(OpNo).getImm();
243   O << " dim:SQ_RSRC_IMG_";
244 
245   const AMDGPU::MIMGDimInfo *DimInfo = AMDGPU::getMIMGDimInfoByEncoding(Dim);
246   if (DimInfo)
247     O << DimInfo->AsmSuffix;
248   else
249     O << Dim;
250 }
251 
252 void AMDGPUInstPrinter::printUNorm(const MCInst *MI, unsigned OpNo,
253                                    const MCSubtargetInfo &STI, raw_ostream &O) {
254   printNamedBit(MI, OpNo, O, "unorm");
255 }
256 
257 void AMDGPUInstPrinter::printDA(const MCInst *MI, unsigned OpNo,
258                                 const MCSubtargetInfo &STI, raw_ostream &O) {
259   printNamedBit(MI, OpNo, O, "da");
260 }
261 
262 void AMDGPUInstPrinter::printR128A16(const MCInst *MI, unsigned OpNo,
263                                   const MCSubtargetInfo &STI, raw_ostream &O) {
264   if (STI.hasFeature(AMDGPU::FeatureR128A16))
265     printNamedBit(MI, OpNo, O, "a16");
266   else
267     printNamedBit(MI, OpNo, O, "r128");
268 }
269 
270 void AMDGPUInstPrinter::printGFX10A16(const MCInst *MI, unsigned OpNo,
271                                   const MCSubtargetInfo &STI, raw_ostream &O) {
272   printNamedBit(MI, OpNo, O, "a16");
273 }
274 
275 void AMDGPUInstPrinter::printLWE(const MCInst *MI, unsigned OpNo,
276                                  const MCSubtargetInfo &STI, raw_ostream &O) {
277   printNamedBit(MI, OpNo, O, "lwe");
278 }
279 
280 void AMDGPUInstPrinter::printD16(const MCInst *MI, unsigned OpNo,
281                                  const MCSubtargetInfo &STI, raw_ostream &O) {
282   printNamedBit(MI, OpNo, O, "d16");
283 }
284 
285 void AMDGPUInstPrinter::printExpCompr(const MCInst *MI, unsigned OpNo,
286                                       const MCSubtargetInfo &STI,
287                                       raw_ostream &O) {
288   if (MI->getOperand(OpNo).getImm())
289     O << " compr";
290 }
291 
292 void AMDGPUInstPrinter::printExpVM(const MCInst *MI, unsigned OpNo,
293                                    const MCSubtargetInfo &STI,
294                                    raw_ostream &O) {
295   if (MI->getOperand(OpNo).getImm())
296     O << " vm";
297 }
298 
299 void AMDGPUInstPrinter::printFORMAT(const MCInst *MI, unsigned OpNo,
300                                     const MCSubtargetInfo &STI,
301                                     raw_ostream &O) {
302   if (unsigned Val = MI->getOperand(OpNo).getImm()) {
303     if (AMDGPU::isGFX10(STI))
304       O << " format:" << Val;
305     else {
306       O << " dfmt:" << (Val & 15);
307       O << ", nfmt:" << (Val >> 4);
308     }
309   }
310 }
311 
312 void AMDGPUInstPrinter::printRegOperand(unsigned RegNo, raw_ostream &O,
313                                         const MCRegisterInfo &MRI) {
314 #if !defined(NDEBUG)
315   switch (RegNo) {
316   case AMDGPU::FP_REG:
317   case AMDGPU::SP_REG:
318   case AMDGPU::PRIVATE_RSRC_REG:
319     llvm_unreachable("pseudo-register should not ever be emitted");
320   case AMDGPU::SCC:
321     llvm_unreachable("pseudo scc should not ever be emitted");
322   default:
323     break;
324   }
325 #endif
326 
327   StringRef RegName(getRegisterName(RegNo));
328   if (!Keep16BitSuffixes)
329     if (!RegName.consume_back(".l"))
330       RegName.consume_back(".h");
331 
332   O << RegName;
333 }
334 
335 void AMDGPUInstPrinter::printVOPDst(const MCInst *MI, unsigned OpNo,
336                                     const MCSubtargetInfo &STI, raw_ostream &O) {
337   if (OpNo == 0) {
338     if (MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::VOP3)
339       O << "_e64 ";
340     else if (MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::DPP)
341       O << "_dpp ";
342     else if (MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::SDWA)
343       O << "_sdwa ";
344     else
345       O << "_e32 ";
346   }
347 
348   printOperand(MI, OpNo, STI, O);
349 
350   // Print default vcc/vcc_lo operand.
351   switch (MI->getOpcode()) {
352   default: break;
353 
354   case AMDGPU::V_ADD_CO_CI_U32_e32_gfx10:
355   case AMDGPU::V_SUB_CO_CI_U32_e32_gfx10:
356   case AMDGPU::V_SUBREV_CO_CI_U32_e32_gfx10:
357   case AMDGPU::V_ADD_CO_CI_U32_sdwa_gfx10:
358   case AMDGPU::V_SUB_CO_CI_U32_sdwa_gfx10:
359   case AMDGPU::V_SUBREV_CO_CI_U32_sdwa_gfx10:
360   case AMDGPU::V_ADD_CO_CI_U32_dpp_gfx10:
361   case AMDGPU::V_SUB_CO_CI_U32_dpp_gfx10:
362   case AMDGPU::V_SUBREV_CO_CI_U32_dpp_gfx10:
363   case AMDGPU::V_ADD_CO_CI_U32_dpp8_gfx10:
364   case AMDGPU::V_SUB_CO_CI_U32_dpp8_gfx10:
365   case AMDGPU::V_SUBREV_CO_CI_U32_dpp8_gfx10:
366     printDefaultVccOperand(1, STI, O);
367     break;
368   }
369 }
370 
371 void AMDGPUInstPrinter::printVINTRPDst(const MCInst *MI, unsigned OpNo,
372                                        const MCSubtargetInfo &STI, raw_ostream &O) {
373   if (AMDGPU::isSI(STI) || AMDGPU::isCI(STI))
374     O << " ";
375   else
376     O << "_e32 ";
377 
378   printOperand(MI, OpNo, STI, O);
379 }
380 
381 void AMDGPUInstPrinter::printImmediateInt16(uint32_t Imm,
382                                             const MCSubtargetInfo &STI,
383                                             raw_ostream &O) {
384   int16_t SImm = static_cast<int16_t>(Imm);
385   if (isInlinableIntLiteral(SImm))
386     O << SImm;
387   else
388     O << formatHex(static_cast<uint64_t>(Imm));
389 }
390 
391 void AMDGPUInstPrinter::printImmediate16(uint32_t Imm,
392                                          const MCSubtargetInfo &STI,
393                                          raw_ostream &O) {
394   int16_t SImm = static_cast<int16_t>(Imm);
395   if (isInlinableIntLiteral(SImm)) {
396     O << SImm;
397     return;
398   }
399 
400   if (Imm == 0x3C00)
401     O<< "1.0";
402   else if (Imm == 0xBC00)
403     O<< "-1.0";
404   else if (Imm == 0x3800)
405     O<< "0.5";
406   else if (Imm == 0xB800)
407     O<< "-0.5";
408   else if (Imm == 0x4000)
409     O<< "2.0";
410   else if (Imm == 0xC000)
411     O<< "-2.0";
412   else if (Imm == 0x4400)
413     O<< "4.0";
414   else if (Imm == 0xC400)
415     O<< "-4.0";
416   else if (Imm == 0x3118) {
417     assert(STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm]);
418     O << "0.15915494";
419   } else
420     O << formatHex(static_cast<uint64_t>(Imm));
421 }
422 
423 void AMDGPUInstPrinter::printImmediateV216(uint32_t Imm,
424                                            const MCSubtargetInfo &STI,
425                                            raw_ostream &O) {
426   uint16_t Lo16 = static_cast<uint16_t>(Imm);
427   printImmediate16(Lo16, STI, O);
428 }
429 
430 void AMDGPUInstPrinter::printImmediate32(uint32_t Imm,
431                                          const MCSubtargetInfo &STI,
432                                          raw_ostream &O) {
433   int32_t SImm = static_cast<int32_t>(Imm);
434   if (SImm >= -16 && SImm <= 64) {
435     O << SImm;
436     return;
437   }
438 
439   if (Imm == FloatToBits(0.0f))
440     O << "0.0";
441   else if (Imm == FloatToBits(1.0f))
442     O << "1.0";
443   else if (Imm == FloatToBits(-1.0f))
444     O << "-1.0";
445   else if (Imm == FloatToBits(0.5f))
446     O << "0.5";
447   else if (Imm == FloatToBits(-0.5f))
448     O << "-0.5";
449   else if (Imm == FloatToBits(2.0f))
450     O << "2.0";
451   else if (Imm == FloatToBits(-2.0f))
452     O << "-2.0";
453   else if (Imm == FloatToBits(4.0f))
454     O << "4.0";
455   else if (Imm == FloatToBits(-4.0f))
456     O << "-4.0";
457   else if (Imm == 0x3e22f983 &&
458            STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm])
459     O << "0.15915494";
460   else
461     O << formatHex(static_cast<uint64_t>(Imm));
462 }
463 
464 void AMDGPUInstPrinter::printImmediate64(uint64_t Imm,
465                                          const MCSubtargetInfo &STI,
466                                          raw_ostream &O) {
467   int64_t SImm = static_cast<int64_t>(Imm);
468   if (SImm >= -16 && SImm <= 64) {
469     O << SImm;
470     return;
471   }
472 
473   if (Imm == DoubleToBits(0.0))
474     O << "0.0";
475   else if (Imm == DoubleToBits(1.0))
476     O << "1.0";
477   else if (Imm == DoubleToBits(-1.0))
478     O << "-1.0";
479   else if (Imm == DoubleToBits(0.5))
480     O << "0.5";
481   else if (Imm == DoubleToBits(-0.5))
482     O << "-0.5";
483   else if (Imm == DoubleToBits(2.0))
484     O << "2.0";
485   else if (Imm == DoubleToBits(-2.0))
486     O << "-2.0";
487   else if (Imm == DoubleToBits(4.0))
488     O << "4.0";
489   else if (Imm == DoubleToBits(-4.0))
490     O << "-4.0";
491   else if (Imm == 0x3fc45f306dc9c882 &&
492            STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm])
493     O << "0.15915494309189532";
494   else {
495     assert(isUInt<32>(Imm) || Imm == 0x3fc45f306dc9c882);
496 
497     // In rare situations, we will have a 32-bit literal in a 64-bit
498     // operand. This is technically allowed for the encoding of s_mov_b64.
499     O << formatHex(static_cast<uint64_t>(Imm));
500   }
501 }
502 
503 void AMDGPUInstPrinter::printBLGP(const MCInst *MI, unsigned OpNo,
504                                   const MCSubtargetInfo &STI,
505                                   raw_ostream &O) {
506   unsigned Imm = MI->getOperand(OpNo).getImm();
507   if (!Imm)
508     return;
509 
510   O << " blgp:" << Imm;
511 }
512 
513 void AMDGPUInstPrinter::printCBSZ(const MCInst *MI, unsigned OpNo,
514                                   const MCSubtargetInfo &STI,
515                                   raw_ostream &O) {
516   unsigned Imm = MI->getOperand(OpNo).getImm();
517   if (!Imm)
518     return;
519 
520   O << " cbsz:" << Imm;
521 }
522 
523 void AMDGPUInstPrinter::printABID(const MCInst *MI, unsigned OpNo,
524                                   const MCSubtargetInfo &STI,
525                                   raw_ostream &O) {
526   unsigned Imm = MI->getOperand(OpNo).getImm();
527   if (!Imm)
528     return;
529 
530   O << " abid:" << Imm;
531 }
532 
533 void AMDGPUInstPrinter::printDefaultVccOperand(unsigned OpNo,
534                                                const MCSubtargetInfo &STI,
535                                                raw_ostream &O) {
536   if (OpNo > 0)
537     O << ", ";
538   printRegOperand(STI.getFeatureBits()[AMDGPU::FeatureWavefrontSize64] ?
539                   AMDGPU::VCC : AMDGPU::VCC_LO, O, MRI);
540   if (OpNo == 0)
541     O << ", ";
542 }
543 
544 void AMDGPUInstPrinter::printOperand(const MCInst *MI, unsigned OpNo,
545                                      const MCSubtargetInfo &STI,
546                                      raw_ostream &O) {
547   // Print default vcc/vcc_lo operand of VOPC.
548   const MCInstrDesc &Desc = MII.get(MI->getOpcode());
549   if (OpNo == 0 && (Desc.TSFlags & SIInstrFlags::VOPC) &&
550       (Desc.hasImplicitDefOfPhysReg(AMDGPU::VCC) ||
551        Desc.hasImplicitDefOfPhysReg(AMDGPU::VCC_LO)))
552     printDefaultVccOperand(OpNo, STI, O);
553 
554   if (OpNo >= MI->getNumOperands()) {
555     O << "/*Missing OP" << OpNo << "*/";
556     return;
557   }
558 
559   const MCOperand &Op = MI->getOperand(OpNo);
560   if (Op.isReg()) {
561     printRegOperand(Op.getReg(), O, MRI);
562   } else if (Op.isImm()) {
563     const uint8_t OpTy = Desc.OpInfo[OpNo].OperandType;
564     switch (OpTy) {
565     case AMDGPU::OPERAND_REG_IMM_INT32:
566     case AMDGPU::OPERAND_REG_IMM_FP32:
567     case AMDGPU::OPERAND_REG_INLINE_C_INT32:
568     case AMDGPU::OPERAND_REG_INLINE_C_FP32:
569     case AMDGPU::OPERAND_REG_INLINE_AC_INT32:
570     case AMDGPU::OPERAND_REG_INLINE_AC_FP32:
571     case MCOI::OPERAND_IMMEDIATE:
572       printImmediate32(Op.getImm(), STI, O);
573       break;
574     case AMDGPU::OPERAND_REG_IMM_INT64:
575     case AMDGPU::OPERAND_REG_IMM_FP64:
576     case AMDGPU::OPERAND_REG_INLINE_C_INT64:
577     case AMDGPU::OPERAND_REG_INLINE_C_FP64:
578       printImmediate64(Op.getImm(), STI, O);
579       break;
580     case AMDGPU::OPERAND_REG_INLINE_C_INT16:
581     case AMDGPU::OPERAND_REG_INLINE_AC_INT16:
582     case AMDGPU::OPERAND_REG_IMM_INT16:
583       printImmediateInt16(Op.getImm(), STI, O);
584       break;
585     case AMDGPU::OPERAND_REG_INLINE_C_FP16:
586     case AMDGPU::OPERAND_REG_INLINE_AC_FP16:
587     case AMDGPU::OPERAND_REG_IMM_FP16:
588       printImmediate16(Op.getImm(), STI, O);
589       break;
590     case AMDGPU::OPERAND_REG_IMM_V2INT16:
591     case AMDGPU::OPERAND_REG_IMM_V2FP16:
592       if (!isUInt<16>(Op.getImm()) &&
593           STI.getFeatureBits()[AMDGPU::FeatureVOP3Literal]) {
594         printImmediate32(Op.getImm(), STI, O);
595         break;
596       }
597 
598       //  Deal with 16-bit FP inline immediates not working.
599       if (OpTy == AMDGPU::OPERAND_REG_IMM_V2FP16) {
600         printImmediate16(static_cast<uint16_t>(Op.getImm()), STI, O);
601         break;
602       }
603       LLVM_FALLTHROUGH;
604     case AMDGPU::OPERAND_REG_INLINE_C_V2INT16:
605     case AMDGPU::OPERAND_REG_INLINE_AC_V2INT16:
606       printImmediateInt16(static_cast<uint16_t>(Op.getImm()), STI, O);
607       break;
608     case AMDGPU::OPERAND_REG_INLINE_C_V2FP16:
609     case AMDGPU::OPERAND_REG_INLINE_AC_V2FP16:
610       printImmediateV216(Op.getImm(), STI, O);
611       break;
612     case MCOI::OPERAND_UNKNOWN:
613     case MCOI::OPERAND_PCREL:
614       O << formatDec(Op.getImm());
615       break;
616     case MCOI::OPERAND_REGISTER:
617       // FIXME: This should be removed and handled somewhere else. Seems to come
618       // from a disassembler bug.
619       O << "/*invalid immediate*/";
620       break;
621     default:
622       // We hit this for the immediate instruction bits that don't yet have a
623       // custom printer.
624       llvm_unreachable("unexpected immediate operand type");
625     }
626   } else if (Op.isFPImm()) {
627     // We special case 0.0 because otherwise it will be printed as an integer.
628     if (Op.getFPImm() == 0.0)
629       O << "0.0";
630     else {
631       const MCInstrDesc &Desc = MII.get(MI->getOpcode());
632       int RCID = Desc.OpInfo[OpNo].RegClass;
633       unsigned RCBits = AMDGPU::getRegBitWidth(MRI.getRegClass(RCID));
634       if (RCBits == 32)
635         printImmediate32(FloatToBits(Op.getFPImm()), STI, O);
636       else if (RCBits == 64)
637         printImmediate64(DoubleToBits(Op.getFPImm()), STI, O);
638       else
639         llvm_unreachable("Invalid register class size");
640     }
641   } else if (Op.isExpr()) {
642     const MCExpr *Exp = Op.getExpr();
643     Exp->print(O, &MAI);
644   } else {
645     O << "/*INV_OP*/";
646   }
647 
648   // Print default vcc/vcc_lo operand of v_cndmask_b32_e32.
649   switch (MI->getOpcode()) {
650   default: break;
651 
652   case AMDGPU::V_CNDMASK_B32_e32_gfx10:
653   case AMDGPU::V_ADD_CO_CI_U32_e32_gfx10:
654   case AMDGPU::V_SUB_CO_CI_U32_e32_gfx10:
655   case AMDGPU::V_SUBREV_CO_CI_U32_e32_gfx10:
656   case AMDGPU::V_CNDMASK_B32_dpp_gfx10:
657   case AMDGPU::V_ADD_CO_CI_U32_dpp_gfx10:
658   case AMDGPU::V_SUB_CO_CI_U32_dpp_gfx10:
659   case AMDGPU::V_SUBREV_CO_CI_U32_dpp_gfx10:
660   case AMDGPU::V_CNDMASK_B32_dpp8_gfx10:
661   case AMDGPU::V_ADD_CO_CI_U32_dpp8_gfx10:
662   case AMDGPU::V_SUB_CO_CI_U32_dpp8_gfx10:
663   case AMDGPU::V_SUBREV_CO_CI_U32_dpp8_gfx10:
664 
665   case AMDGPU::V_CNDMASK_B32_e32_gfx6_gfx7:
666   case AMDGPU::V_CNDMASK_B32_e32_vi:
667     if ((int)OpNo == AMDGPU::getNamedOperandIdx(MI->getOpcode(),
668                                                 AMDGPU::OpName::src1))
669       printDefaultVccOperand(OpNo, STI, O);
670     break;
671   }
672 }
673 
674 void AMDGPUInstPrinter::printOperandAndFPInputMods(const MCInst *MI,
675                                                    unsigned OpNo,
676                                                    const MCSubtargetInfo &STI,
677                                                    raw_ostream &O) {
678   unsigned InputModifiers = MI->getOperand(OpNo).getImm();
679 
680   // Use 'neg(...)' instead of '-' to avoid ambiguity.
681   // This is important for integer literals because
682   // -1 is not the same value as neg(1).
683   bool NegMnemo = false;
684 
685   if (InputModifiers & SISrcMods::NEG) {
686     if (OpNo + 1 < MI->getNumOperands() &&
687         (InputModifiers & SISrcMods::ABS) == 0) {
688       const MCOperand &Op = MI->getOperand(OpNo + 1);
689       NegMnemo = Op.isImm() || Op.isFPImm();
690     }
691     if (NegMnemo) {
692       O << "neg(";
693     } else {
694       O << '-';
695     }
696   }
697 
698   if (InputModifiers & SISrcMods::ABS)
699     O << '|';
700   printOperand(MI, OpNo + 1, STI, O);
701   if (InputModifiers & SISrcMods::ABS)
702     O << '|';
703 
704   if (NegMnemo) {
705     O << ')';
706   }
707 }
708 
709 void AMDGPUInstPrinter::printOperandAndIntInputMods(const MCInst *MI,
710                                                     unsigned OpNo,
711                                                     const MCSubtargetInfo &STI,
712                                                     raw_ostream &O) {
713   unsigned InputModifiers = MI->getOperand(OpNo).getImm();
714   if (InputModifiers & SISrcMods::SEXT)
715     O << "sext(";
716   printOperand(MI, OpNo + 1, STI, O);
717   if (InputModifiers & SISrcMods::SEXT)
718     O << ')';
719 
720   // Print default vcc/vcc_lo operand of VOP2b.
721   switch (MI->getOpcode()) {
722   default: break;
723 
724   case AMDGPU::V_CNDMASK_B32_sdwa_gfx10:
725   case AMDGPU::V_ADD_CO_CI_U32_sdwa_gfx10:
726   case AMDGPU::V_SUB_CO_CI_U32_sdwa_gfx10:
727   case AMDGPU::V_SUBREV_CO_CI_U32_sdwa_gfx10:
728     if ((int)OpNo + 1 == AMDGPU::getNamedOperandIdx(MI->getOpcode(),
729                                                     AMDGPU::OpName::src1))
730       printDefaultVccOperand(OpNo, STI, O);
731     break;
732   }
733 }
734 
735 void AMDGPUInstPrinter::printDPP8(const MCInst *MI, unsigned OpNo,
736                                   const MCSubtargetInfo &STI,
737                                   raw_ostream &O) {
738   if (!AMDGPU::isGFX10(STI))
739     llvm_unreachable("dpp8 is not supported on ASICs earlier than GFX10");
740 
741   unsigned Imm = MI->getOperand(OpNo).getImm();
742   O << " dpp8:[" << formatDec(Imm & 0x7);
743   for (size_t i = 1; i < 8; ++i) {
744     O << ',' << formatDec((Imm >> (3 * i)) & 0x7);
745   }
746   O << ']';
747 }
748 
749 void AMDGPUInstPrinter::printDPPCtrl(const MCInst *MI, unsigned OpNo,
750                                      const MCSubtargetInfo &STI,
751                                      raw_ostream &O) {
752   using namespace AMDGPU::DPP;
753 
754   unsigned Imm = MI->getOperand(OpNo).getImm();
755   if (Imm <= DppCtrl::QUAD_PERM_LAST) {
756     O << " quad_perm:[";
757     O << formatDec(Imm & 0x3)         << ',';
758     O << formatDec((Imm & 0xc)  >> 2) << ',';
759     O << formatDec((Imm & 0x30) >> 4) << ',';
760     O << formatDec((Imm & 0xc0) >> 6) << ']';
761   } else if ((Imm >= DppCtrl::ROW_SHL_FIRST) &&
762              (Imm <= DppCtrl::ROW_SHL_LAST)) {
763     O << " row_shl:";
764     printU4ImmDecOperand(MI, OpNo, O);
765   } else if ((Imm >= DppCtrl::ROW_SHR_FIRST) &&
766              (Imm <= DppCtrl::ROW_SHR_LAST)) {
767     O << " row_shr:";
768     printU4ImmDecOperand(MI, OpNo, O);
769   } else if ((Imm >= DppCtrl::ROW_ROR_FIRST) &&
770              (Imm <= DppCtrl::ROW_ROR_LAST)) {
771     O << " row_ror:";
772     printU4ImmDecOperand(MI, OpNo, O);
773   } else if (Imm == DppCtrl::WAVE_SHL1) {
774     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
775       O << " /* wave_shl is not supported starting from GFX10 */";
776       return;
777     }
778     O << " wave_shl:1";
779   } else if (Imm == DppCtrl::WAVE_ROL1) {
780     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
781       O << " /* wave_rol is not supported starting from GFX10 */";
782       return;
783     }
784     O << " wave_rol:1";
785   } else if (Imm == DppCtrl::WAVE_SHR1) {
786     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
787       O << " /* wave_shr is not supported starting from GFX10 */";
788       return;
789     }
790     O << " wave_shr:1";
791   } else if (Imm == DppCtrl::WAVE_ROR1) {
792     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
793       O << " /* wave_ror is not supported starting from GFX10 */";
794       return;
795     }
796     O << " wave_ror:1";
797   } else if (Imm == DppCtrl::ROW_MIRROR) {
798     O << " row_mirror";
799   } else if (Imm == DppCtrl::ROW_HALF_MIRROR) {
800     O << " row_half_mirror";
801   } else if (Imm == DppCtrl::BCAST15) {
802     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
803       O << " /* row_bcast is not supported starting from GFX10 */";
804       return;
805     }
806     O << " row_bcast:15";
807   } else if (Imm == DppCtrl::BCAST31) {
808     if (!AMDGPU::isVI(STI) && !AMDGPU::isGFX9(STI)) {
809       O << " /* row_bcast is not supported starting from GFX10 */";
810       return;
811     }
812     O << " row_bcast:31";
813   } else if ((Imm >= DppCtrl::ROW_SHARE_FIRST) &&
814              (Imm <= DppCtrl::ROW_SHARE_LAST)) {
815     if (!AMDGPU::isGFX10(STI)) {
816       O << " /* row_share is not supported on ASICs earlier than GFX10 */";
817       return;
818     }
819     O << " row_share:";
820     printU4ImmDecOperand(MI, OpNo, O);
821   } else if ((Imm >= DppCtrl::ROW_XMASK_FIRST) &&
822              (Imm <= DppCtrl::ROW_XMASK_LAST)) {
823     if (!AMDGPU::isGFX10(STI)) {
824       O << " /* row_xmask is not supported on ASICs earlier than GFX10 */";
825       return;
826     }
827     O << "row_xmask:";
828     printU4ImmDecOperand(MI, OpNo, O);
829   } else {
830     O << " /* Invalid dpp_ctrl value */";
831   }
832 }
833 
834 void AMDGPUInstPrinter::printRowMask(const MCInst *MI, unsigned OpNo,
835                                      const MCSubtargetInfo &STI,
836                                      raw_ostream &O) {
837   O << " row_mask:";
838   printU4ImmOperand(MI, OpNo, STI, O);
839 }
840 
841 void AMDGPUInstPrinter::printBankMask(const MCInst *MI, unsigned OpNo,
842                                       const MCSubtargetInfo &STI,
843                                       raw_ostream &O) {
844   O << " bank_mask:";
845   printU4ImmOperand(MI, OpNo, STI, O);
846 }
847 
848 void AMDGPUInstPrinter::printBoundCtrl(const MCInst *MI, unsigned OpNo,
849                                        const MCSubtargetInfo &STI,
850                                        raw_ostream &O) {
851   unsigned Imm = MI->getOperand(OpNo).getImm();
852   if (Imm) {
853     O << " bound_ctrl:0"; // XXX - this syntax is used in sp3
854   }
855 }
856 
857 void AMDGPUInstPrinter::printFI(const MCInst *MI, unsigned OpNo,
858                                 const MCSubtargetInfo &STI,
859                                 raw_ostream &O) {
860   using namespace llvm::AMDGPU::DPP;
861   unsigned Imm = MI->getOperand(OpNo).getImm();
862   if (Imm == DPP_FI_1 || Imm == DPP8_FI_1) {
863     O << " fi:1";
864   }
865 }
866 
867 void AMDGPUInstPrinter::printSDWASel(const MCInst *MI, unsigned OpNo,
868                                      raw_ostream &O) {
869   using namespace llvm::AMDGPU::SDWA;
870 
871   unsigned Imm = MI->getOperand(OpNo).getImm();
872   switch (Imm) {
873   case SdwaSel::BYTE_0: O << "BYTE_0"; break;
874   case SdwaSel::BYTE_1: O << "BYTE_1"; break;
875   case SdwaSel::BYTE_2: O << "BYTE_2"; break;
876   case SdwaSel::BYTE_3: O << "BYTE_3"; break;
877   case SdwaSel::WORD_0: O << "WORD_0"; break;
878   case SdwaSel::WORD_1: O << "WORD_1"; break;
879   case SdwaSel::DWORD: O << "DWORD"; break;
880   default: llvm_unreachable("Invalid SDWA data select operand");
881   }
882 }
883 
884 void AMDGPUInstPrinter::printSDWADstSel(const MCInst *MI, unsigned OpNo,
885                                         const MCSubtargetInfo &STI,
886                                         raw_ostream &O) {
887   O << "dst_sel:";
888   printSDWASel(MI, OpNo, O);
889 }
890 
891 void AMDGPUInstPrinter::printSDWASrc0Sel(const MCInst *MI, unsigned OpNo,
892                                          const MCSubtargetInfo &STI,
893                                          raw_ostream &O) {
894   O << "src0_sel:";
895   printSDWASel(MI, OpNo, O);
896 }
897 
898 void AMDGPUInstPrinter::printSDWASrc1Sel(const MCInst *MI, unsigned OpNo,
899                                          const MCSubtargetInfo &STI,
900                                          raw_ostream &O) {
901   O << "src1_sel:";
902   printSDWASel(MI, OpNo, O);
903 }
904 
905 void AMDGPUInstPrinter::printSDWADstUnused(const MCInst *MI, unsigned OpNo,
906                                            const MCSubtargetInfo &STI,
907                                            raw_ostream &O) {
908   using namespace llvm::AMDGPU::SDWA;
909 
910   O << "dst_unused:";
911   unsigned Imm = MI->getOperand(OpNo).getImm();
912   switch (Imm) {
913   case DstUnused::UNUSED_PAD: O << "UNUSED_PAD"; break;
914   case DstUnused::UNUSED_SEXT: O << "UNUSED_SEXT"; break;
915   case DstUnused::UNUSED_PRESERVE: O << "UNUSED_PRESERVE"; break;
916   default: llvm_unreachable("Invalid SDWA dest_unused operand");
917   }
918 }
919 
920 template <unsigned N>
921 void AMDGPUInstPrinter::printExpSrcN(const MCInst *MI, unsigned OpNo,
922                                      const MCSubtargetInfo &STI,
923                                      raw_ostream &O) {
924   unsigned Opc = MI->getOpcode();
925   int EnIdx = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::en);
926   unsigned En = MI->getOperand(EnIdx).getImm();
927 
928   int ComprIdx = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::compr);
929 
930   // If compr is set, print as src0, src0, src1, src1
931   if (MI->getOperand(ComprIdx).getImm()) {
932     if (N == 1 || N == 2)
933       --OpNo;
934     else if (N == 3)
935       OpNo -= 2;
936   }
937 
938   if (En & (1 << N))
939     printRegOperand(MI->getOperand(OpNo).getReg(), O, MRI);
940   else
941     O << "off";
942 }
943 
944 void AMDGPUInstPrinter::printExpSrc0(const MCInst *MI, unsigned OpNo,
945                                      const MCSubtargetInfo &STI,
946                                      raw_ostream &O) {
947   printExpSrcN<0>(MI, OpNo, STI, O);
948 }
949 
950 void AMDGPUInstPrinter::printExpSrc1(const MCInst *MI, unsigned OpNo,
951                                      const MCSubtargetInfo &STI,
952                                      raw_ostream &O) {
953   printExpSrcN<1>(MI, OpNo, STI, O);
954 }
955 
956 void AMDGPUInstPrinter::printExpSrc2(const MCInst *MI, unsigned OpNo,
957                                      const MCSubtargetInfo &STI,
958                                      raw_ostream &O) {
959   printExpSrcN<2>(MI, OpNo, STI, O);
960 }
961 
962 void AMDGPUInstPrinter::printExpSrc3(const MCInst *MI, unsigned OpNo,
963                                      const MCSubtargetInfo &STI,
964                                      raw_ostream &O) {
965   printExpSrcN<3>(MI, OpNo, STI, O);
966 }
967 
968 void AMDGPUInstPrinter::printExpTgt(const MCInst *MI, unsigned OpNo,
969                                     const MCSubtargetInfo &STI,
970                                     raw_ostream &O) {
971   // This is really a 6 bit field.
972   uint32_t Tgt = MI->getOperand(OpNo).getImm() & ((1 << 6) - 1);
973 
974   if (Tgt <= 7)
975     O << " mrt" << Tgt;
976   else if (Tgt == 8)
977     O << " mrtz";
978   else if (Tgt == 9)
979     O << " null";
980   else if ((Tgt >= 12 && Tgt <= 15) || (Tgt == 16 && AMDGPU::isGFX10(STI)))
981     O << " pos" << Tgt - 12;
982   else if (AMDGPU::isGFX10(STI) && Tgt == 20)
983     O << " prim";
984   else if (Tgt >= 32 && Tgt <= 63)
985     O << " param" << Tgt - 32;
986   else {
987     // Reserved values 10, 11
988     O << " invalid_target_" << Tgt;
989   }
990 }
991 
992 static bool allOpsDefaultValue(const int* Ops, int NumOps, int Mod,
993                                bool IsPacked, bool HasDstSel) {
994   int DefaultValue = IsPacked && (Mod == SISrcMods::OP_SEL_1);
995 
996   for (int I = 0; I < NumOps; ++I) {
997     if (!!(Ops[I] & Mod) != DefaultValue)
998       return false;
999   }
1000 
1001   if (HasDstSel && (Ops[0] & SISrcMods::DST_OP_SEL) != 0)
1002     return false;
1003 
1004   return true;
1005 }
1006 
1007 void AMDGPUInstPrinter::printPackedModifier(const MCInst *MI,
1008                                             StringRef Name,
1009                                             unsigned Mod,
1010                                             raw_ostream &O) {
1011   unsigned Opc = MI->getOpcode();
1012   int NumOps = 0;
1013   int Ops[3];
1014 
1015   for (int OpName : { AMDGPU::OpName::src0_modifiers,
1016                       AMDGPU::OpName::src1_modifiers,
1017                       AMDGPU::OpName::src2_modifiers }) {
1018     int Idx = AMDGPU::getNamedOperandIdx(Opc, OpName);
1019     if (Idx == -1)
1020       break;
1021 
1022     Ops[NumOps++] = MI->getOperand(Idx).getImm();
1023   }
1024 
1025   const bool HasDstSel =
1026     NumOps > 0 &&
1027     Mod == SISrcMods::OP_SEL_0 &&
1028     MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::VOP3_OPSEL;
1029 
1030   const bool IsPacked =
1031     MII.get(MI->getOpcode()).TSFlags & SIInstrFlags::IsPacked;
1032 
1033   if (allOpsDefaultValue(Ops, NumOps, Mod, IsPacked, HasDstSel))
1034     return;
1035 
1036   O << Name;
1037   for (int I = 0; I < NumOps; ++I) {
1038     if (I != 0)
1039       O << ',';
1040 
1041     O << !!(Ops[I] & Mod);
1042   }
1043 
1044   if (HasDstSel) {
1045     O << ',' << !!(Ops[0] & SISrcMods::DST_OP_SEL);
1046   }
1047 
1048   O << ']';
1049 }
1050 
1051 void AMDGPUInstPrinter::printOpSel(const MCInst *MI, unsigned,
1052                                    const MCSubtargetInfo &STI,
1053                                    raw_ostream &O) {
1054   unsigned Opc = MI->getOpcode();
1055   if (Opc == AMDGPU::V_PERMLANE16_B32_gfx10 ||
1056       Opc == AMDGPU::V_PERMLANEX16_B32_gfx10) {
1057     auto FIN = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::src0_modifiers);
1058     auto BCN = AMDGPU::getNamedOperandIdx(Opc, AMDGPU::OpName::src1_modifiers);
1059     unsigned FI = !!(MI->getOperand(FIN).getImm() & SISrcMods::OP_SEL_0);
1060     unsigned BC = !!(MI->getOperand(BCN).getImm() & SISrcMods::OP_SEL_0);
1061     if (FI || BC)
1062       O << " op_sel:[" << FI << ',' << BC << ']';
1063     return;
1064   }
1065 
1066   printPackedModifier(MI, " op_sel:[", SISrcMods::OP_SEL_0, O);
1067 }
1068 
1069 void AMDGPUInstPrinter::printOpSelHi(const MCInst *MI, unsigned OpNo,
1070                                      const MCSubtargetInfo &STI,
1071                                      raw_ostream &O) {
1072   printPackedModifier(MI, " op_sel_hi:[", SISrcMods::OP_SEL_1, O);
1073 }
1074 
1075 void AMDGPUInstPrinter::printNegLo(const MCInst *MI, unsigned OpNo,
1076                                    const MCSubtargetInfo &STI,
1077                                    raw_ostream &O) {
1078   printPackedModifier(MI, " neg_lo:[", SISrcMods::NEG, O);
1079 }
1080 
1081 void AMDGPUInstPrinter::printNegHi(const MCInst *MI, unsigned OpNo,
1082                                    const MCSubtargetInfo &STI,
1083                                    raw_ostream &O) {
1084   printPackedModifier(MI, " neg_hi:[", SISrcMods::NEG_HI, O);
1085 }
1086 
1087 void AMDGPUInstPrinter::printInterpSlot(const MCInst *MI, unsigned OpNum,
1088                                         const MCSubtargetInfo &STI,
1089                                         raw_ostream &O) {
1090   unsigned Imm = MI->getOperand(OpNum).getImm();
1091   switch (Imm) {
1092   case 0:
1093     O << "p10";
1094     break;
1095   case 1:
1096     O << "p20";
1097     break;
1098   case 2:
1099     O << "p0";
1100     break;
1101   default:
1102     O << "invalid_param_" << Imm;
1103   }
1104 }
1105 
1106 void AMDGPUInstPrinter::printInterpAttr(const MCInst *MI, unsigned OpNum,
1107                                         const MCSubtargetInfo &STI,
1108                                         raw_ostream &O) {
1109   unsigned Attr = MI->getOperand(OpNum).getImm();
1110   O << "attr" << Attr;
1111 }
1112 
1113 void AMDGPUInstPrinter::printInterpAttrChan(const MCInst *MI, unsigned OpNum,
1114                                         const MCSubtargetInfo &STI,
1115                                         raw_ostream &O) {
1116   unsigned Chan = MI->getOperand(OpNum).getImm();
1117   O << '.' << "xyzw"[Chan & 0x3];
1118 }
1119 
1120 void AMDGPUInstPrinter::printVGPRIndexMode(const MCInst *MI, unsigned OpNo,
1121                                            const MCSubtargetInfo &STI,
1122                                            raw_ostream &O) {
1123   using namespace llvm::AMDGPU::VGPRIndexMode;
1124   unsigned Val = MI->getOperand(OpNo).getImm();
1125 
1126   if ((Val & ~ENABLE_MASK) != 0) {
1127     O << " " << formatHex(static_cast<uint64_t>(Val));
1128   } else {
1129     O << " gpr_idx(";
1130     bool NeedComma = false;
1131     for (unsigned ModeId = ID_MIN; ModeId <= ID_MAX; ++ModeId) {
1132       if (Val & (1 << ModeId)) {
1133         if (NeedComma)
1134           O << ',';
1135         O << IdSymbolic[ModeId];
1136         NeedComma = true;
1137       }
1138     }
1139     O << ')';
1140   }
1141 }
1142 
1143 void AMDGPUInstPrinter::printMemOperand(const MCInst *MI, unsigned OpNo,
1144                                         const MCSubtargetInfo &STI,
1145                                         raw_ostream &O) {
1146   printOperand(MI, OpNo, STI, O);
1147   O  << ", ";
1148   printOperand(MI, OpNo + 1, STI, O);
1149 }
1150 
1151 void AMDGPUInstPrinter::printIfSet(const MCInst *MI, unsigned OpNo,
1152                                    raw_ostream &O, StringRef Asm,
1153                                    StringRef Default) {
1154   const MCOperand &Op = MI->getOperand(OpNo);
1155   assert(Op.isImm());
1156   if (Op.getImm() == 1) {
1157     O << Asm;
1158   } else {
1159     O << Default;
1160   }
1161 }
1162 
1163 void AMDGPUInstPrinter::printIfSet(const MCInst *MI, unsigned OpNo,
1164                                    raw_ostream &O, char Asm) {
1165   const MCOperand &Op = MI->getOperand(OpNo);
1166   assert(Op.isImm());
1167   if (Op.getImm() == 1)
1168     O << Asm;
1169 }
1170 
1171 void AMDGPUInstPrinter::printHigh(const MCInst *MI, unsigned OpNo,
1172                                   const MCSubtargetInfo &STI,
1173                                   raw_ostream &O) {
1174   if (MI->getOperand(OpNo).getImm())
1175     O << " high";
1176 }
1177 
1178 void AMDGPUInstPrinter::printClampSI(const MCInst *MI, unsigned OpNo,
1179                                      const MCSubtargetInfo &STI,
1180                                      raw_ostream &O) {
1181   if (MI->getOperand(OpNo).getImm())
1182     O << " clamp";
1183 }
1184 
1185 void AMDGPUInstPrinter::printOModSI(const MCInst *MI, unsigned OpNo,
1186                                     const MCSubtargetInfo &STI,
1187                                     raw_ostream &O) {
1188   int Imm = MI->getOperand(OpNo).getImm();
1189   if (Imm == SIOutMods::MUL2)
1190     O << " mul:2";
1191   else if (Imm == SIOutMods::MUL4)
1192     O << " mul:4";
1193   else if (Imm == SIOutMods::DIV2)
1194     O << " div:2";
1195 }
1196 
1197 void AMDGPUInstPrinter::printSendMsg(const MCInst *MI, unsigned OpNo,
1198                                      const MCSubtargetInfo &STI,
1199                                      raw_ostream &O) {
1200   using namespace llvm::AMDGPU::SendMsg;
1201 
1202   const unsigned Imm16 = MI->getOperand(OpNo).getImm();
1203 
1204   uint16_t MsgId;
1205   uint16_t OpId;
1206   uint16_t StreamId;
1207   decodeMsg(Imm16, MsgId, OpId, StreamId);
1208 
1209   if (isValidMsgId(MsgId, STI) &&
1210       isValidMsgOp(MsgId, OpId) &&
1211       isValidMsgStream(MsgId, OpId, StreamId)) {
1212     O << "sendmsg(" << getMsgName(MsgId);
1213     if (msgRequiresOp(MsgId)) {
1214       O << ", " << getMsgOpName(MsgId, OpId);
1215       if (msgSupportsStream(MsgId, OpId)) {
1216         O << ", " << StreamId;
1217       }
1218     }
1219     O << ')';
1220   } else if (encodeMsg(MsgId, OpId, StreamId) == Imm16) {
1221     O << "sendmsg(" << MsgId << ", " << OpId << ", " << StreamId << ')';
1222   } else {
1223     O << Imm16; // Unknown imm16 code.
1224   }
1225 }
1226 
1227 static void printSwizzleBitmask(const uint16_t AndMask,
1228                                 const uint16_t OrMask,
1229                                 const uint16_t XorMask,
1230                                 raw_ostream &O) {
1231   using namespace llvm::AMDGPU::Swizzle;
1232 
1233   uint16_t Probe0 = ((0            & AndMask) | OrMask) ^ XorMask;
1234   uint16_t Probe1 = ((BITMASK_MASK & AndMask) | OrMask) ^ XorMask;
1235 
1236   O << "\"";
1237 
1238   for (unsigned Mask = 1 << (BITMASK_WIDTH - 1); Mask > 0; Mask >>= 1) {
1239     uint16_t p0 = Probe0 & Mask;
1240     uint16_t p1 = Probe1 & Mask;
1241 
1242     if (p0 == p1) {
1243       if (p0 == 0) {
1244         O << "0";
1245       } else {
1246         O << "1";
1247       }
1248     } else {
1249       if (p0 == 0) {
1250         O << "p";
1251       } else {
1252         O << "i";
1253       }
1254     }
1255   }
1256 
1257   O << "\"";
1258 }
1259 
1260 void AMDGPUInstPrinter::printSwizzle(const MCInst *MI, unsigned OpNo,
1261                                      const MCSubtargetInfo &STI,
1262                                      raw_ostream &O) {
1263   using namespace llvm::AMDGPU::Swizzle;
1264 
1265   uint16_t Imm = MI->getOperand(OpNo).getImm();
1266   if (Imm == 0) {
1267     return;
1268   }
1269 
1270   O << " offset:";
1271 
1272   if ((Imm & QUAD_PERM_ENC_MASK) == QUAD_PERM_ENC) {
1273 
1274     O << "swizzle(" << IdSymbolic[ID_QUAD_PERM];
1275     for (unsigned I = 0; I < LANE_NUM; ++I) {
1276       O << ",";
1277       O << formatDec(Imm & LANE_MASK);
1278       Imm >>= LANE_SHIFT;
1279     }
1280     O << ")";
1281 
1282   } else if ((Imm & BITMASK_PERM_ENC_MASK) == BITMASK_PERM_ENC) {
1283 
1284     uint16_t AndMask = (Imm >> BITMASK_AND_SHIFT) & BITMASK_MASK;
1285     uint16_t OrMask  = (Imm >> BITMASK_OR_SHIFT)  & BITMASK_MASK;
1286     uint16_t XorMask = (Imm >> BITMASK_XOR_SHIFT) & BITMASK_MASK;
1287 
1288     if (AndMask == BITMASK_MAX &&
1289         OrMask == 0 &&
1290         countPopulation(XorMask) == 1) {
1291 
1292       O << "swizzle(" << IdSymbolic[ID_SWAP];
1293       O << ",";
1294       O << formatDec(XorMask);
1295       O << ")";
1296 
1297     } else if (AndMask == BITMASK_MAX &&
1298                OrMask == 0 && XorMask > 0 &&
1299                isPowerOf2_64(XorMask + 1)) {
1300 
1301       O << "swizzle(" << IdSymbolic[ID_REVERSE];
1302       O << ",";
1303       O << formatDec(XorMask + 1);
1304       O << ")";
1305 
1306     } else {
1307 
1308       uint16_t GroupSize = BITMASK_MAX - AndMask + 1;
1309       if (GroupSize > 1 &&
1310           isPowerOf2_64(GroupSize) &&
1311           OrMask < GroupSize &&
1312           XorMask == 0) {
1313 
1314         O << "swizzle(" << IdSymbolic[ID_BROADCAST];
1315         O << ",";
1316         O << formatDec(GroupSize);
1317         O << ",";
1318         O << formatDec(OrMask);
1319         O << ")";
1320 
1321       } else {
1322         O << "swizzle(" << IdSymbolic[ID_BITMASK_PERM];
1323         O << ",";
1324         printSwizzleBitmask(AndMask, OrMask, XorMask, O);
1325         O << ")";
1326       }
1327     }
1328   } else {
1329     printU16ImmDecOperand(MI, OpNo, O);
1330   }
1331 }
1332 
1333 void AMDGPUInstPrinter::printWaitFlag(const MCInst *MI, unsigned OpNo,
1334                                       const MCSubtargetInfo &STI,
1335                                       raw_ostream &O) {
1336   AMDGPU::IsaVersion ISA = AMDGPU::getIsaVersion(STI.getCPU());
1337 
1338   unsigned SImm16 = MI->getOperand(OpNo).getImm();
1339   unsigned Vmcnt, Expcnt, Lgkmcnt;
1340   decodeWaitcnt(ISA, SImm16, Vmcnt, Expcnt, Lgkmcnt);
1341 
1342   bool NeedSpace = false;
1343 
1344   if (Vmcnt != getVmcntBitMask(ISA)) {
1345     O << "vmcnt(" << Vmcnt << ')';
1346     NeedSpace = true;
1347   }
1348 
1349   if (Expcnt != getExpcntBitMask(ISA)) {
1350     if (NeedSpace)
1351       O << ' ';
1352     O << "expcnt(" << Expcnt << ')';
1353     NeedSpace = true;
1354   }
1355 
1356   if (Lgkmcnt != getLgkmcntBitMask(ISA)) {
1357     if (NeedSpace)
1358       O << ' ';
1359     O << "lgkmcnt(" << Lgkmcnt << ')';
1360   }
1361 }
1362 
1363 void AMDGPUInstPrinter::printHwreg(const MCInst *MI, unsigned OpNo,
1364                                    const MCSubtargetInfo &STI, raw_ostream &O) {
1365   unsigned Id;
1366   unsigned Offset;
1367   unsigned Width;
1368 
1369   using namespace llvm::AMDGPU::Hwreg;
1370   unsigned Val = MI->getOperand(OpNo).getImm();
1371   decodeHwreg(Val, Id, Offset, Width);
1372   StringRef HwRegName = getHwreg(Id, STI);
1373 
1374   O << "hwreg(";
1375   if (!HwRegName.empty()) {
1376     O << HwRegName;
1377   } else {
1378     O << Id;
1379   }
1380   if (Width != WIDTH_DEFAULT_ || Offset != OFFSET_DEFAULT_) {
1381     O << ", " << Offset << ", " << Width;
1382   }
1383   O << ')';
1384 }
1385 
1386 void AMDGPUInstPrinter::printEndpgm(const MCInst *MI, unsigned OpNo,
1387                                     const MCSubtargetInfo &STI,
1388                                     raw_ostream &O) {
1389   uint16_t Imm = MI->getOperand(OpNo).getImm();
1390   if (Imm == 0) {
1391     return;
1392   }
1393 
1394   O << ' ' << formatDec(Imm);
1395 }
1396 
1397 #include "AMDGPUGenAsmWriter.inc"
1398 
1399 void R600InstPrinter::printInst(const MCInst *MI, uint64_t Address,
1400                                 StringRef Annot, const MCSubtargetInfo &STI,
1401                                 raw_ostream &O) {
1402   O.flush();
1403   printInstruction(MI, Address, O);
1404   printAnnotation(O, Annot);
1405 }
1406 
1407 void R600InstPrinter::printAbs(const MCInst *MI, unsigned OpNo,
1408                                raw_ostream &O) {
1409   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, '|');
1410 }
1411 
1412 void R600InstPrinter::printBankSwizzle(const MCInst *MI, unsigned OpNo,
1413                                        raw_ostream &O) {
1414   int BankSwizzle = MI->getOperand(OpNo).getImm();
1415   switch (BankSwizzle) {
1416   case 1:
1417     O << "BS:VEC_021/SCL_122";
1418     break;
1419   case 2:
1420     O << "BS:VEC_120/SCL_212";
1421     break;
1422   case 3:
1423     O << "BS:VEC_102/SCL_221";
1424     break;
1425   case 4:
1426     O << "BS:VEC_201";
1427     break;
1428   case 5:
1429     O << "BS:VEC_210";
1430     break;
1431   default:
1432     break;
1433   }
1434 }
1435 
1436 void R600InstPrinter::printClamp(const MCInst *MI, unsigned OpNo,
1437                                  raw_ostream &O) {
1438   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "_SAT");
1439 }
1440 
1441 void R600InstPrinter::printCT(const MCInst *MI, unsigned OpNo,
1442                                 raw_ostream &O) {
1443   unsigned CT = MI->getOperand(OpNo).getImm();
1444   switch (CT) {
1445   case 0:
1446     O << 'U';
1447     break;
1448   case 1:
1449     O << 'N';
1450     break;
1451   default:
1452     break;
1453   }
1454 }
1455 
1456 void R600InstPrinter::printKCache(const MCInst *MI, unsigned OpNo,
1457                                   raw_ostream &O) {
1458   int KCacheMode = MI->getOperand(OpNo).getImm();
1459   if (KCacheMode > 0) {
1460     int KCacheBank = MI->getOperand(OpNo - 2).getImm();
1461     O << "CB" << KCacheBank << ':';
1462     int KCacheAddr = MI->getOperand(OpNo + 2).getImm();
1463     int LineSize = (KCacheMode == 1) ? 16 : 32;
1464     O << KCacheAddr * 16 << '-' << KCacheAddr * 16 + LineSize;
1465   }
1466 }
1467 
1468 void R600InstPrinter::printLast(const MCInst *MI, unsigned OpNo,
1469                                 raw_ostream &O) {
1470   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "*", " ");
1471 }
1472 
1473 void R600InstPrinter::printLiteral(const MCInst *MI, unsigned OpNo,
1474                                    raw_ostream &O) {
1475   const MCOperand &Op = MI->getOperand(OpNo);
1476   assert(Op.isImm() || Op.isExpr());
1477   if (Op.isImm()) {
1478     int64_t Imm = Op.getImm();
1479     O << Imm << '(' << BitsToFloat(Imm) << ')';
1480   }
1481   if (Op.isExpr()) {
1482     Op.getExpr()->print(O << '@', &MAI);
1483   }
1484 }
1485 
1486 void R600InstPrinter::printNeg(const MCInst *MI, unsigned OpNo,
1487                                raw_ostream &O) {
1488   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, '-');
1489 }
1490 
1491 void R600InstPrinter::printOMOD(const MCInst *MI, unsigned OpNo,
1492                                 raw_ostream &O) {
1493   switch (MI->getOperand(OpNo).getImm()) {
1494   default: break;
1495   case 1:
1496     O << " * 2.0";
1497     break;
1498   case 2:
1499     O << " * 4.0";
1500     break;
1501   case 3:
1502     O << " / 2.0";
1503     break;
1504   }
1505 }
1506 
1507 void R600InstPrinter::printMemOperand(const MCInst *MI, unsigned OpNo,
1508                                       raw_ostream &O) {
1509   printOperand(MI, OpNo, O);
1510   O  << ", ";
1511   printOperand(MI, OpNo + 1, O);
1512 }
1513 
1514 void R600InstPrinter::printOperand(const MCInst *MI, unsigned OpNo,
1515                                    raw_ostream &O) {
1516   if (OpNo >= MI->getNumOperands()) {
1517     O << "/*Missing OP" << OpNo << "*/";
1518     return;
1519   }
1520 
1521   const MCOperand &Op = MI->getOperand(OpNo);
1522   if (Op.isReg()) {
1523     switch (Op.getReg()) {
1524     // This is the default predicate state, so we don't need to print it.
1525     case R600::PRED_SEL_OFF:
1526       break;
1527 
1528     default:
1529       O << getRegisterName(Op.getReg());
1530       break;
1531     }
1532   } else if (Op.isImm()) {
1533       O << Op.getImm();
1534   } else if (Op.isFPImm()) {
1535     // We special case 0.0 because otherwise it will be printed as an integer.
1536     if (Op.getFPImm() == 0.0)
1537       O << "0.0";
1538     else {
1539       O << Op.getFPImm();
1540     }
1541   } else if (Op.isExpr()) {
1542     const MCExpr *Exp = Op.getExpr();
1543     Exp->print(O, &MAI);
1544   } else {
1545     O << "/*INV_OP*/";
1546   }
1547 }
1548 
1549 void R600InstPrinter::printRel(const MCInst *MI, unsigned OpNo,
1550                                raw_ostream &O) {
1551   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, '+');
1552 }
1553 
1554 void R600InstPrinter::printRSel(const MCInst *MI, unsigned OpNo,
1555                                   raw_ostream &O) {
1556   unsigned Sel = MI->getOperand(OpNo).getImm();
1557   switch (Sel) {
1558   case 0:
1559     O << 'X';
1560     break;
1561   case 1:
1562     O << 'Y';
1563     break;
1564   case 2:
1565     O << 'Z';
1566     break;
1567   case 3:
1568     O << 'W';
1569     break;
1570   case 4:
1571     O << '0';
1572     break;
1573   case 5:
1574     O << '1';
1575     break;
1576   case 7:
1577     O << '_';
1578     break;
1579   default:
1580     break;
1581   }
1582 }
1583 
1584 void R600InstPrinter::printUpdateExecMask(const MCInst *MI, unsigned OpNo,
1585                                           raw_ostream &O) {
1586   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "ExecMask,");
1587 }
1588 
1589 void R600InstPrinter::printUpdatePred(const MCInst *MI, unsigned OpNo,
1590                                       raw_ostream &O) {
1591   AMDGPUInstPrinter::printIfSet(MI, OpNo, O, "Pred,");
1592 }
1593 
1594 void R600InstPrinter::printWrite(const MCInst *MI, unsigned OpNo,
1595                                  raw_ostream &O) {
1596   const MCOperand &Op = MI->getOperand(OpNo);
1597   if (Op.getImm() == 0) {
1598     O << " (MASKED)";
1599   }
1600 }
1601 
1602 #include "R600GenAsmWriter.inc"
1603