Вы не можете выбрать более 25 тем Темы должны начинаться с буквы или цифры, могут содержать дефисы(-) и должны содержать не более 35 символов.

PowerPC-Matrix_002dMultiply-Assist-Built_002din-Functions.html 9.8KB

3 лет назад
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179
  1. <!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
  2. <html>
  3. <!-- Copyright (C) 1988-2020 Free Software Foundation, Inc.
  4. Permission is granted to copy, distribute and/or modify this document
  5. under the terms of the GNU Free Documentation License, Version 1.3 or
  6. any later version published by the Free Software Foundation; with the
  7. Invariant Sections being "Funding Free Software", the Front-Cover
  8. Texts being (a) (see below), and with the Back-Cover Texts being (b)
  9. (see below). A copy of the license is included in the section entitled
  10. "GNU Free Documentation License".
  11. (a) The FSF's Front-Cover Text is:
  12. A GNU Manual
  13. (b) The FSF's Back-Cover Text is:
  14. You have freedom to copy and modify this GNU Manual, like GNU
  15. software. Copies published by the Free Software Foundation raise
  16. funds for GNU development. -->
  17. <!-- Created by GNU Texinfo 6.5, http://www.gnu.org/software/texinfo/ -->
  18. <head>
  19. <meta http-equiv="Content-Type" content="text/html; charset=utf-8">
  20. <title>PowerPC Matrix-Multiply Assist Built-in Functions (Using the GNU Compiler Collection (GCC))</title>
  21. <meta name="description" content="PowerPC Matrix-Multiply Assist Built-in Functions (Using the GNU Compiler Collection (GCC))">
  22. <meta name="keywords" content="PowerPC Matrix-Multiply Assist Built-in Functions (Using the GNU Compiler Collection (GCC))">
  23. <meta name="resource-type" content="document">
  24. <meta name="distribution" content="global">
  25. <meta name="Generator" content="makeinfo">
  26. <link href="index.html#Top" rel="start" title="Top">
  27. <link href="Option-Index.html#Option-Index" rel="index" title="Option Index">
  28. <link href="index.html#SEC_Contents" rel="contents" title="Table of Contents">
  29. <link href="Target-Builtins.html#Target-Builtins" rel="up" title="Target Builtins">
  30. <link href="RX-Built_002din-Functions.html#RX-Built_002din-Functions" rel="next" title="RX Built-in Functions">
  31. <link href="PowerPC-Atomic-Memory-Operation-Functions.html#PowerPC-Atomic-Memory-Operation-Functions" rel="prev" title="PowerPC Atomic Memory Operation Functions">
  32. <style type="text/css">
  33. <!--
  34. a.summary-letter {text-decoration: none}
  35. blockquote.indentedblock {margin-right: 0em}
  36. blockquote.smallindentedblock {margin-right: 0em; font-size: smaller}
  37. blockquote.smallquotation {font-size: smaller}
  38. div.display {margin-left: 3.2em}
  39. div.example {margin-left: 3.2em}
  40. div.lisp {margin-left: 3.2em}
  41. div.smalldisplay {margin-left: 3.2em}
  42. div.smallexample {margin-left: 3.2em}
  43. div.smalllisp {margin-left: 3.2em}
  44. kbd {font-style: oblique}
  45. pre.display {font-family: inherit}
  46. pre.format {font-family: inherit}
  47. pre.menu-comment {font-family: serif}
  48. pre.menu-preformatted {font-family: serif}
  49. pre.smalldisplay {font-family: inherit; font-size: smaller}
  50. pre.smallexample {font-size: smaller}
  51. pre.smallformat {font-family: inherit; font-size: smaller}
  52. pre.smalllisp {font-size: smaller}
  53. span.nolinebreak {white-space: nowrap}
  54. span.roman {font-family: initial; font-weight: normal}
  55. span.sansserif {font-family: sans-serif; font-weight: normal}
  56. ul.no-bullet {list-style: none}
  57. -->
  58. </style>
  59. </head>
  60. <body lang="en">
  61. <a name="PowerPC-Matrix_002dMultiply-Assist-Built_002din-Functions"></a>
  62. <div class="header">
  63. <p>
  64. Next: <a href="RX-Built_002din-Functions.html#RX-Built_002din-Functions" accesskey="n" rel="next">RX Built-in Functions</a>, Previous: <a href="PowerPC-Atomic-Memory-Operation-Functions.html#PowerPC-Atomic-Memory-Operation-Functions" accesskey="p" rel="prev">PowerPC Atomic Memory Operation Functions</a>, Up: <a href="Target-Builtins.html#Target-Builtins" accesskey="u" rel="up">Target Builtins</a> &nbsp; [<a href="index.html#SEC_Contents" title="Table of contents" rel="contents">Contents</a>][<a href="Option-Index.html#Option-Index" title="Index" rel="index">Index</a>]</p>
  65. </div>
  66. <hr>
  67. <a name="PowerPC-Matrix_002dMultiply-Assist-Built_002din-Functions-1"></a>
  68. <h4 class="subsection">6.60.26 PowerPC Matrix-Multiply Assist Built-in Functions</h4>
  69. <p>ISA 3.1 of the PowerPC added new Matrix-Multiply Assist (MMA) instructions.
  70. GCC provides support for these instructions through the following built-in
  71. functions, which are enabled with the <code>-mmma</code> option.  The <code>vec_t</code> type
  72. below is defined to be a normal vector unsigned char type.  The <code>uint2</code>, <code>uint4</code>
  73. and <code>uint8</code> parameters are 2-bit, 4-bit and 8-bit unsigned integer constants,
  74. respectively.  The compiler will verify that they are constants and that
  75. their values are within range.
  76. </p>
  77. <p>The built-in functions supported are:
  78. </p>
  79. <div class="smallexample">
  80. <pre class="smallexample">void __builtin_mma_xvi4ger8 (__vector_quad *, vec_t, vec_t);
  81. void __builtin_mma_xvi8ger4 (__vector_quad *, vec_t, vec_t);
  82. void __builtin_mma_xvi16ger2 (__vector_quad *, vec_t, vec_t);
  83. void __builtin_mma_xvi16ger2s (__vector_quad *, vec_t, vec_t);
  84. void __builtin_mma_xvf16ger2 (__vector_quad *, vec_t, vec_t);
  85. void __builtin_mma_xvbf16ger2 (__vector_quad *, vec_t, vec_t);
  86. void __builtin_mma_xvf32ger (__vector_quad *, vec_t, vec_t);
  87. void __builtin_mma_xvi4ger8pp (__vector_quad *, vec_t, vec_t);
  88. void __builtin_mma_xvi8ger4pp (__vector_quad *, vec_t, vec_t);
  89. void __builtin_mma_xvi8ger4spp (__vector_quad *, vec_t, vec_t);
  90. void __builtin_mma_xvi16ger2pp (__vector_quad *, vec_t, vec_t);
  91. void __builtin_mma_xvi16ger2spp (__vector_quad *, vec_t, vec_t);
  92. void __builtin_mma_xvf16ger2pp (__vector_quad *, vec_t, vec_t);
  93. void __builtin_mma_xvf16ger2pn (__vector_quad *, vec_t, vec_t);
  94. void __builtin_mma_xvf16ger2np (__vector_quad *, vec_t, vec_t);
  95. void __builtin_mma_xvf16ger2nn (__vector_quad *, vec_t, vec_t);
  96. void __builtin_mma_xvbf16ger2pp (__vector_quad *, vec_t, vec_t);
  97. void __builtin_mma_xvbf16ger2pn (__vector_quad *, vec_t, vec_t);
  98. void __builtin_mma_xvbf16ger2np (__vector_quad *, vec_t, vec_t);
  99. void __builtin_mma_xvbf16ger2nn (__vector_quad *, vec_t, vec_t);
  100. void __builtin_mma_xvf32gerpp (__vector_quad *, vec_t, vec_t);
  101. void __builtin_mma_xvf32gerpn (__vector_quad *, vec_t, vec_t);
  102. void __builtin_mma_xvf32gernp (__vector_quad *, vec_t, vec_t);
  103. void __builtin_mma_xvf32gernn (__vector_quad *, vec_t, vec_t);
  104. void __builtin_mma_pmxvi4ger8 (__vector_quad *, vec_t, vec_t, uint4, uint4, uint8);
  105. void __builtin_mma_pmxvi4ger8pp (__vector_quad *, vec_t, vec_t, uint4, uint4, uint8);
  106. void __builtin_mma_pmxvi8ger4 (__vector_quad *, vec_t, vec_t, uint4, uint4, uint4);
  107. void __builtin_mma_pmxvi8ger4pp (__vector_quad *, vec_t, vec_t, uint4, uint4, uint4);
  108. void __builtin_mma_pmxvi8ger4spp (__vector_quad *, vec_t, vec_t, uint4, uint4, uint4);
  109. void __builtin_mma_pmxvi16ger2 (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  110. void __builtin_mma_pmxvi16ger2s (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  111. void __builtin_mma_pmxvf16ger2 (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  112. void __builtin_mma_pmxvbf16ger2 (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  113. void __builtin_mma_pmxvi16ger2pp (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  114. void __builtin_mma_pmxvi16ger2spp (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  115. void __builtin_mma_pmxvf16ger2pp (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  116. void __builtin_mma_pmxvf16ger2pn (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  117. void __builtin_mma_pmxvf16ger2np (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  118. void __builtin_mma_pmxvf16ger2nn (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  119. void __builtin_mma_pmxvbf16ger2pp (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  120. void __builtin_mma_pmxvbf16ger2pn (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  121. void __builtin_mma_pmxvbf16ger2np (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  122. void __builtin_mma_pmxvbf16ger2nn (__vector_quad *, vec_t, vec_t, uint4, uint4, uint2);
  123. void __builtin_mma_pmxvf32ger (__vector_quad *, vec_t, vec_t, uint4, uint4);
  124. void __builtin_mma_pmxvf32gerpp (__vector_quad *, vec_t, vec_t, uint4, uint4);
  125. void __builtin_mma_pmxvf32gerpn (__vector_quad *, vec_t, vec_t, uint4, uint4);
  126. void __builtin_mma_pmxvf32gernp (__vector_quad *, vec_t, vec_t, uint4, uint4);
  127. void __builtin_mma_pmxvf32gernn (__vector_quad *, vec_t, vec_t, uint4, uint4);
  128. void __builtin_mma_xvf64ger (__vector_quad *, __vector_pair, vec_t);
  129. void __builtin_mma_xvf64gerpp (__vector_quad *, __vector_pair, vec_t);
  130. void __builtin_mma_xvf64gerpn (__vector_quad *, __vector_pair, vec_t);
  131. void __builtin_mma_xvf64gernp (__vector_quad *, __vector_pair, vec_t);
  132. void __builtin_mma_xvf64gernn (__vector_quad *, __vector_pair, vec_t);
  133. void __builtin_mma_pmxvf64ger (__vector_quad *, __vector_pair, vec_t, uint4, uint2);
  134. void __builtin_mma_pmxvf64gerpp (__vector_quad *, __vector_pair, vec_t, uint4, uint2);
  135. void __builtin_mma_pmxvf64gerpn (__vector_quad *, __vector_pair, vec_t, uint4, uint2);
  136. void __builtin_mma_pmxvf64gernp (__vector_quad *, __vector_pair, vec_t, uint4, uint2);
  137. void __builtin_mma_pmxvf64gernn (__vector_quad *, __vector_pair, vec_t, uint4, uint2);
  138. void __builtin_mma_xxmtacc (__vector_quad *);
  139. void __builtin_mma_xxmfacc (__vector_quad *);
  140. void __builtin_mma_xxsetaccz (__vector_quad *);
  141. void __builtin_mma_assemble_acc (__vector_quad *, vec_t, vec_t, vec_t, vec_t);
  142. void __builtin_mma_disassemble_acc (void *, __vector_quad *);
  143. void __builtin_mma_assemble_pair (__vector_pair *, vec_t, vec_t);
  144. void __builtin_mma_disassemble_pair (void *, __vector_pair *);
  145. vec_t __builtin_vsx_xvcvspbf16 (vec_t);
  146. vec_t __builtin_vsx_xvcvbf16spn (vec_t);
  147. </pre></div>
  148. <hr>
  149. <div class="header">
  150. <p>
  151. Next: <a href="RX-Built_002din-Functions.html#RX-Built_002din-Functions" accesskey="n" rel="next">RX Built-in Functions</a>, Previous: <a href="PowerPC-Atomic-Memory-Operation-Functions.html#PowerPC-Atomic-Memory-Operation-Functions" accesskey="p" rel="prev">PowerPC Atomic Memory Operation Functions</a>, Up: <a href="Target-Builtins.html#Target-Builtins" accesskey="u" rel="up">Target Builtins</a> &nbsp; [<a href="index.html#SEC_Contents" title="Table of contents" rel="contents">Contents</a>][<a href="Option-Index.html#Option-Index" title="Index" rel="index">Index</a>]</p>
  152. </div>
  153. </body>
  154. </html>