tree: 5c0eb20e1dfc2cb4ed5b47100269b68d43b63298 [path history] [tgz]
  1. a32_sgemm_8x6/
  2. a64_ffhybrid_bf16fp32_mmla_6x16/
  3. a64_ffhybrid_fp16_mla_6x32/
  4. a64_ffhybrid_fp32_mla_6x16/
  5. a64_ffhybrid_fp32bf16fp32_mmla_4x24/
  6. a64_ffinterleaved_bf16fp32_dot_8x12/
  7. a64_ffinterleaved_bf16fp32_mmla_8x12/
  8. a64_ffinterleaved_fp16_mla_8x24/
  9. a64_ffinterleaved_fp32_mla_8x12/
  10. a64_gemm_s16_8x12/
  11. a64_gemm_s8_4x4/
  12. a64_gemm_s8_8x12/
  13. a64_gemm_u16_8x12/
  14. a64_gemm_u8_4x4/
  15. a64_gemm_u8_8x12/
  16. a64_hgemm_8x24/
  17. a64_hybrid_bf16fp32_dot_6x16/
  18. a64_hybrid_bf16fp32_mmla_6x16/
  19. a64_hybrid_fp16_mla_6x32/
  20. a64_hybrid_fp32_mla_4x24/
  21. a64_hybrid_fp32_mla_6x16/
  22. a64_hybrid_fp32_mla_8x4/
  23. a64_hybrid_fp32bf16fp32_mmla_4x24/
  24. a64_hybrid_fp32bf16fp32_mmla_6x16/
  25. a64_hybrid_s8qa_dot_4x16/
  26. a64_hybrid_s8qa_mmla_4x16/
  27. a64_hybrid_s8qs_dot_6x16/
  28. a64_hybrid_s8qs_mmla_6x16/
  29. a64_hybrid_s8s32_dot_6x16/
  30. a64_hybrid_s8s32_mmla_6x16/
  31. a64_hybrid_u8qa_dot_4x16/
  32. a64_hybrid_u8qa_mmla_4x16/
  33. a64_hybrid_u8u32_dot_6x16/
  34. a64_hybrid_u8u32_mmla_6x16/
  35. a64_interleaved_bf16fp32_dot_8x12/
  36. a64_interleaved_bf16fp32_mmla_8x12/
  37. a64_interleaved_s8s32_mmla_8x12/
  38. a64_interleaved_u8u32_mmla_8x12/
  39. a64_sgemm_8x12/
  40. a64_sgemm_8x6/
  41. a64_sgemv_pretransposed/
  42. a64_smallK_hybrid_fp32_mla_6x4/
  43. a64_smallK_hybrid_fp32_mla_8x4/
  44. a64_smallK_hybrid_s8s32_dot_6x4/
  45. a64_smallK_hybrid_s8s32_dot_8x4/
  46. a64_smallK_hybrid_u8u32_dot_6x4/
  47. a64_smallK_hybrid_u8u32_dot_8x4/
  48. sme2_gemv_bf16fp32_dot_16VL/
  49. sme2_gemv_fp32_mla_16VL/
  50. sme2_gemv_fp32bf16fp32_dot_16VL/
  51. sme2_gemv_s8qa_dot_16VL/
  52. sme2_gemv_u8qa_dot_16VL/
  53. sme2_interleaved_nomerge_bf16fp32_mopa_1VLx4VL/
  54. sme2_interleaved_nomerge_bf16fp32_mopa_2VLx2VL/
  55. sme2_interleaved_nomerge_bf16fp32_mopa_4VLx1VL/
  56. sme2_interleaved_nomerge_fp32_mopa_1VLx4VL/
  57. sme2_interleaved_nomerge_fp32_mopa_2VLx2VL/
  58. sme2_interleaved_nomerge_fp32_mopa_4VLx1VL/
  59. sme2_interleaved_nomerge_s8q_mopa_1VLx4VL/
  60. sme2_interleaved_nomerge_s8q_mopa_2VLx2VL/
  61. sme2_interleaved_nomerge_s8q_mopa_4VLx1VL/
  62. sme2_interleaved_nomerge_s8s32_mopa_1VLx4VL/
  63. sme2_interleaved_nomerge_s8s32_mopa_2VLx2VL/
  64. sme2_interleaved_nomerge_s8s32_mopa_4VLx1VL/
  65. sme2_interleaved_nomerge_u8q_mopa_1VLx4VL/
  66. sme2_interleaved_nomerge_u8q_mopa_2VLx2VL/
  67. sme2_interleaved_nomerge_u8q_mopa_4VLx1VL/
  68. sve_ffhybrid_bf16fp32_mmla_6x4VL/
  69. sve_ffhybrid_fp16_mla_6x4VL/
  70. sve_ffhybrid_fp32_mla_6x4VL/
  71. sve_ffhybrid_fp32bf16fp32_mmla_4x6VL/
  72. sve_ffinterleaved_bf16fp32_mmla_8x3VL/
  73. sve_ffinterleaved_fp16_mla_8x3VL/
  74. sve_ffinterleaved_fp32_mla_8x3VL/
  75. sve_hybrid_bf16fp32_dot_6x4VL/
  76. sve_hybrid_bf16fp32_mmla_6x4VL/
  77. sve_hybrid_fp16_mla_6x4VL/
  78. sve_hybrid_fp32_mla_6x4VL/
  79. sve_hybrid_fp32_mla_8x1VL/
  80. sve_hybrid_fp32bf16fp32_mmla_4x6VL/
  81. sve_hybrid_fp32bf16fp32_mmla_6x4VL/
  82. sve_hybrid_s8qa_dot_4x4VL/
  83. sve_hybrid_s8qa_mmla_4x4VL/
  84. sve_hybrid_s8qs_dot_6x4VL/
  85. sve_hybrid_s8qs_mmla_6x4VL/
  86. sve_hybrid_s8s32_dot_6x4VL/
  87. sve_hybrid_s8s32_mmla_6x4VL/
  88. sve_hybrid_u8qa_dot_4x4VL/
  89. sve_hybrid_u8qa_mmla_4x4VL/
  90. sve_hybrid_u8u32_dot_6x4VL/
  91. sve_hybrid_u8u32_mmla_6x4VL/
  92. sve_interleaved_bf16fp32_dot_8x3VL/
  93. sve_interleaved_bf16fp32_mmla_8x3VL/
  94. sve_interleaved_fp16_mla_8x3VL/
  95. sve_interleaved_fp32_mla_8x3VL/
  96. sve_interleaved_fp32_mmla_8x3VL/
  97. sve_interleaved_s8s32_dot_8x3VL/
  98. sve_interleaved_s8s32_mmla_8x3VL/
  99. sve_interleaved_u8u32_dot_8x3VL/
  100. sve_interleaved_u8u32_mmla_8x3VL/
  101. sve_smallK_hybrid_fp32_mla_8x1VL/
  102. sve_smallK_hybrid_s8s32_dot_8x1VL/
  103. sve_smallK_hybrid_u8u32_dot_8x1VL/
  104. a32_sgemm_8x6.hpp
  105. a64_ffhybrid_bf16fp32_mmla_6x16.hpp
  106. a64_ffhybrid_fp16_mla_6x32.hpp
  107. a64_ffhybrid_fp32_mla_6x16.hpp
  108. a64_ffhybrid_fp32bf16fp32_mmla_4x24.hpp
  109. a64_ffinterleaved_bf16fp32_dot_8x12.hpp
  110. a64_ffinterleaved_bf16fp32_mmla_8x12.hpp
  111. a64_ffinterleaved_fp16_mla_8x24.hpp
  112. a64_ffinterleaved_fp32_mla_8x12.hpp
  113. a64_gemm_s16_8x12.hpp
  114. a64_gemm_s8_4x4.hpp
  115. a64_gemm_s8_8x12.hpp
  116. a64_gemm_u16_8x12.hpp
  117. a64_gemm_u8_4x4.hpp
  118. a64_gemm_u8_8x12.hpp
  119. a64_hgemm_8x24.hpp
  120. a64_hybrid_bf16fp32_dot_6x16.hpp
  121. a64_hybrid_bf16fp32_mmla_6x16.hpp
  122. a64_hybrid_fp16_mla_6x32.hpp
  123. a64_hybrid_fp32_mla_4x24.hpp
  124. a64_hybrid_fp32_mla_6x16.hpp
  125. a64_hybrid_fp32_mla_8x4.hpp
  126. a64_hybrid_fp32bf16fp32_mmla_4x24.hpp
  127. a64_hybrid_fp32bf16fp32_mmla_6x16.hpp
  128. a64_hybrid_s8qa_dot_4x16.hpp
  129. a64_hybrid_s8qa_mmla_4x16.hpp
  130. a64_hybrid_s8qs_dot_6x16.hpp
  131. a64_hybrid_s8qs_mmla_6x16.hpp
  132. a64_hybrid_s8s32_dot_6x16.hpp
  133. a64_hybrid_s8s32_mmla_6x16.hpp
  134. a64_hybrid_u8qa_dot_4x16.hpp
  135. a64_hybrid_u8qa_mmla_4x16.hpp
  136. a64_hybrid_u8u32_dot_6x16.hpp
  137. a64_hybrid_u8u32_mmla_6x16.hpp
  138. a64_interleaved_bf16fp32_dot_8x12.hpp
  139. a64_interleaved_bf16fp32_mmla_8x12.hpp
  140. a64_interleaved_s8s32_mmla_8x12.hpp
  141. a64_interleaved_u8u32_mmla_8x12.hpp
  142. a64_sgemm_8x12.hpp
  143. a64_sgemm_8x6.hpp
  144. a64_sgemv_pretransposed.hpp
  145. a64_smallK_hybrid_fp32_mla_6x4.hpp
  146. a64_smallK_hybrid_fp32_mla_8x4.hpp
  147. a64_smallK_hybrid_s8s32_dot_6x4.hpp
  148. a64_smallK_hybrid_s8s32_dot_8x4.hpp
  149. a64_smallK_hybrid_u8u32_dot_6x4.hpp
  150. a64_smallK_hybrid_u8u32_dot_8x4.hpp
  151. sme2_gemv_bf16fp32_dot_16VL.hpp
  152. sme2_gemv_fp32_mla_16VL.hpp
  153. sme2_gemv_fp32bf16fp32_dot_16VL.hpp
  154. sme2_gemv_s8qa_dot_16VL.hpp
  155. sme2_gemv_u8qa_dot_16VL.hpp
  156. sme2_interleaved_nomerge_bf16fp32_mopa_1VLx4VL.hpp
  157. sme2_interleaved_nomerge_bf16fp32_mopa_2VLx2VL.hpp
  158. sme2_interleaved_nomerge_bf16fp32_mopa_4VLx1VL.hpp
  159. sme2_interleaved_nomerge_fp32_mopa_1VLx4VL.hpp
  160. sme2_interleaved_nomerge_fp32_mopa_2VLx2VL.hpp
  161. sme2_interleaved_nomerge_fp32_mopa_4VLx1VL.hpp
  162. sme2_interleaved_nomerge_s8q_mopa_1VLx4VL.hpp
  163. sme2_interleaved_nomerge_s8q_mopa_2VLx2VL.hpp
  164. sme2_interleaved_nomerge_s8q_mopa_4VLx1VL.hpp
  165. sme2_interleaved_nomerge_s8s32_mopa_1VLx4VL.hpp
  166. sme2_interleaved_nomerge_s8s32_mopa_2VLx2VL.hpp
  167. sme2_interleaved_nomerge_s8s32_mopa_4VLx1VL.hpp
  168. sme2_interleaved_nomerge_u8q_mopa_1VLx4VL.hpp
  169. sme2_interleaved_nomerge_u8q_mopa_2VLx2VL.hpp
  170. sme2_interleaved_nomerge_u8q_mopa_4VLx1VL.hpp
  171. sve_ffhybrid_bf16fp32_mmla_6x4VL.hpp
  172. sve_ffhybrid_fp16_mla_6x4VL.hpp
  173. sve_ffhybrid_fp32_mla_6x4VL.hpp
  174. sve_ffhybrid_fp32bf16fp32_mmla_4x6VL.hpp
  175. sve_ffinterleaved_bf16fp32_mmla_8x3VL.hpp
  176. sve_ffinterleaved_fp16_mla_8x3VL.hpp
  177. sve_ffinterleaved_fp32_mla_8x3VL.hpp
  178. sve_hybrid_bf16fp32_dot_6x4VL.hpp
  179. sve_hybrid_bf16fp32_mmla_6x4VL.hpp
  180. sve_hybrid_fp16_mla_6x4VL.hpp
  181. sve_hybrid_fp32_mla_6x4VL.hpp
  182. sve_hybrid_fp32_mla_8x1VL.hpp
  183. sve_hybrid_fp32bf16fp32_mmla_4x6VL.hpp
  184. sve_hybrid_fp32bf16fp32_mmla_6x4VL.hpp
  185. sve_hybrid_s8qa_dot_4x4VL.hpp
  186. sve_hybrid_s8qa_mmla_4x4VL.hpp
  187. sve_hybrid_s8qs_dot_6x4VL.hpp
  188. sve_hybrid_s8qs_mmla_6x4VL.hpp
  189. sve_hybrid_s8s32_dot_6x4VL.hpp
  190. sve_hybrid_s8s32_mmla_6x4VL.hpp
  191. sve_hybrid_u8qa_dot_4x4VL.hpp
  192. sve_hybrid_u8qa_mmla_4x4VL.hpp
  193. sve_hybrid_u8u32_dot_6x4VL.hpp
  194. sve_hybrid_u8u32_mmla_6x4VL.hpp
  195. sve_interleaved_bf16fp32_dot_8x3VL.hpp
  196. sve_interleaved_bf16fp32_mmla_8x3VL.hpp
  197. sve_interleaved_fp16_mla_8x3VL.hpp
  198. sve_interleaved_fp32_mla_8x3VL.hpp
  199. sve_interleaved_fp32_mmla_8x3VL.hpp
  200. sve_interleaved_s8s32_dot_8x3VL.hpp
  201. sve_interleaved_s8s32_mmla_8x3VL.hpp
  202. sve_interleaved_u8u32_dot_8x3VL.hpp
  203. sve_interleaved_u8u32_mmla_8x3VL.hpp
  204. sve_smallK_hybrid_fp32_mla_8x1VL.hpp
  205. sve_smallK_hybrid_s8s32_dot_8x1VL.hpp
  206. sve_smallK_hybrid_u8u32_dot_8x1VL.hpp