| """ |
| Auto-generated by generate-wrappers.py script. Do not modify |
| """ |
| |
| OPERATOR_SRCS = [ |
| "XNNPACK/src/operators/argmax-pooling-nhwc.c", |
| "XNNPACK/src/operators/average-pooling-nhwc.c", |
| "XNNPACK/src/operators/binary-elementwise-nd.c", |
| "XNNPACK/src/operators/channel-shuffle-nc.c", |
| "XNNPACK/src/operators/constant-pad-nd.c", |
| "XNNPACK/src/operators/convolution-nchw.c", |
| "XNNPACK/src/operators/convolution-nhwc.c", |
| "XNNPACK/src/operators/deconvolution-nhwc.c", |
| "XNNPACK/src/operators/depth-to-space-nchw2nhwc.c", |
| "XNNPACK/src/operators/depth-to-space-nhwc.c", |
| "XNNPACK/src/operators/fully-connected-nc.c", |
| "XNNPACK/src/operators/global-average-pooling-ncw.c", |
| "XNNPACK/src/operators/global-average-pooling-nwc.c", |
| "XNNPACK/src/operators/lut-elementwise-nc.c", |
| "XNNPACK/src/operators/max-pooling-nhwc.c", |
| "XNNPACK/src/operators/prelu-nc.c", |
| "XNNPACK/src/operators/resize-bilinear-nchw.c", |
| "XNNPACK/src/operators/resize-bilinear-nhwc.c", |
| "XNNPACK/src/operators/softmax-nc.c", |
| "XNNPACK/src/operators/unary-elementwise-nc.c", |
| "XNNPACK/src/operators/unpooling-nhwc.c", |
| ] |
| |
| SUBGRAPH_SRCS = [ |
| "XNNPACK/src/subgraph/abs.c", |
| "XNNPACK/src/subgraph/add2.c", |
| "XNNPACK/src/subgraph/argmax-pooling-2d.c", |
| "XNNPACK/src/subgraph/average-pooling-2d.c", |
| "XNNPACK/src/subgraph/bankers-rounding.c", |
| "XNNPACK/src/subgraph/ceiling.c", |
| "XNNPACK/src/subgraph/clamp.c", |
| "XNNPACK/src/subgraph/convert.c", |
| "XNNPACK/src/subgraph/convolution-2d.c", |
| "XNNPACK/src/subgraph/deconvolution-2d.c", |
| "XNNPACK/src/subgraph/depth-to-space.c", |
| "XNNPACK/src/subgraph/depthwise-convolution-2d.c", |
| "XNNPACK/src/subgraph/divide.c", |
| "XNNPACK/src/subgraph/elu.c", |
| "XNNPACK/src/subgraph/floor.c", |
| "XNNPACK/src/subgraph/fully-connected.c", |
| "XNNPACK/src/subgraph/global-average-pooling-2d.c", |
| "XNNPACK/src/subgraph/hardswish.c", |
| "XNNPACK/src/subgraph/leaky-relu.c", |
| "XNNPACK/src/subgraph/max-pooling-2d.c", |
| "XNNPACK/src/subgraph/maximum2.c", |
| "XNNPACK/src/subgraph/minimum2.c", |
| "XNNPACK/src/subgraph/multiply2.c", |
| "XNNPACK/src/subgraph/negate.c", |
| "XNNPACK/src/subgraph/prelu.c", |
| "XNNPACK/src/subgraph/sigmoid.c", |
| "XNNPACK/src/subgraph/softmax.c", |
| "XNNPACK/src/subgraph/square-root.c", |
| "XNNPACK/src/subgraph/square.c", |
| "XNNPACK/src/subgraph/squared-difference.c", |
| "XNNPACK/src/subgraph/static-constant-pad.c", |
| "XNNPACK/src/subgraph/static-reshape.c", |
| "XNNPACK/src/subgraph/static-resize-bilinear-2d.c", |
| "XNNPACK/src/subgraph/subtract.c", |
| "XNNPACK/src/subgraph/unpooling-2d.c", |
| ] |
| |
| LOGGING_SRCS = [ |
| "XNNPACK/src/datatype-strings.c", |
| "XNNPACK/src/operator-strings.c", |
| "XNNPACK/src/subgraph-strings.c", |
| ] |
| |
| HOT_SRCS = [ |
| "XNNPACK/src/indirection.c", |
| "XNNPACK/src/operator-run.c", |
| "XNNPACK/src/packing.c", |
| ] |
| |
| TABLE_SRCS = [ |
| "XNNPACK/src/tables/exp2-k-over-64.c", |
| "XNNPACK/src/tables/exp2-k-over-2048.c", |
| "XNNPACK/src/tables/exp2minus-k-over-4.c", |
| "XNNPACK/src/tables/exp2minus-k-over-8.c", |
| "XNNPACK/src/tables/exp2minus-k-over-16.c", |
| "XNNPACK/src/tables/exp2minus-k-over-64.c", |
| "XNNPACK/src/tables/exp2minus-k-over-2048.c", |
| ] |
| |
| JIT_SRCS = [ |
| "XNNPACK/src/jit/aarch32-assembler.cc", |
| "XNNPACK/src/jit/aarch64-assembler.cc", |
| "XNNPACK/src/jit/assembler.cc", |
| "XNNPACK/src/jit/memory.c", |
| ] |
| |
| JIT_AARCH32_SRCS = [ |
| "XNNPACK/src/f32-gemm/4x8-aarch32-neon-cortex-a7.cc", |
| "XNNPACK/src/f32-gemm/4x8-aarch32-neon-cortex-a53.cc", |
| "XNNPACK/src/f32-gemm/4x8-aarch32-neon-cortex-a55.cc", |
| "XNNPACK/src/f32-gemm/4x8-aarch32-neon-cortex-a75.cc", |
| "XNNPACK/src/f32-gemm/4x8-aarch32-neon-ld64.cc", |
| "XNNPACK/src/f32-igemm/4x8-aarch32-neon-cortex-a7.cc", |
| "XNNPACK/src/f32-igemm/4x8-aarch32-neon-cortex-a53.cc", |
| "XNNPACK/src/f32-igemm/4x8-aarch32-neon-cortex-a55.cc", |
| "XNNPACK/src/f32-igemm/4x8-aarch32-neon-cortex-a75.cc", |
| "XNNPACK/src/f32-igemm/4x8-aarch32-neon-ld64.cc", |
| "XNNPACK/src/qc8-gemm/4x8-fp32-aarch32-neonv8-mlal-lane-ld64.cc", |
| "XNNPACK/src/qc8-gemm/4x8c4-fp32-aarch32-neondot-ld64.cc", |
| "XNNPACK/src/qc8-igemm/4x8-fp32-aarch32-neonv8-mlal-lane-ld64.cc", |
| "XNNPACK/src/qc8-igemm/4x8c4-fp32-aarch32-neondot-ld64.cc", |
| "XNNPACK/src/qs8-gemm/4x8-rndnu-aarch32-neon-mlal-lane-ld64.cc", |
| "XNNPACK/src/qs8-gemm/4x8c4-rndnu-aarch32-neondot-ld64.cc", |
| "XNNPACK/src/qs8-igemm/4x8-rndnu-aarch32-neon-mlal-lane-ld64.cc", |
| "XNNPACK/src/qs8-igemm/4x8c4-rndnu-aarch32-neondot-ld64.cc", |
| ] |
| |
| JIT_AARCH64_SRCS = [ |
| "XNNPACK/src/f32-gemm/1x8-aarch64-neonfma-cortex-a75.cc", |
| "XNNPACK/src/f32-gemm/6x8-aarch64-neonfma-cortex-a75.cc", |
| "XNNPACK/src/f32-igemm/1x8-aarch64-neonfma-cortex-a75.cc", |
| "XNNPACK/src/f32-igemm/6x8-aarch64-neonfma-cortex-a75.cc", |
| ] |
| |
| PROD_SCALAR_PORTABLE_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/params-init.c", |
| "XNNPACK/src/u8-lut32norm/scalar.c", |
| "XNNPACK/src/xx-copy/memcpy.c", |
| "XNNPACK/src/x8-lut/gen/lut-scalar-x4.c", |
| "XNNPACK/src/x32-depthtospace2d-chw2hwc/scalar.c", |
| ] |
| |
| PROD_SSE_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/f32-avgpool/9p8x-minmax-sse-c4.c", |
| "XNNPACK/src/f32-avgpool/9x-minmax-sse-c4.c", |
| "XNNPACK/src/f32-conv-hwc2chw/3x3s2p1c3x4-sse-2x2.c", |
| "XNNPACK/src/f32-dwconv/gen/up8x3-minmax-sse.c", |
| "XNNPACK/src/f32-dwconv/gen/up8x4-minmax-sse.c", |
| "XNNPACK/src/f32-dwconv/gen/up8x9-minmax-sse.c", |
| "XNNPACK/src/f32-dwconv/gen/up8x25-minmax-sse.c", |
| "XNNPACK/src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-2x4-acc2.c", |
| "XNNPACK/src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-sse-1x4-acc3.c", |
| "XNNPACK/src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-4x4.c", |
| "XNNPACK/src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-2x4.c", |
| "XNNPACK/src/f32-gavgpool-cw/sse-x4.c", |
| "XNNPACK/src/f32-gavgpool/7p7x-minmax-sse-c4.c", |
| "XNNPACK/src/f32-gavgpool/7x-minmax-sse-c4.c", |
| "XNNPACK/src/f32-gemm/gen/1x8-minmax-sse-load1.c", |
| "XNNPACK/src/f32-gemm/gen/4x2c4-minmax-sse.c", |
| "XNNPACK/src/f32-gemm/gen/4x8-minmax-sse-load1.c", |
| "XNNPACK/src/f32-ibilinear-chw/gen/sse-p8.c", |
| "XNNPACK/src/f32-ibilinear/gen/sse-c8.c", |
| "XNNPACK/src/f32-igemm/gen/1x8-minmax-sse-load1.c", |
| "XNNPACK/src/f32-igemm/gen/4x2c4-minmax-sse.c", |
| "XNNPACK/src/f32-igemm/gen/4x8-minmax-sse-load1.c", |
| "XNNPACK/src/f32-maxpool/9p8x-minmax-sse-c4.c", |
| "XNNPACK/src/f32-pavgpool/9p8x-minmax-sse-c4.c", |
| "XNNPACK/src/f32-pavgpool/9x-minmax-sse-c4.c", |
| "XNNPACK/src/f32-rmax/sse.c", |
| "XNNPACK/src/f32-spmm/gen/32x1-minmax-sse.c", |
| "XNNPACK/src/f32-vbinary/gen/vadd-minmax-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vaddc-minmax-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vdiv-minmax-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vdivc-minmax-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vmax-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vmaxc-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vmin-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vminc-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vmul-minmax-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vmulc-minmax-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vrdivc-minmax-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vrsubc-minmax-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vsqrdiff-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vsqrdiffc-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vsub-minmax-sse-x8.c", |
| "XNNPACK/src/f32-vbinary/gen/vsubc-minmax-sse-x8.c", |
| "XNNPACK/src/f32-vclamp/gen/vclamp-sse-x8.c", |
| "XNNPACK/src/f32-vhswish/gen/vhswish-sse-x8.c", |
| "XNNPACK/src/f32-vlrelu/gen/vlrelu-sse-x8.c", |
| "XNNPACK/src/f32-vmulcaddc/gen/c4-minmax-sse-2x.c", |
| "XNNPACK/src/f32-vsqrt/gen/sse-sqrt-x4.c", |
| "XNNPACK/src/f32-vunary/gen/vabs-sse-x8.c", |
| "XNNPACK/src/f32-vunary/gen/vneg-sse-x8.c", |
| "XNNPACK/src/f32-vunary/gen/vsqr-sse-x8.c", |
| "XNNPACK/src/x32-packx/x4-sse.c", |
| ] |
| |
| PROD_SSE2_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/f16-f32-vcvt/gen/vcvt-sse2-int16-x32.c", |
| "XNNPACK/src/f32-argmaxpool/4x-sse2-c4.c", |
| "XNNPACK/src/f32-argmaxpool/9p8x-sse2-c4.c", |
| "XNNPACK/src/f32-argmaxpool/9x-sse2-c4.c", |
| "XNNPACK/src/f32-f16-vcvt/gen/vcvt-sse2-x16.c", |
| "XNNPACK/src/f32-prelu/gen/sse2-2x8.c", |
| "XNNPACK/src/f32-qs8-vcvt/gen/vcvt-sse2-x32.c", |
| "XNNPACK/src/f32-qu8-vcvt/gen/vcvt-sse2-x32.c", |
| "XNNPACK/src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x20-acc2.c", |
| "XNNPACK/src/f32-velu/gen/velu-sse2-rr2-lut16-p3-x12.c", |
| "XNNPACK/src/f32-vlrelu/gen/vlrelu-sse2-x8.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndd-sse2-x8.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndne-sse2-x8.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndu-sse2-x8.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndz-sse2-x8.c", |
| "XNNPACK/src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-lut64-p2-div-x8.c", |
| "XNNPACK/src/qc8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16.c", |
| "XNNPACK/src/qc8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16.c", |
| "XNNPACK/src/qc8-gemm/gen/1x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qc8-gemm/gen/3x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qc8-igemm/gen/1x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qc8-igemm/gen/3x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qs8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16-add16.c", |
| "XNNPACK/src/qs8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16-add16.c", |
| "XNNPACK/src/qs8-f32-vcvt/gen/vcvt-sse2-x32.c", |
| "XNNPACK/src/qs8-gavgpool/gen/7p7x-minmax-fp32-sse2-c8.c", |
| "XNNPACK/src/qs8-gavgpool/gen/7x-minmax-fp32-sse2-c8.c", |
| "XNNPACK/src/qs8-gemm/gen/1x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qs8-gemm/gen/3x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qs8-igemm/gen/1x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qs8-igemm/gen/3x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qs8-vadd/gen/minmax-sse2-mul16-ld64-x8.c", |
| "XNNPACK/src/qs8-vaddc/gen/minmax-sse2-mul16-ld64-x8.c", |
| "XNNPACK/src/qs8-vmul/gen/minmax-fp32-sse2-mul16-ld64-x8.c", |
| "XNNPACK/src/qs8-vmulc/gen/minmax-fp32-sse2-mul16-ld64-x8.c", |
| "XNNPACK/src/qu8-avgpool/9p8x-minmax-sse2-c8.c", |
| "XNNPACK/src/qu8-avgpool/9x-minmax-sse2-c8.c", |
| "XNNPACK/src/qu8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16.c", |
| "XNNPACK/src/qu8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16.c", |
| "XNNPACK/src/qu8-f32-vcvt/gen/vcvt-sse2-x32.c", |
| "XNNPACK/src/qu8-gavgpool/gen/7p7x-minmax-fp32-sse2-c8.c", |
| "XNNPACK/src/qu8-gavgpool/gen/7x-minmax-fp32-sse2-c8.c", |
| "XNNPACK/src/qu8-gemm/gen/1x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qu8-gemm/gen/3x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qu8-igemm/gen/1x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qu8-igemm/gen/3x4c8-minmax-fp32-sse2-ld64.c", |
| "XNNPACK/src/qu8-vadd/gen/minmax-sse2-mul16-ld64-x8.c", |
| "XNNPACK/src/qu8-vaddc/gen/minmax-sse2-mul16-ld64-x8.c", |
| "XNNPACK/src/qu8-vmul/gen/minmax-fp32-sse2-mul16-ld64-x8.c", |
| "XNNPACK/src/qu8-vmulc/gen/minmax-fp32-sse2-mul16-ld64-x8.c", |
| "XNNPACK/src/s8-ibilinear/gen/sse2-c8.c", |
| "XNNPACK/src/s8-maxpool/9p8x-minmax-sse2-c16.c", |
| "XNNPACK/src/s8-vclamp/sse2-x64.c", |
| "XNNPACK/src/u8-ibilinear/gen/sse2-c8.c", |
| "XNNPACK/src/u8-maxpool/9p8x-minmax-sse2-c16.c", |
| "XNNPACK/src/u8-rmax/sse2.c", |
| "XNNPACK/src/u8-vclamp/sse2-x64.c", |
| "XNNPACK/src/xx-fill/sse2-x64.c", |
| "XNNPACK/src/xx-pad/sse2.c", |
| "XNNPACK/src/x8-zip/xm-sse2.c", |
| "XNNPACK/src/x8-zip/x2-sse2.c", |
| "XNNPACK/src/x8-zip/x3-sse2.c", |
| "XNNPACK/src/x8-zip/x4-sse2.c", |
| "XNNPACK/src/x32-unpool/sse2.c", |
| "XNNPACK/src/x32-zip/xm-sse2.c", |
| "XNNPACK/src/x32-zip/x2-sse2.c", |
| "XNNPACK/src/x32-zip/x3-sse2.c", |
| "XNNPACK/src/x32-zip/x4-sse2.c", |
| ] |
| |
| PROD_SSSE3_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-2x4-acc2.c", |
| ] |
| |
| PROD_SSE41_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/f16-f32-vcvt/gen/vcvt-sse41-int16-x16.c", |
| "XNNPACK/src/f32-f16-vcvt/gen/vcvt-sse41-x8.c", |
| "XNNPACK/src/f32-prelu/gen/sse41-2x8.c", |
| "XNNPACK/src/f32-qs8-vcvt/gen/vcvt-sse41-x32.c", |
| "XNNPACK/src/f32-vlrelu/gen/vlrelu-sse41-x8.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndd-sse41-x8.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndne-sse41-x8.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndu-sse41-x8.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndz-sse41-x8.c", |
| "XNNPACK/src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-lut64-p2-div-x8.c", |
| "XNNPACK/src/qc8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16.c", |
| "XNNPACK/src/qc8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16.c", |
| "XNNPACK/src/qc8-gemm/gen/1x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qc8-gemm/gen/3x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qc8-igemm/gen/1x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qc8-igemm/gen/3x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qs8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16-add16.c", |
| "XNNPACK/src/qs8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16-add16.c", |
| "XNNPACK/src/qs8-f32-vcvt/gen/vcvt-sse41-x16.c", |
| "XNNPACK/src/qs8-gavgpool/gen/7p7x-minmax-fp32-sse41-c8.c", |
| "XNNPACK/src/qs8-gavgpool/gen/7x-minmax-fp32-sse41-c8.c", |
| "XNNPACK/src/qs8-gemm/gen/1x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qs8-gemm/gen/3x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qs8-igemm/gen/1x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qs8-igemm/gen/3x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qs8-vadd/gen/minmax-sse41-mul16-ld64-x8.c", |
| "XNNPACK/src/qs8-vaddc/gen/minmax-sse41-mul16-ld64-x8.c", |
| "XNNPACK/src/qs8-vmul/gen/minmax-fp32-sse41-mul16-ld64-x16.c", |
| "XNNPACK/src/qs8-vmulc/gen/minmax-fp32-sse41-mul16-ld64-x16.c", |
| "XNNPACK/src/qu8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16.c", |
| "XNNPACK/src/qu8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16.c", |
| "XNNPACK/src/qu8-f32-vcvt/gen/vcvt-sse41-x16.c", |
| "XNNPACK/src/qu8-gavgpool/gen/7p7x-minmax-fp32-sse41-c8.c", |
| "XNNPACK/src/qu8-gavgpool/gen/7x-minmax-fp32-sse41-c8.c", |
| "XNNPACK/src/qu8-gemm/gen/1x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qu8-gemm/gen/3x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qu8-igemm/gen/1x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qu8-igemm/gen/3x4c8-minmax-fp32-sse41-ld64.c", |
| "XNNPACK/src/qu8-vadd/gen/minmax-sse41-mul16-ld64-x8.c", |
| "XNNPACK/src/qu8-vaddc/gen/minmax-sse41-mul16-ld64-x8.c", |
| "XNNPACK/src/qu8-vmul/gen/minmax-fp32-sse41-mul16-ld64-x16.c", |
| "XNNPACK/src/qu8-vmulc/gen/minmax-fp32-sse41-mul16-ld64-x16.c", |
| "XNNPACK/src/s8-ibilinear/gen/sse41-c16.c", |
| "XNNPACK/src/s8-maxpool/9p8x-minmax-sse41-c16.c", |
| "XNNPACK/src/s8-vclamp/sse41-x64.c", |
| "XNNPACK/src/u8-ibilinear/gen/sse41-c16.c", |
| ] |
| |
| PROD_AVX_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/f16-f32-vcvt/gen/vcvt-avx-int16-x16.c", |
| "XNNPACK/src/f32-dwconv/gen/up8x25-minmax-avx.c", |
| "XNNPACK/src/f32-dwconv/gen/up16x3-minmax-avx.c", |
| "XNNPACK/src/f32-dwconv/gen/up16x4-minmax-avx.c", |
| "XNNPACK/src/f32-dwconv/gen/up16x9-minmax-avx.c", |
| "XNNPACK/src/f32-f16-vcvt/gen/vcvt-avx-x24.c", |
| "XNNPACK/src/f32-gemm/gen/1x16-minmax-avx-broadcast.c", |
| "XNNPACK/src/f32-gemm/gen/5x16-minmax-avx-broadcast.c", |
| "XNNPACK/src/f32-igemm/gen/1x16-minmax-avx-broadcast.c", |
| "XNNPACK/src/f32-igemm/gen/5x16-minmax-avx-broadcast.c", |
| "XNNPACK/src/f32-prelu/gen/avx-2x16.c", |
| "XNNPACK/src/f32-qs8-vcvt/gen/vcvt-avx-x32.c", |
| "XNNPACK/src/f32-qu8-vcvt/gen/vcvt-avx-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vadd-minmax-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vaddc-minmax-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vdiv-minmax-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vdivc-minmax-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vmax-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vmaxc-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vmin-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vminc-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vmul-minmax-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vmulc-minmax-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vrdivc-minmax-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vrsubc-minmax-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vsqrdiff-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vsqrdiffc-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vsub-minmax-avx-x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vsubc-minmax-avx-x16.c", |
| "XNNPACK/src/f32-vclamp/gen/vclamp-avx-x16.c", |
| "XNNPACK/src/f32-velu/gen/velu-avx-rr2-lut4-p4-perm-x32.c", |
| "XNNPACK/src/f32-vhswish/gen/vhswish-avx-x16.c", |
| "XNNPACK/src/f32-vlrelu/gen/vlrelu-avx-x16.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndd-avx-x16.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndne-avx-x16.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndu-avx-x16.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndz-avx-x16.c", |
| "XNNPACK/src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x40.c", |
| "XNNPACK/src/f32-vsqrt/gen/avx-sqrt-x8.c", |
| "XNNPACK/src/f32-vunary/gen/vabs-avx-x16.c", |
| "XNNPACK/src/f32-vunary/gen/vneg-avx-x16.c", |
| "XNNPACK/src/f32-vunary/gen/vsqr-avx-x16.c", |
| "XNNPACK/src/qc8-dwconv/gen/up16x9-minmax-fp32-avx-mul16-add16.c", |
| "XNNPACK/src/qc8-dwconv/gen/up16x25-minmax-fp32-avx-mul16-add16.c", |
| "XNNPACK/src/qc8-gemm/gen/1x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qc8-gemm/gen/2x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qc8-igemm/gen/1x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qc8-igemm/gen/2x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qs8-dwconv/gen/up16x9-minmax-fp32-avx-mul16-add16.c", |
| "XNNPACK/src/qs8-dwconv/gen/up16x25-minmax-fp32-avx-mul16-add16.c", |
| "XNNPACK/src/qs8-f32-vcvt/gen/vcvt-avx-x32.c", |
| "XNNPACK/src/qs8-gemm/gen/1x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qs8-gemm/gen/2x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qs8-igemm/gen/1x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qs8-igemm/gen/2x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qs8-vadd/gen/minmax-avx-mul32-ld32-x8.c", |
| "XNNPACK/src/qs8-vaddc/gen/minmax-avx-mul32-ld32-x8.c", |
| "XNNPACK/src/qs8-vmul/gen/minmax-fp32-avx-mul16-ld64-x16.c", |
| "XNNPACK/src/qs8-vmulc/gen/minmax-fp32-avx-mul16-ld64-x16.c", |
| "XNNPACK/src/qu8-dwconv/gen/up16x9-minmax-fp32-avx-mul16.c", |
| "XNNPACK/src/qu8-dwconv/gen/up16x25-minmax-fp32-avx-mul16.c", |
| "XNNPACK/src/qu8-f32-vcvt/gen/vcvt-avx-x32.c", |
| "XNNPACK/src/qu8-gemm/gen/1x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qu8-gemm/gen/2x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qu8-igemm/gen/1x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qu8-igemm/gen/2x4c8-minmax-fp32-avx-ld128.c", |
| "XNNPACK/src/qu8-vadd/gen/minmax-avx-mul32-ld32-x8.c", |
| "XNNPACK/src/qu8-vaddc/gen/minmax-avx-mul32-ld32-x8.c", |
| "XNNPACK/src/qu8-vmul/gen/minmax-fp32-avx-mul16-ld64-x16.c", |
| "XNNPACK/src/qu8-vmulc/gen/minmax-fp32-avx-mul16-ld64-x16.c", |
| "XNNPACK/src/x8-lut/gen/lut-avx-x64.c", |
| ] |
| |
| PROD_F16C_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/f16-f32-vcvt/gen/vcvt-f16c-x16.c", |
| "XNNPACK/src/f16-gavgpool/gen/7p7x-minmax-f16c-c8.c", |
| "XNNPACK/src/f16-gavgpool/gen/7x-minmax-f16c-c8.c", |
| "XNNPACK/src/f16-maxpool/9p8x-minmax-f16c-c8.c", |
| "XNNPACK/src/f16-prelu/gen/f16c-2x16.c", |
| "XNNPACK/src/f16-vbinary/gen/vadd-minmax-f16c-x16.c", |
| "XNNPACK/src/f16-vbinary/gen/vaddc-minmax-f16c-x16.c", |
| "XNNPACK/src/f16-vbinary/gen/vmul-minmax-f16c-x16.c", |
| "XNNPACK/src/f16-vbinary/gen/vmulc-minmax-f16c-x16.c", |
| "XNNPACK/src/f16-vclamp/gen/vclamp-f16c-x16.c", |
| "XNNPACK/src/f16-vhswish/gen/vhswish-f16c-x16.c", |
| "XNNPACK/src/f16-vlrelu/gen/vlrelu-f16c-x16.c", |
| "XNNPACK/src/f32-f16-vcvt/gen/vcvt-f16c-x16.c", |
| ] |
| |
| PROD_XOP_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/qc8-dwconv/gen/up16x9-minmax-fp32-xop-mul16-add16.c", |
| "XNNPACK/src/qc8-dwconv/gen/up16x25-minmax-fp32-xop-mul16-add16.c", |
| "XNNPACK/src/qc8-gemm/gen/1x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qc8-gemm/gen/2x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qc8-igemm/gen/1x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qc8-igemm/gen/2x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qs8-dwconv/gen/up16x9-minmax-fp32-xop-mul16-add16.c", |
| "XNNPACK/src/qs8-dwconv/gen/up16x25-minmax-fp32-xop-mul16-add16.c", |
| "XNNPACK/src/qs8-gemm/gen/1x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qs8-gemm/gen/2x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qs8-igemm/gen/1x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qs8-igemm/gen/2x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qs8-vadd/gen/minmax-xop-mul32-ld32-x8.c", |
| "XNNPACK/src/qs8-vaddc/gen/minmax-xop-mul32-ld32-x8.c", |
| "XNNPACK/src/qu8-dwconv/gen/up16x9-minmax-fp32-xop-mul32.c", |
| "XNNPACK/src/qu8-dwconv/gen/up16x25-minmax-fp32-xop-mul32.c", |
| "XNNPACK/src/qu8-gemm/gen/1x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qu8-gemm/gen/2x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qu8-igemm/gen/1x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qu8-igemm/gen/2x4c8-minmax-fp32-xop-ld64.c", |
| "XNNPACK/src/qu8-vadd/gen/minmax-xop-mul32-ld32-x8.c", |
| "XNNPACK/src/qu8-vaddc/gen/minmax-xop-mul32-ld32-x8.c", |
| ] |
| |
| PROD_FMA3_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/f16-dwconv/gen/up8x25-minmax-fma3-acc2.c", |
| "XNNPACK/src/f16-dwconv/gen/up16x3-minmax-fma3.c", |
| "XNNPACK/src/f16-dwconv/gen/up16x4-minmax-fma3.c", |
| "XNNPACK/src/f16-dwconv/gen/up16x9-minmax-fma3.c", |
| "XNNPACK/src/f16-ibilinear/gen/fma3-c8.c", |
| "XNNPACK/src/f16-vmulcaddc/gen/c8-minmax-fma3-2x.c", |
| "XNNPACK/src/f32-dwconv/gen/up8x25-minmax-fma3.c", |
| "XNNPACK/src/f32-dwconv/gen/up16x3-minmax-fma3.c", |
| "XNNPACK/src/f32-dwconv/gen/up16x4-minmax-fma3.c", |
| "XNNPACK/src/f32-dwconv/gen/up16x9-minmax-fma3.c", |
| "XNNPACK/src/f32-gemm/gen/1x16-minmax-fma3-broadcast.c", |
| "XNNPACK/src/f32-gemm/gen/1x16s4-minmax-fma3-broadcast.c", |
| "XNNPACK/src/f32-gemm/gen/4x16s4-minmax-fma3-broadcast.c", |
| "XNNPACK/src/f32-gemm/gen/5x16-minmax-fma3-broadcast.c", |
| "XNNPACK/src/f32-igemm/gen/1x16-minmax-fma3-broadcast.c", |
| "XNNPACK/src/f32-igemm/gen/1x16s4-minmax-fma3-broadcast.c", |
| "XNNPACK/src/f32-igemm/gen/4x16s4-minmax-fma3-broadcast.c", |
| "XNNPACK/src/f32-igemm/gen/5x16-minmax-fma3-broadcast.c", |
| "XNNPACK/src/f32-vhswish/gen/vhswish-fma3-x16.c", |
| ] |
| |
| PROD_AVX2_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/f16-gemm/gen/1x16-minmax-avx2-broadcast.c", |
| "XNNPACK/src/f16-gemm/gen/4x16-minmax-avx2-broadcast.c", |
| "XNNPACK/src/f16-igemm/gen/1x16-minmax-avx2-broadcast.c", |
| "XNNPACK/src/f16-igemm/gen/4x16-minmax-avx2-broadcast.c", |
| "XNNPACK/src/f32-qs8-vcvt/gen/vcvt-avx2-x64.c", |
| "XNNPACK/src/f32-qu8-vcvt/gen/vcvt-avx2-x64.c", |
| "XNNPACK/src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x56.c", |
| "XNNPACK/src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x40.c", |
| "XNNPACK/src/qc8-dwconv/gen/up16x9-minmax-fp32-avx2-mul32.c", |
| "XNNPACK/src/qc8-dwconv/gen/up16x25-minmax-fp32-avx2-mul32.c", |
| "XNNPACK/src/qc8-gemm/gen/1x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qc8-gemm/gen/3x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qc8-igemm/gen/1x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qc8-igemm/gen/3x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qs8-dwconv/gen/up16x9-minmax-fp32-avx2-mul32.c", |
| "XNNPACK/src/qs8-dwconv/gen/up16x25-minmax-fp32-avx2-mul32.c", |
| "XNNPACK/src/qs8-f32-vcvt/gen/vcvt-avx2-x16.c", |
| "XNNPACK/src/qs8-gemm/gen/1x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qs8-gemm/gen/3x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qs8-igemm/gen/1x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qs8-igemm/gen/3x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qs8-vadd/gen/minmax-avx2-mul32-ld64-x16.c", |
| "XNNPACK/src/qs8-vaddc/gen/minmax-avx2-mul32-ld64-x16.c", |
| "XNNPACK/src/qu8-dwconv/gen/up16x9-minmax-fp32-avx2-mul32.c", |
| "XNNPACK/src/qu8-dwconv/gen/up16x25-minmax-fp32-avx2-mul32.c", |
| "XNNPACK/src/qu8-f32-vcvt/gen/vcvt-avx2-x16.c", |
| "XNNPACK/src/qu8-gemm/gen/1x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qu8-gemm/gen/3x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qu8-igemm/gen/1x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qu8-igemm/gen/3x8c8-minmax-fp32-avx2.c", |
| "XNNPACK/src/qu8-vadd/gen/minmax-avx2-mul32-ld64-x16.c", |
| "XNNPACK/src/qu8-vaddc/gen/minmax-avx2-mul32-ld64-x16.c", |
| "XNNPACK/src/x8-lut/gen/lut-avx2-x128.c", |
| ] |
| |
| PROD_AVX512F_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/f32-dwconv/gen/up16x3-minmax-avx512f.c", |
| "XNNPACK/src/f32-dwconv/gen/up16x4-minmax-avx512f.c", |
| "XNNPACK/src/f32-dwconv/gen/up16x9-minmax-avx512f.c", |
| "XNNPACK/src/f32-dwconv/gen/up16x25-minmax-avx512f.c", |
| "XNNPACK/src/f32-gemm/gen/1x16-minmax-avx512f-broadcast.c", |
| "XNNPACK/src/f32-gemm/gen/7x16-minmax-avx512f-broadcast.c", |
| "XNNPACK/src/f32-igemm/gen/1x16-minmax-avx512f-broadcast.c", |
| "XNNPACK/src/f32-igemm/gen/7x16-minmax-avx512f-broadcast.c", |
| "XNNPACK/src/f32-prelu/gen/avx512f-2x16.c", |
| "XNNPACK/src/f32-vbinary/gen/vadd-minmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vaddc-minmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vdiv-minmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vdivc-minmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vmaxc-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vmin-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vminc-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vmul-minmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vmulc-minmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vrdivc-minmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vrsubc-minmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vsqrdiff-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vsqrdiffc-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vsub-minmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vbinary/gen/vsubc-minmax-avx512f-x32.c", |
| "XNNPACK/src/f32-vclamp/gen/vclamp-avx512f-x16.c", |
| "XNNPACK/src/f32-velu/gen/velu-avx512f-rr1-lut16-p3-perm-x64.c", |
| "XNNPACK/src/f32-vhswish/gen/vhswish-avx512f-x16.c", |
| "XNNPACK/src/f32-vlrelu/gen/vlrelu-avx512f-x16.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndd-avx512f-x16.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndne-avx512f-x16.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndu-avx512f-x16.c", |
| "XNNPACK/src/f32-vrnd/gen/vrndz-avx512f-x16.c", |
| "XNNPACK/src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-x64.c", |
| "XNNPACK/src/f32-vunary/gen/vabs-avx512f-x16.c", |
| "XNNPACK/src/f32-vunary/gen/vneg-avx512f-x16.c", |
| "XNNPACK/src/f32-vunary/gen/vsqr-avx512f-x16.c", |
| ] |
| |
| PROD_AVX512SKX_MICROKERNEL_SRCS = [ |
| "XNNPACK/src/f16-f32-vcvt/gen/vcvt-avx512skx-x16.c", |
| "XNNPACK/src/f32-f16-vcvt/gen/vcvt-avx512skx-x16.c", |
| "XNNPACK/src/f32-qs8-vcvt/gen/vcvt-avx512skx-x128.c", |
| "XNNPACK/src/f32-qu8-vcvt/gen/vcvt-avx512skx-x128.c", |
| "XNNPACK/src/qc8-dwconv/gen/up32x9-minmax-fp32-avx512skx-mul32.c", |
| "XNNPACK/src/qc8-dwconv/gen/up32x25-minmax-fp32-avx512skx-mul32.c", |
| "XNNPACK/src/qc8-gemm/gen/1x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qc8-gemm/gen/4x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qc8-igemm/gen/1x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qc8-igemm/gen/4x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qs8-dwconv/gen/up32x9-minmax-fp32-avx512skx-mul32.c", |
| "XNNPACK/src/qs8-dwconv/gen/up32x25-minmax-fp32-avx512skx-mul32.c", |
| "XNNPACK/src/qs8-f32-vcvt/gen/vcvt-avx512skx-x32.c", |
| "XNNPACK/src/qs8-gemm/gen/1x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qs8-gemm/gen/4x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qs8-igemm/gen/1x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qs8-igemm/gen/4x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qs8-vadd/gen/minmax-avx512skx-mul32-ld128-x16.c", |
| "XNNPACK/src/qs8-vaddc/gen/minmax-avx512skx-mul32-ld128-x16.c", |
| "XNNPACK/src/qu8-dwconv/gen/up32x9-minmax-fp32-avx512skx-mul32.c", |
| "XNNPACK/src/qu8-dwconv/gen/up32x25-minmax-fp32-avx512skx-mul32.c", |
| "XNNPACK/src/qu8-f32-vcvt/gen/vcvt-avx512skx-x32.c", |
| "XNNPACK/src/qu8-gemm/gen/1x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qu8-gemm/gen/4x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qu8-igemm/gen/1x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qu8-igemm/gen/4x16c8-minmax-fp32-avx512skx.c", |
| "XNNPACK/src/qu8-vadd/gen/minmax-avx512skx-mul32-ld128-x16.c", |
| "XNNPACK/src/qu8-vaddc/gen/minmax-avx512skx-mul32-ld128-x16.c", |
| "XNNPACK/src/x8-lut/gen/lut-avx512skx-vpshufb-x64.c", |
| ] |