11//
2- // Copyright © 2020-2021 Arm Ltd. All rights reserved.
2+ // Copyright © 2020-2022 Arm Ltd. All rights reserved.
33// SPDX-License-Identifier: MIT
44//
55
@@ -109,6 +109,8 @@ opencl_srcs = [
109109 " src/core/CL/cl_kernels/nhwc/normalization_layer.cl" ,
110110 " src/core/CL/cl_kernels/nhwc/normalize_planar_yuv_layer.cl" ,
111111 " src/core/CL/cl_kernels/nhwc/normalize_planar_yuv_layer_quantized.cl" ,
112+ " src/core/CL/cl_kernels/nhwc/pooling_3d_layer.cl" ,
113+ " src/core/CL/cl_kernels/nhwc/pooling_3d_layer_quantized.cl" ,
112114 " src/core/CL/cl_kernels/nhwc/pooling_layer.cl" ,
113115 " src/core/CL/cl_kernels/nhwc/pooling_layer_quantized.cl" ,
114116 " src/core/CL/cl_kernels/nhwc/reorg_layer.cl" ,
@@ -278,7 +280,6 @@ cc_library_static {
278280 " src/core/NEON/kernels/NEInstanceNormalizationLayerKernel.cpp" ,
279281 " src/core/NEON/kernels/NEL2NormalizeLayerKernel.cpp" ,
280282 " src/core/NEON/kernels/NELogicalKernel.cpp" ,
281- " src/core/NEON/kernels/NEMaxUnpoolingLayerKernel.cpp" ,
282283 " src/core/NEON/kernels/NEMeanStdDevNormalizationKernel.cpp" ,
283284 " src/core/NEON/kernels/NENormalizationLayerKernel.cpp" ,
284285 " src/core/NEON/kernels/NEPadLayerKernel.cpp" ,
@@ -296,12 +297,16 @@ cc_library_static {
296297 " src/core/NEON/kernels/NEStackLayerKernel.cpp" ,
297298 " src/core/NEON/kernels/NEStridedSliceKernel.cpp" ,
298299 " src/core/NEON/kernels/NETileKernel.cpp" ,
300+ " src/core/NEON/kernels/arm_conv/addressing.cpp" ,
299301 " src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp16.cpp" ,
300302 " src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp32.cpp" ,
301303 " src/core/NEON/kernels/arm_conv/depthwise/depthwise_s8q.cpp" ,
304+ " src/core/NEON/kernels/arm_conv/depthwise/depthwise_strategies_common.cpp" ,
302305 " src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8q.cpp" ,
303306 " src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8s8u8q.cpp" ,
304307 " src/core/NEON/kernels/arm_conv/depthwise/interleaves/8b_mla.cpp" ,
308+ " src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic.cpp" ,
309+ " src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic_quantized_dot_product.cpp" ,
305310 " src/core/NEON/kernels/arm_conv/pooling/kernels/cpp_nhwc_1x1_stride_any_depthfirst/generic.cpp" ,
306311 " src/core/NEON/kernels/arm_conv/pooling/pooling_fp16.cpp" ,
307312 " src/core/NEON/kernels/arm_conv/pooling/pooling_fp32.cpp" ,
@@ -363,6 +368,16 @@ cc_library_static {
363368 " src/core/Utils.cpp" ,
364369 " src/core/Validate.cpp" ,
365370 " src/core/Version.cpp" ,
371+ " src/core/experimental/dynamic_fusion/ClKernelBuildingAPI.cpp" ,
372+ " src/core/experimental/dynamic_fusion/ClKernelBuildingImpl/components/ClDirectConvolutionKernelComponent.cpp" ,
373+ " src/core/experimental/dynamic_fusion/ClKernelBuildingImpl/components/ClElementwiseAddKernelComponent.cpp" ,
374+ " src/core/experimental/dynamic_fusion/ClKernelBuildingImpl/components/ClStoreKernelComponents.cpp" ,
375+ " src/core/experimental/dynamic_fusion/OperatorGraph.cpp" ,
376+ " src/core/experimental/dynamic_fusion/WorkloadImpl/ClFusedKernelGraph.cpp" ,
377+ " src/core/experimental/dynamic_fusion/WorkloadImpl/ClKernelGraph.cpp" ,
378+ " src/core/experimental/dynamic_fusion/WorkloadImpl/ClWorkload.cpp" ,
379+ " src/core/experimental/dynamic_fusion/WorkloadImpl/DependencyGraph.cpp" ,
380+ " src/core/experimental/dynamic_fusion/WorkloadImpl/OperatorGraphImpl.cpp" ,
366381 " src/core/helpers/SoftmaxHelpers.cpp" ,
367382 " src/core/helpers/WindowHelpers.cpp" ,
368383 " src/core/utils/AssemblyUtils.cpp" ,
@@ -412,9 +427,11 @@ cc_library_static {
412427 " src/cpu/kernels/CpuGemmMatrixMultiplyKernel.cpp" ,
413428 " src/cpu/kernels/CpuGemmTranspose1xWKernel.cpp" ,
414429 " src/cpu/kernels/CpuIm2ColKernel.cpp" ,
430+ " src/cpu/kernels/CpuMaxUnpoolingLayerKernel.cpp" ,
415431 " src/cpu/kernels/CpuMulKernel.cpp" ,
416432 " src/cpu/kernels/CpuPermuteKernel.cpp" ,
417433 " src/cpu/kernels/CpuPool2dKernel.cpp" ,
434+ " src/cpu/kernels/CpuPool3dKernel.cpp" ,
418435 " src/cpu/kernels/CpuQuantizeKernel.cpp" ,
419436 " src/cpu/kernels/CpuReshapeKernel.cpp" ,
420437 " src/cpu/kernels/CpuScaleKernel.cpp" ,
@@ -439,20 +456,44 @@ cc_library_static {
439456 " src/cpu/kernels/boundingboxtransform/generic/neon/fp32.cpp" ,
440457 " src/cpu/kernels/boundingboxtransform/generic/neon/impl.cpp" ,
441458 " src/cpu/kernels/boundingboxtransform/generic/neon/qsymm16.cpp" ,
459+ " src/cpu/kernels/cast/generic/neon/bfloat16.cpp" ,
460+ " src/cpu/kernels/cast/generic/neon/fp16.cpp" ,
442461 " src/cpu/kernels/crop/generic/neon/fp16.cpp" ,
443462 " src/cpu/kernels/crop/generic/neon/fp32.cpp" ,
444463 " src/cpu/kernels/crop/generic/neon/impl.cpp" ,
445464 " src/cpu/kernels/crop/generic/neon/integer.cpp" ,
465+ " src/cpu/kernels/depthwiseconv2d/generic/neon/fp16.cpp" ,
466+ " src/cpu/kernels/depthwiseconv2d/generic/neon/fp32.cpp" ,
467+ " src/cpu/kernels/depthwiseconv2d/generic/neon/impl.cpp" ,
468+ " src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8.cpp" ,
469+ " src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8_signed.cpp" ,
470+ " src/cpu/kernels/directconv2d/nchw/all.cpp" ,
471+ " src/cpu/kernels/directconv2d/nhwc/neon/fp32.cpp" ,
472+ " src/cpu/kernels/directconv2d/nhwc/neon/impl.cpp" ,
446473 " src/cpu/kernels/elementwise_binary/generic/neon/fp16.cpp" ,
447474 " src/cpu/kernels/elementwise_binary/generic/neon/fp32.cpp" ,
448475 " src/cpu/kernels/elementwise_binary/generic/neon/integer.cpp" ,
449476 " src/cpu/kernels/elementwise_binary/generic/neon/qasymm8.cpp" ,
450477 " src/cpu/kernels/elementwise_binary/generic/neon/qasymm8_signed.cpp" ,
451478 " src/cpu/kernels/elementwise_unary/generic/neon/fp16.cpp" ,
452479 " src/cpu/kernels/elementwise_unary/generic/neon/fp32.cpp" ,
480+ " src/cpu/kernels/elementwise_unary/generic/neon/impl.cpp" ,
453481 " src/cpu/kernels/elementwise_unary/generic/neon/integer.cpp" ,
454482 " src/cpu/kernels/floor/neon/fp16.cpp" ,
455483 " src/cpu/kernels/floor/neon/fp32.cpp" ,
484+ " src/cpu/kernels/fuse_batch_normalization/generic/fp16.cpp" ,
485+ " src/cpu/kernels/fuse_batch_normalization/generic/fp32.cpp" ,
486+ " src/cpu/kernels/fuse_batch_normalization/generic/impl.cpp" ,
487+ " src/cpu/kernels/fuse_batch_normalization/nchw/all.cpp" ,
488+ " src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp16.cpp" ,
489+ " src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp32.cpp" ,
490+ " src/cpu/kernels/fuse_batch_normalization/nhwc/neon/impl.cpp" ,
491+ " src/cpu/kernels/gemm_matrix_add/generic/neon/fp16.cpp" ,
492+ " src/cpu/kernels/gemm_matrix_add/generic/neon/fp32.cpp" ,
493+ " src/cpu/kernels/gemm_matrix_add/generic/neon/impl.cpp" ,
494+ " src/cpu/kernels/gemm_matrix_mul/generic/neon/fp16.cpp" ,
495+ " src/cpu/kernels/gemm_matrix_mul/generic/neon/fp32.cpp" ,
496+ " src/cpu/kernels/gemm_matrix_mul/generic/neon/impl.cpp" ,
456497 " src/cpu/kernels/genproposals/generic/neon/fp16.cpp" ,
457498 " src/cpu/kernels/genproposals/generic/neon/fp32.cpp" ,
458499 " src/cpu/kernels/genproposals/generic/neon/impl.cpp" ,
@@ -462,6 +503,9 @@ cc_library_static {
462503 " src/cpu/kernels/instancenorm/generic/neon/impl.cpp" ,
463504 " src/cpu/kernels/internal/CpuDepthwiseConv2dAssemblyWrapperKernel.cpp" ,
464505 " src/cpu/kernels/internal/CpuPool2dAssemblyWrapperKernel.cpp" ,
506+ " src/cpu/kernels/l2normlayer/generic/neon/fp16.cpp" ,
507+ " src/cpu/kernels/l2normlayer/generic/neon/fp32.cpp" ,
508+ " src/cpu/kernels/l2normlayer/generic/neon/impl.cpp" ,
465509 " src/cpu/kernels/maxunpool/generic/neon/fp16.cpp" ,
466510 " src/cpu/kernels/maxunpool/generic/neon/fp32.cpp" ,
467511 " src/cpu/kernels/maxunpool/generic/neon/impl.cpp" ,
@@ -475,6 +519,11 @@ cc_library_static {
475519 " src/cpu/kernels/pool2d/neon/nchw/all.cpp" ,
476520 " src/cpu/kernels/pool2d/neon/qasymm8.cpp" ,
477521 " src/cpu/kernels/pool2d/neon/qasymm8_signed.cpp" ,
522+ " src/cpu/kernels/pool3d/neon/fp16.cpp" ,
523+ " src/cpu/kernels/pool3d/neon/fp32.cpp" ,
524+ " src/cpu/kernels/pool3d/neon/impl.cpp" ,
525+ " src/cpu/kernels/pool3d/neon/qasymm8.cpp" ,
526+ " src/cpu/kernels/pool3d/neon/qasymm8_signed.cpp" ,
478527 " src/cpu/kernels/range/generic/neon/fp16.cpp" ,
479528 " src/cpu/kernels/range/generic/neon/fp32.cpp" ,
480529 " src/cpu/kernels/range/generic/neon/impl.cpp" ,
@@ -494,6 +543,7 @@ cc_library_static {
494543 " src/cpu/kernels/select/generic/neon/integer.cpp" ,
495544 " src/cpu/kernels/softmax/generic/neon/fp16.cpp" ,
496545 " src/cpu/kernels/softmax/generic/neon/fp32.cpp" ,
546+ " src/cpu/kernels/softmax/generic/neon/impl.cpp" ,
497547 " src/cpu/kernels/softmax/generic/neon/qasymm8.cpp" ,
498548 " src/cpu/kernels/softmax/generic/neon/qasymm8_signed.cpp" ,
499549 " src/cpu/kernels/sub/neon/qasymm8.cpp" ,
@@ -522,9 +572,11 @@ cc_library_static {
522572 " src/cpu/operators/CpuGemmDirectConv2d.cpp" ,
523573 " src/cpu/operators/CpuGemmLowpMatrixMultiplyCore.cpp" ,
524574 " src/cpu/operators/CpuGemmLowpOutputStage.cpp" ,
575+ " src/cpu/operators/CpuMaxUnpooling.cpp" ,
525576 " src/cpu/operators/CpuMul.cpp" ,
526577 " src/cpu/operators/CpuPermute.cpp" ,
527578 " src/cpu/operators/CpuPool2d.cpp" ,
579+ " src/cpu/operators/CpuPool3d.cpp" ,
528580 " src/cpu/operators/CpuQuantize.cpp" ,
529581 " src/cpu/operators/CpuReshape.cpp" ,
530582 " src/cpu/operators/CpuScale.cpp" ,
@@ -571,6 +623,7 @@ cc_library_static {
571623 " src/gpu/cl/kernels/ClMulKernel.cpp" ,
572624 " src/gpu/cl/kernels/ClPermuteKernel.cpp" ,
573625 " src/gpu/cl/kernels/ClPool2dKernel.cpp" ,
626+ " src/gpu/cl/kernels/ClPool3dKernel.cpp" ,
574627 " src/gpu/cl/kernels/ClQuantizeKernel.cpp" ,
575628 " src/gpu/cl/kernels/ClReshapeKernel.cpp" ,
576629 " src/gpu/cl/kernels/ClScaleKernel.cpp" ,
@@ -583,6 +636,7 @@ cc_library_static {
583636 " src/gpu/cl/kernels/ClWinogradFilterTransformKernel.cpp" ,
584637 " src/gpu/cl/kernels/ClWinogradInputTransformKernel.cpp" ,
585638 " src/gpu/cl/kernels/ClWinogradOutputTransformKernel.cpp" ,
639+ " src/gpu/cl/kernels/experimental/dynamic_fusion/ClCompositeKernel.cpp" ,
586640 " src/gpu/cl/kernels/gemm/ClGemmHelpers.cpp" ,
587641 " src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeBifrost.cpp" ,
588642 " src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeMidgard.cpp" ,
@@ -617,13 +671,15 @@ cc_library_static {
617671 " src/gpu/cl/operators/ClPRelu.cpp" ,
618672 " src/gpu/cl/operators/ClPermute.cpp" ,
619673 " src/gpu/cl/operators/ClPool2d.cpp" ,
674+ " src/gpu/cl/operators/ClPool3d.cpp" ,
620675 " src/gpu/cl/operators/ClQuantize.cpp" ,
621676 " src/gpu/cl/operators/ClReshape.cpp" ,
622677 " src/gpu/cl/operators/ClScale.cpp" ,
623678 " src/gpu/cl/operators/ClSoftmax.cpp" ,
624679 " src/gpu/cl/operators/ClSub.cpp" ,
625680 " src/gpu/cl/operators/ClTranspose.cpp" ,
626681 " src/gpu/cl/operators/ClWinogradConv2d.cpp" ,
682+ " src/gpu/cl/operators/experimental/dynamic_fusion/ClCompositeOperator.cpp" ,
627683 " src/runtime/Allocator.cpp" ,
628684 " src/runtime/BlobLifetimeManager.cpp" ,
629685 " src/runtime/BlobMemoryPool.cpp" ,
@@ -700,6 +756,7 @@ cc_library_static {
700756 " src/runtime/CL/functions/CLPadLayer.cpp" ,
701757 " src/runtime/CL/functions/CLPermute.cpp" ,
702758 " src/runtime/CL/functions/CLPixelWiseMultiplication.cpp" ,
759+ " src/runtime/CL/functions/CLPooling3dLayer.cpp" ,
703760 " src/runtime/CL/functions/CLPoolingLayer.cpp" ,
704761 " src/runtime/CL/functions/CLPriorBoxLayer.cpp" ,
705762 " src/runtime/CL/functions/CLQLSTMLayer.cpp" ,
@@ -810,6 +867,7 @@ cc_library_static {
810867 " src/runtime/NEON/functions/NEPadLayer.cpp" ,
811868 " src/runtime/NEON/functions/NEPermute.cpp" ,
812869 " src/runtime/NEON/functions/NEPixelWiseMultiplication.cpp" ,
870+ " src/runtime/NEON/functions/NEPooling3dLayer.cpp" ,
813871 " src/runtime/NEON/functions/NEPoolingLayer.cpp" ,
814872 " src/runtime/NEON/functions/NEPriorBoxLayer.cpp" ,
815873 " src/runtime/NEON/functions/NEQLSTMLayer.cpp" ,
@@ -913,6 +971,9 @@ cc_library_static {
913971 " src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp" ,
914972 " src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp" ,
915973 " src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp" ,
974+ " src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp" ,
975+ " src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp" ,
976+ " src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp" ,
916977 " src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp" ,
917978 " src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp" ,
918979 " src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp" ,
0 commit comments