`/* Implementation of the MATMUL intrinsic
   Copyright (C) 2002-2020 Free Software Foundation, Inc.
   Contributed by Thomas Koenig <tkoenig@gcc.gnu.org>.

This file is part of the GNU Fortran runtime library (libgfortran).

Libgfortran is free software; you can redistribute it and/or
modify it under the terms of the GNU General Public
License as published by the Free Software Foundation; either
version 3 of the License, or (at your option) any later version.

Libgfortran is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

Under Section 7 of GPL version 3, you are granted additional
permissions described in the GCC Runtime Library Exception, version
3.1, as published by the Free Software Foundation.

You should have received a copy of the GNU General Public License and
a copy of the GCC Runtime Library Exception along with this program;
see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
<http://www.gnu.org/licenses/>.  */

#include "libgfortran.h"
#include <string.h>
#include <assert.h>'

dnl This is an m4 template, not plain C.  Text between a backquote and an
dnl apostrophe is copied to the generated C file verbatim; everything
dnl outside those quotes is subject to macro expansion.  Each dnl must be
dnl the last thing on its line because it discards the rest of that line.
dnl
dnl NOTE(review): iparm.m4 is assumed to define the rtype, rtype_name and
dnl rtype_code macros used below -- confirm against that file.
include(iparm.m4)dnl

/* These are the specific versions of matmul with -mprefer-avx128.  */

`#if defined (HAVE_'rtype_name`)

/* Prototype for the BLAS ?gemm subroutine, a pointer to which can be
   passed to us by the front-end, in which case we call it for large
   matrices.  */

typedef void (*blas_call)(const char *, const char *, const int *, const int *,
                          const int *, const 'rtype_name` *, const 'rtype_name` *,
                          const int *, const 'rtype_name` *, const int *,
                          const 'rtype_name` *, 'rtype_name` *, const int *,
                          int, int);

#if defined(HAVE_AVX) && defined(HAVE_FMA3) && defined(HAVE_AVX128)
'dnl
dnl FMA3 variant.  The function name is built from rtype_code and the
dnl prototype carries a target attribute enabling AVX and FMA for this one
dnl function only.
dnl NOTE(review): matmul_internal.m4 is assumed to emit the function body
dnl under the current matmul_name -- confirm against that file.
define(`matmul_name',`matmul_'rtype_code`_avx128_fma3')dnl
`void
'matmul_name` ('rtype` * const restrict retarray,
	'rtype` * const restrict a, 'rtype` * const restrict b, int try_blas,
	int blas_limit, blas_call gemm) __attribute__((__target__("avx,fma")));
internal_proto('matmul_name`);
'include(matmul_internal.m4)dnl
`#endif

#if defined(HAVE_AVX) && defined(HAVE_FMA4) && defined(HAVE_AVX128)
'dnl
dnl FMA4 variant.  Same shape as the FMA3 section above, but matmul_name is
dnl redefined with the fma4 suffix and the target attribute selects AVX and
dnl FMA4 instead.
define(`matmul_name',`matmul_'rtype_code`_avx128_fma4')dnl
`void
'matmul_name` ('rtype` * const restrict retarray,
	'rtype` * const restrict a, 'rtype` * const restrict b, int try_blas,
	int blas_limit, blas_call gemm) __attribute__((__target__("avx,fma4")));
internal_proto('matmul_name`);
'include(matmul_internal.m4)dnl
`#endif

#endif
'