1 `/* Implementation of the MATMUL intrinsic
2 Copyright 2002, 2005, 2006, 2007, 2009, 2012 Free Software Foundation, Inc.
3 Contributed by Paul Brook <paul@nowt.org>
5 This file is part of the GNU Fortran runtime library (libgfortran).
7 Libgfortran is free software; you can redistribute it and/or
8 modify it under the terms of the GNU General Public
9 License as published by the Free Software Foundation; either
10 version 3 of the License, or (at your option) any later version.
12 Libgfortran is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 Under Section 7 of GPL version 3, you are granted additional
18 permissions described in the GCC Runtime Library Exception, version
19 3.1, as published by the Free Software Foundation.
21 You should have received a copy of the GNU General Public License and
22 a copy of the GCC Runtime Library Exception along with this program;
23 see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
24 <http://www.gnu.org/licenses/>. */
26 #include "libgfortran.h"
32 `#if defined (HAVE_'rtype_name`)
34 /* Dimensions: retarray(x,y) a(x, count) b(count,y).
35 Either a or b can be rank 1. In this case x or y is 1. */
37 extern void matmul_'rtype_code` ('rtype` * const restrict,
38 gfc_array_l1 * const restrict, gfc_array_l1 * const restrict);
39 export_proto(matmul_'rtype_code`);
42 matmul_'rtype_code` ('rtype` * const restrict retarray,
43 gfc_array_l1 * const restrict a, gfc_array_l1 * const restrict b)
45 const GFC_LOGICAL_1 * restrict abase;
46 const GFC_LOGICAL_1 * restrict bbase;
47 'rtype_name` * restrict dest;
59 const GFC_LOGICAL_1 * restrict pa;
60 const GFC_LOGICAL_1 * restrict pb;
66 assert (GFC_DESCRIPTOR_RANK (a) == 2
67 || GFC_DESCRIPTOR_RANK (b) == 2);
69 if (retarray->base_addr == NULL)
71 if (GFC_DESCRIPTOR_RANK (a) == 1)
73 GFC_DIMENSION_SET(retarray->dim[0], 0,
74 GFC_DESCRIPTOR_EXTENT(b,1) - 1, 1);
76 else if (GFC_DESCRIPTOR_RANK (b) == 1)
78 GFC_DIMENSION_SET(retarray->dim[0], 0,
79 GFC_DESCRIPTOR_EXTENT(a,0) - 1, 1);
83 GFC_DIMENSION_SET(retarray->dim[0], 0,
84 GFC_DESCRIPTOR_EXTENT(a,0) - 1, 1);
86 GFC_DIMENSION_SET(retarray->dim[1], 0,
87 GFC_DESCRIPTOR_EXTENT(b,1) - 1,
88 GFC_DESCRIPTOR_EXTENT(retarray,0));
92 = xmalloc (sizeof ('rtype_name`) * size0 ((array_t *) retarray));
95 else if (unlikely (compile_options.bounds_check))
97 index_type ret_extent, arg_extent;
99 if (GFC_DESCRIPTOR_RANK (a) == 1)
101 arg_extent = GFC_DESCRIPTOR_EXTENT(b,1);
102 ret_extent = GFC_DESCRIPTOR_EXTENT(retarray,0);
103 if (arg_extent != ret_extent)
104 runtime_error ("Incorrect extent in return array in"
105 " MATMUL intrinsic: is %ld, should be %ld",
106 (long int) ret_extent, (long int) arg_extent);
108 else if (GFC_DESCRIPTOR_RANK (b) == 1)
110 arg_extent = GFC_DESCRIPTOR_EXTENT(a,0);
111 ret_extent = GFC_DESCRIPTOR_EXTENT(retarray,0);
112 if (arg_extent != ret_extent)
113 runtime_error ("Incorrect extent in return array in"
114 " MATMUL intrinsic: is %ld, should be %ld",
115 (long int) ret_extent, (long int) arg_extent);
119 arg_extent = GFC_DESCRIPTOR_EXTENT(a,0);
120 ret_extent = GFC_DESCRIPTOR_EXTENT(retarray,0);
121 if (arg_extent != ret_extent)
122 runtime_error ("Incorrect extent in return array in"
123 " MATMUL intrinsic for dimension 1:"
124 " is %ld, should be %ld",
125 (long int) ret_extent, (long int) arg_extent);
127 arg_extent = GFC_DESCRIPTOR_EXTENT(b,1);
128 ret_extent = GFC_DESCRIPTOR_EXTENT(retarray,1);
129 if (arg_extent != ret_extent)
130 runtime_error ("Incorrect extent in return array in"
131 " MATMUL intrinsic for dimension 2:"
132 " is %ld, should be %ld",
133 (long int) ret_extent, (long int) arg_extent);
137 abase = a->base_addr;
138 a_kind = GFC_DESCRIPTOR_SIZE (a);
140 if (a_kind == 1 || a_kind == 2 || a_kind == 4 || a_kind == 8
141 #ifdef HAVE_GFC_LOGICAL_16
145 abase = GFOR_POINTER_TO_L1 (abase, a_kind);
147 internal_error (NULL, "Funny sized logical array");
149 bbase = b->base_addr;
150 b_kind = GFC_DESCRIPTOR_SIZE (b);
152 if (b_kind == 1 || b_kind == 2 || b_kind == 4 || b_kind == 8
153 #ifdef HAVE_GFC_LOGICAL_16
157 bbase = GFOR_POINTER_TO_L1 (bbase, b_kind);
159 internal_error (NULL, "Funny sized logical array");
161 dest = retarray->base_addr;
163 sinclude(`matmul_asm_'rtype_code`.m4')dnl
165 if (GFC_DESCRIPTOR_RANK (retarray) == 1)
167 rxstride = GFC_DESCRIPTOR_STRIDE(retarray,0);
172 rxstride = GFC_DESCRIPTOR_STRIDE(retarray,0);
173 rystride = GFC_DESCRIPTOR_STRIDE(retarray,1);
176 /* If we have rank 1 parameters, zero the absent stride, and set the size to
178 if (GFC_DESCRIPTOR_RANK (a) == 1)
180 astride = GFC_DESCRIPTOR_STRIDE_BYTES(a,0);
181 count = GFC_DESCRIPTOR_EXTENT(a,0);
188 astride = GFC_DESCRIPTOR_STRIDE_BYTES(a,1);
189 count = GFC_DESCRIPTOR_EXTENT(a,1);
190 xstride = GFC_DESCRIPTOR_STRIDE_BYTES(a,0);
191 xcount = GFC_DESCRIPTOR_EXTENT(a,0);
193 if (GFC_DESCRIPTOR_RANK (b) == 1)
195 bstride = GFC_DESCRIPTOR_STRIDE_BYTES(b,0);
196 assert(count == GFC_DESCRIPTOR_EXTENT(b,0));
203 bstride = GFC_DESCRIPTOR_STRIDE_BYTES(b,0);
204 assert(count == GFC_DESCRIPTOR_EXTENT(b,0));
205 ystride = GFC_DESCRIPTOR_STRIDE_BYTES(b,1);
206 ycount = GFC_DESCRIPTOR_EXTENT(b,1);
209 for (y = 0; y < ycount; y++)
211 for (x = 0; x < xcount; x++)
213 /* Do the summation for this element. For real and integer types
214 this is the same as DOT_PRODUCT. For complex types we use do
215 a*b, not conjg(a)*b. */
220 for (n = 0; n < count; n++)
234 abase -= xstride * xcount;
236 dest += rystride - (rxstride * xcount);