1*b1e83836Smrg /* Implementation of the SUM intrinsic
2*b1e83836Smrg Copyright (C) 2002-2022 Free Software Foundation, Inc.
3*b1e83836Smrg Contributed by Paul Brook <paul@nowt.org>
4*b1e83836Smrg
5*b1e83836Smrg This file is part of the GNU Fortran 95 runtime library (libgfortran).
6*b1e83836Smrg
7*b1e83836Smrg Libgfortran is free software; you can redistribute it and/or
8*b1e83836Smrg modify it under the terms of the GNU General Public
9*b1e83836Smrg License as published by the Free Software Foundation; either
10*b1e83836Smrg version 3 of the License, or (at your option) any later version.
11*b1e83836Smrg
12*b1e83836Smrg Libgfortran is distributed in the hope that it will be useful,
13*b1e83836Smrg but WITHOUT ANY WARRANTY; without even the implied warranty of
14*b1e83836Smrg MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15*b1e83836Smrg GNU General Public License for more details.
16*b1e83836Smrg
17*b1e83836Smrg Under Section 7 of GPL version 3, you are granted additional
18*b1e83836Smrg permissions described in the GCC Runtime Library Exception, version
19*b1e83836Smrg 3.1, as published by the Free Software Foundation.
20*b1e83836Smrg
21*b1e83836Smrg You should have received a copy of the GNU General Public License and
22*b1e83836Smrg a copy of the GCC Runtime Library Exception along with this program;
23*b1e83836Smrg see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
24*b1e83836Smrg <http://www.gnu.org/licenses/>. */
25*b1e83836Smrg
26*b1e83836Smrg #include "libgfortran.h"
27*b1e83836Smrg
28*b1e83836Smrg
29*b1e83836Smrg #if defined (HAVE_GFC_COMPLEX_17) && defined (HAVE_GFC_COMPLEX_17)
30*b1e83836Smrg
31*b1e83836Smrg
32*b1e83836Smrg extern void sum_c17 (gfc_array_c17 * const restrict,
33*b1e83836Smrg gfc_array_c17 * const restrict, const index_type * const restrict);
34*b1e83836Smrg export_proto(sum_c17);
35*b1e83836Smrg
36*b1e83836Smrg void
sum_c17(gfc_array_c17 * const restrict retarray,gfc_array_c17 * const restrict array,const index_type * const restrict pdim)37*b1e83836Smrg sum_c17 (gfc_array_c17 * const restrict retarray,
38*b1e83836Smrg gfc_array_c17 * const restrict array,
39*b1e83836Smrg const index_type * const restrict pdim)
40*b1e83836Smrg {
41*b1e83836Smrg index_type count[GFC_MAX_DIMENSIONS];
42*b1e83836Smrg index_type extent[GFC_MAX_DIMENSIONS];
43*b1e83836Smrg index_type sstride[GFC_MAX_DIMENSIONS];
44*b1e83836Smrg index_type dstride[GFC_MAX_DIMENSIONS];
45*b1e83836Smrg const GFC_COMPLEX_17 * restrict base;
46*b1e83836Smrg GFC_COMPLEX_17 * restrict dest;
47*b1e83836Smrg index_type rank;
48*b1e83836Smrg index_type n;
49*b1e83836Smrg index_type len;
50*b1e83836Smrg index_type delta;
51*b1e83836Smrg index_type dim;
52*b1e83836Smrg int continue_loop;
53*b1e83836Smrg
54*b1e83836Smrg /* Make dim zero based to avoid confusion. */
55*b1e83836Smrg rank = GFC_DESCRIPTOR_RANK (array) - 1;
56*b1e83836Smrg dim = (*pdim) - 1;
57*b1e83836Smrg
58*b1e83836Smrg if (unlikely (dim < 0 || dim > rank))
59*b1e83836Smrg {
60*b1e83836Smrg runtime_error ("Dim argument incorrect in SUM intrinsic: "
61*b1e83836Smrg "is %ld, should be between 1 and %ld",
62*b1e83836Smrg (long int) dim + 1, (long int) rank + 1);
63*b1e83836Smrg }
64*b1e83836Smrg
65*b1e83836Smrg len = GFC_DESCRIPTOR_EXTENT(array,dim);
66*b1e83836Smrg if (len < 0)
67*b1e83836Smrg len = 0;
68*b1e83836Smrg delta = GFC_DESCRIPTOR_STRIDE(array,dim);
69*b1e83836Smrg
70*b1e83836Smrg for (n = 0; n < dim; n++)
71*b1e83836Smrg {
72*b1e83836Smrg sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n);
73*b1e83836Smrg extent[n] = GFC_DESCRIPTOR_EXTENT(array,n);
74*b1e83836Smrg
75*b1e83836Smrg if (extent[n] < 0)
76*b1e83836Smrg extent[n] = 0;
77*b1e83836Smrg }
78*b1e83836Smrg for (n = dim; n < rank; n++)
79*b1e83836Smrg {
80*b1e83836Smrg sstride[n] = GFC_DESCRIPTOR_STRIDE(array, n + 1);
81*b1e83836Smrg extent[n] = GFC_DESCRIPTOR_EXTENT(array, n + 1);
82*b1e83836Smrg
83*b1e83836Smrg if (extent[n] < 0)
84*b1e83836Smrg extent[n] = 0;
85*b1e83836Smrg }
86*b1e83836Smrg
87*b1e83836Smrg if (retarray->base_addr == NULL)
88*b1e83836Smrg {
89*b1e83836Smrg size_t alloc_size, str;
90*b1e83836Smrg
91*b1e83836Smrg for (n = 0; n < rank; n++)
92*b1e83836Smrg {
93*b1e83836Smrg if (n == 0)
94*b1e83836Smrg str = 1;
95*b1e83836Smrg else
96*b1e83836Smrg str = GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1];
97*b1e83836Smrg
98*b1e83836Smrg GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str);
99*b1e83836Smrg
100*b1e83836Smrg }
101*b1e83836Smrg
102*b1e83836Smrg retarray->offset = 0;
103*b1e83836Smrg retarray->dtype.rank = rank;
104*b1e83836Smrg
105*b1e83836Smrg alloc_size = GFC_DESCRIPTOR_STRIDE(retarray,rank-1) * extent[rank-1];
106*b1e83836Smrg
107*b1e83836Smrg retarray->base_addr = xmallocarray (alloc_size, sizeof (GFC_COMPLEX_17));
108*b1e83836Smrg if (alloc_size == 0)
109*b1e83836Smrg {
110*b1e83836Smrg /* Make sure we have a zero-sized array. */
111*b1e83836Smrg GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1);
112*b1e83836Smrg return;
113*b1e83836Smrg
114*b1e83836Smrg }
115*b1e83836Smrg }
116*b1e83836Smrg else
117*b1e83836Smrg {
118*b1e83836Smrg if (rank != GFC_DESCRIPTOR_RANK (retarray))
119*b1e83836Smrg runtime_error ("rank of return array incorrect in"
120*b1e83836Smrg " SUM intrinsic: is %ld, should be %ld",
121*b1e83836Smrg (long int) (GFC_DESCRIPTOR_RANK (retarray)),
122*b1e83836Smrg (long int) rank);
123*b1e83836Smrg
124*b1e83836Smrg if (unlikely (compile_options.bounds_check))
125*b1e83836Smrg bounds_ifunction_return ((array_t *) retarray, extent,
126*b1e83836Smrg "return value", "SUM");
127*b1e83836Smrg }
128*b1e83836Smrg
129*b1e83836Smrg for (n = 0; n < rank; n++)
130*b1e83836Smrg {
131*b1e83836Smrg count[n] = 0;
132*b1e83836Smrg dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n);
133*b1e83836Smrg if (extent[n] <= 0)
134*b1e83836Smrg return;
135*b1e83836Smrg }
136*b1e83836Smrg
137*b1e83836Smrg base = array->base_addr;
138*b1e83836Smrg dest = retarray->base_addr;
139*b1e83836Smrg
140*b1e83836Smrg continue_loop = 1;
141*b1e83836Smrg while (continue_loop)
142*b1e83836Smrg {
143*b1e83836Smrg const GFC_COMPLEX_17 * restrict src;
144*b1e83836Smrg GFC_COMPLEX_17 result;
145*b1e83836Smrg src = base;
146*b1e83836Smrg {
147*b1e83836Smrg
148*b1e83836Smrg result = 0;
149*b1e83836Smrg if (len <= 0)
150*b1e83836Smrg *dest = 0;
151*b1e83836Smrg else
152*b1e83836Smrg {
153*b1e83836Smrg #if ! defined HAVE_BACK_ARG
154*b1e83836Smrg for (n = 0; n < len; n++, src += delta)
155*b1e83836Smrg {
156*b1e83836Smrg #endif
157*b1e83836Smrg
158*b1e83836Smrg result += *src;
159*b1e83836Smrg }
160*b1e83836Smrg
161*b1e83836Smrg *dest = result;
162*b1e83836Smrg }
163*b1e83836Smrg }
164*b1e83836Smrg /* Advance to the next element. */
165*b1e83836Smrg count[0]++;
166*b1e83836Smrg base += sstride[0];
167*b1e83836Smrg dest += dstride[0];
168*b1e83836Smrg n = 0;
169*b1e83836Smrg while (count[n] == extent[n])
170*b1e83836Smrg {
171*b1e83836Smrg /* When we get to the end of a dimension, reset it and increment
172*b1e83836Smrg the next dimension. */
173*b1e83836Smrg count[n] = 0;
174*b1e83836Smrg /* We could precalculate these products, but this is a less
175*b1e83836Smrg frequently used path so probably not worth it. */
176*b1e83836Smrg base -= sstride[n] * extent[n];
177*b1e83836Smrg dest -= dstride[n] * extent[n];
178*b1e83836Smrg n++;
179*b1e83836Smrg if (n >= rank)
180*b1e83836Smrg {
181*b1e83836Smrg /* Break out of the loop. */
182*b1e83836Smrg continue_loop = 0;
183*b1e83836Smrg break;
184*b1e83836Smrg }
185*b1e83836Smrg else
186*b1e83836Smrg {
187*b1e83836Smrg count[n]++;
188*b1e83836Smrg base += sstride[n];
189*b1e83836Smrg dest += dstride[n];
190*b1e83836Smrg }
191*b1e83836Smrg }
192*b1e83836Smrg }
193*b1e83836Smrg }
194*b1e83836Smrg
195*b1e83836Smrg
196*b1e83836Smrg extern void msum_c17 (gfc_array_c17 * const restrict,
197*b1e83836Smrg gfc_array_c17 * const restrict, const index_type * const restrict,
198*b1e83836Smrg gfc_array_l1 * const restrict);
199*b1e83836Smrg export_proto(msum_c17);
200*b1e83836Smrg
201*b1e83836Smrg void
msum_c17(gfc_array_c17 * const restrict retarray,gfc_array_c17 * const restrict array,const index_type * const restrict pdim,gfc_array_l1 * const restrict mask)202*b1e83836Smrg msum_c17 (gfc_array_c17 * const restrict retarray,
203*b1e83836Smrg gfc_array_c17 * const restrict array,
204*b1e83836Smrg const index_type * const restrict pdim,
205*b1e83836Smrg gfc_array_l1 * const restrict mask)
206*b1e83836Smrg {
207*b1e83836Smrg index_type count[GFC_MAX_DIMENSIONS];
208*b1e83836Smrg index_type extent[GFC_MAX_DIMENSIONS];
209*b1e83836Smrg index_type sstride[GFC_MAX_DIMENSIONS];
210*b1e83836Smrg index_type dstride[GFC_MAX_DIMENSIONS];
211*b1e83836Smrg index_type mstride[GFC_MAX_DIMENSIONS];
212*b1e83836Smrg GFC_COMPLEX_17 * restrict dest;
213*b1e83836Smrg const GFC_COMPLEX_17 * restrict base;
214*b1e83836Smrg const GFC_LOGICAL_1 * restrict mbase;
215*b1e83836Smrg index_type rank;
216*b1e83836Smrg index_type dim;
217*b1e83836Smrg index_type n;
218*b1e83836Smrg index_type len;
219*b1e83836Smrg index_type delta;
220*b1e83836Smrg index_type mdelta;
221*b1e83836Smrg int mask_kind;
222*b1e83836Smrg
223*b1e83836Smrg if (mask == NULL)
224*b1e83836Smrg {
225*b1e83836Smrg #ifdef HAVE_BACK_ARG
226*b1e83836Smrg sum_c17 (retarray, array, pdim, back);
227*b1e83836Smrg #else
228*b1e83836Smrg sum_c17 (retarray, array, pdim);
229*b1e83836Smrg #endif
230*b1e83836Smrg return;
231*b1e83836Smrg }
232*b1e83836Smrg
233*b1e83836Smrg dim = (*pdim) - 1;
234*b1e83836Smrg rank = GFC_DESCRIPTOR_RANK (array) - 1;
235*b1e83836Smrg
236*b1e83836Smrg
237*b1e83836Smrg if (unlikely (dim < 0 || dim > rank))
238*b1e83836Smrg {
239*b1e83836Smrg runtime_error ("Dim argument incorrect in SUM intrinsic: "
240*b1e83836Smrg "is %ld, should be between 1 and %ld",
241*b1e83836Smrg (long int) dim + 1, (long int) rank + 1);
242*b1e83836Smrg }
243*b1e83836Smrg
244*b1e83836Smrg len = GFC_DESCRIPTOR_EXTENT(array,dim);
245*b1e83836Smrg if (len <= 0)
246*b1e83836Smrg return;
247*b1e83836Smrg
248*b1e83836Smrg mbase = mask->base_addr;
249*b1e83836Smrg
250*b1e83836Smrg mask_kind = GFC_DESCRIPTOR_SIZE (mask);
251*b1e83836Smrg
252*b1e83836Smrg if (mask_kind == 1 || mask_kind == 2 || mask_kind == 4 || mask_kind == 8
253*b1e83836Smrg #ifdef HAVE_GFC_LOGICAL_16
254*b1e83836Smrg || mask_kind == 16
255*b1e83836Smrg #endif
256*b1e83836Smrg )
257*b1e83836Smrg mbase = GFOR_POINTER_TO_L1 (mbase, mask_kind);
258*b1e83836Smrg else
259*b1e83836Smrg runtime_error ("Funny sized logical array");
260*b1e83836Smrg
261*b1e83836Smrg delta = GFC_DESCRIPTOR_STRIDE(array,dim);
262*b1e83836Smrg mdelta = GFC_DESCRIPTOR_STRIDE_BYTES(mask,dim);
263*b1e83836Smrg
264*b1e83836Smrg for (n = 0; n < dim; n++)
265*b1e83836Smrg {
266*b1e83836Smrg sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n);
267*b1e83836Smrg mstride[n] = GFC_DESCRIPTOR_STRIDE_BYTES(mask,n);
268*b1e83836Smrg extent[n] = GFC_DESCRIPTOR_EXTENT(array,n);
269*b1e83836Smrg
270*b1e83836Smrg if (extent[n] < 0)
271*b1e83836Smrg extent[n] = 0;
272*b1e83836Smrg
273*b1e83836Smrg }
274*b1e83836Smrg for (n = dim; n < rank; n++)
275*b1e83836Smrg {
276*b1e83836Smrg sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n + 1);
277*b1e83836Smrg mstride[n] = GFC_DESCRIPTOR_STRIDE_BYTES(mask, n + 1);
278*b1e83836Smrg extent[n] = GFC_DESCRIPTOR_EXTENT(array, n + 1);
279*b1e83836Smrg
280*b1e83836Smrg if (extent[n] < 0)
281*b1e83836Smrg extent[n] = 0;
282*b1e83836Smrg }
283*b1e83836Smrg
284*b1e83836Smrg if (retarray->base_addr == NULL)
285*b1e83836Smrg {
286*b1e83836Smrg size_t alloc_size, str;
287*b1e83836Smrg
288*b1e83836Smrg for (n = 0; n < rank; n++)
289*b1e83836Smrg {
290*b1e83836Smrg if (n == 0)
291*b1e83836Smrg str = 1;
292*b1e83836Smrg else
293*b1e83836Smrg str= GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1];
294*b1e83836Smrg
295*b1e83836Smrg GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str);
296*b1e83836Smrg
297*b1e83836Smrg }
298*b1e83836Smrg
299*b1e83836Smrg alloc_size = GFC_DESCRIPTOR_STRIDE(retarray,rank-1) * extent[rank-1];
300*b1e83836Smrg
301*b1e83836Smrg retarray->offset = 0;
302*b1e83836Smrg retarray->dtype.rank = rank;
303*b1e83836Smrg
304*b1e83836Smrg if (alloc_size == 0)
305*b1e83836Smrg {
306*b1e83836Smrg /* Make sure we have a zero-sized array. */
307*b1e83836Smrg GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1);
308*b1e83836Smrg return;
309*b1e83836Smrg }
310*b1e83836Smrg else
311*b1e83836Smrg retarray->base_addr = xmallocarray (alloc_size, sizeof (GFC_COMPLEX_17));
312*b1e83836Smrg
313*b1e83836Smrg }
314*b1e83836Smrg else
315*b1e83836Smrg {
316*b1e83836Smrg if (rank != GFC_DESCRIPTOR_RANK (retarray))
317*b1e83836Smrg runtime_error ("rank of return array incorrect in SUM intrinsic");
318*b1e83836Smrg
319*b1e83836Smrg if (unlikely (compile_options.bounds_check))
320*b1e83836Smrg {
321*b1e83836Smrg bounds_ifunction_return ((array_t *) retarray, extent,
322*b1e83836Smrg "return value", "SUM");
323*b1e83836Smrg bounds_equal_extents ((array_t *) mask, (array_t *) array,
324*b1e83836Smrg "MASK argument", "SUM");
325*b1e83836Smrg }
326*b1e83836Smrg }
327*b1e83836Smrg
328*b1e83836Smrg for (n = 0; n < rank; n++)
329*b1e83836Smrg {
330*b1e83836Smrg count[n] = 0;
331*b1e83836Smrg dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n);
332*b1e83836Smrg if (extent[n] <= 0)
333*b1e83836Smrg return;
334*b1e83836Smrg }
335*b1e83836Smrg
336*b1e83836Smrg dest = retarray->base_addr;
337*b1e83836Smrg base = array->base_addr;
338*b1e83836Smrg
339*b1e83836Smrg while (base)
340*b1e83836Smrg {
341*b1e83836Smrg const GFC_COMPLEX_17 * restrict src;
342*b1e83836Smrg const GFC_LOGICAL_1 * restrict msrc;
343*b1e83836Smrg GFC_COMPLEX_17 result;
344*b1e83836Smrg src = base;
345*b1e83836Smrg msrc = mbase;
346*b1e83836Smrg {
347*b1e83836Smrg
348*b1e83836Smrg result = 0;
349*b1e83836Smrg for (n = 0; n < len; n++, src += delta, msrc += mdelta)
350*b1e83836Smrg {
351*b1e83836Smrg
352*b1e83836Smrg if (*msrc)
353*b1e83836Smrg result += *src;
354*b1e83836Smrg }
355*b1e83836Smrg *dest = result;
356*b1e83836Smrg }
357*b1e83836Smrg /* Advance to the next element. */
358*b1e83836Smrg count[0]++;
359*b1e83836Smrg base += sstride[0];
360*b1e83836Smrg mbase += mstride[0];
361*b1e83836Smrg dest += dstride[0];
362*b1e83836Smrg n = 0;
363*b1e83836Smrg while (count[n] == extent[n])
364*b1e83836Smrg {
365*b1e83836Smrg /* When we get to the end of a dimension, reset it and increment
366*b1e83836Smrg the next dimension. */
367*b1e83836Smrg count[n] = 0;
368*b1e83836Smrg /* We could precalculate these products, but this is a less
369*b1e83836Smrg frequently used path so probably not worth it. */
370*b1e83836Smrg base -= sstride[n] * extent[n];
371*b1e83836Smrg mbase -= mstride[n] * extent[n];
372*b1e83836Smrg dest -= dstride[n] * extent[n];
373*b1e83836Smrg n++;
374*b1e83836Smrg if (n >= rank)
375*b1e83836Smrg {
376*b1e83836Smrg /* Break out of the loop. */
377*b1e83836Smrg base = NULL;
378*b1e83836Smrg break;
379*b1e83836Smrg }
380*b1e83836Smrg else
381*b1e83836Smrg {
382*b1e83836Smrg count[n]++;
383*b1e83836Smrg base += sstride[n];
384*b1e83836Smrg mbase += mstride[n];
385*b1e83836Smrg dest += dstride[n];
386*b1e83836Smrg }
387*b1e83836Smrg }
388*b1e83836Smrg }
389*b1e83836Smrg }
390*b1e83836Smrg
391*b1e83836Smrg
392*b1e83836Smrg extern void ssum_c17 (gfc_array_c17 * const restrict,
393*b1e83836Smrg gfc_array_c17 * const restrict, const index_type * const restrict,
394*b1e83836Smrg GFC_LOGICAL_4 *);
395*b1e83836Smrg export_proto(ssum_c17);
396*b1e83836Smrg
397*b1e83836Smrg void
ssum_c17(gfc_array_c17 * const restrict retarray,gfc_array_c17 * const restrict array,const index_type * const restrict pdim,GFC_LOGICAL_4 * mask)398*b1e83836Smrg ssum_c17 (gfc_array_c17 * const restrict retarray,
399*b1e83836Smrg gfc_array_c17 * const restrict array,
400*b1e83836Smrg const index_type * const restrict pdim,
401*b1e83836Smrg GFC_LOGICAL_4 * mask)
402*b1e83836Smrg {
403*b1e83836Smrg index_type count[GFC_MAX_DIMENSIONS];
404*b1e83836Smrg index_type extent[GFC_MAX_DIMENSIONS];
405*b1e83836Smrg index_type dstride[GFC_MAX_DIMENSIONS];
406*b1e83836Smrg GFC_COMPLEX_17 * restrict dest;
407*b1e83836Smrg index_type rank;
408*b1e83836Smrg index_type n;
409*b1e83836Smrg index_type dim;
410*b1e83836Smrg
411*b1e83836Smrg
412*b1e83836Smrg if (mask == NULL || *mask)
413*b1e83836Smrg {
414*b1e83836Smrg #ifdef HAVE_BACK_ARG
415*b1e83836Smrg sum_c17 (retarray, array, pdim, back);
416*b1e83836Smrg #else
417*b1e83836Smrg sum_c17 (retarray, array, pdim);
418*b1e83836Smrg #endif
419*b1e83836Smrg return;
420*b1e83836Smrg }
421*b1e83836Smrg /* Make dim zero based to avoid confusion. */
422*b1e83836Smrg dim = (*pdim) - 1;
423*b1e83836Smrg rank = GFC_DESCRIPTOR_RANK (array) - 1;
424*b1e83836Smrg
425*b1e83836Smrg if (unlikely (dim < 0 || dim > rank))
426*b1e83836Smrg {
427*b1e83836Smrg runtime_error ("Dim argument incorrect in SUM intrinsic: "
428*b1e83836Smrg "is %ld, should be between 1 and %ld",
429*b1e83836Smrg (long int) dim + 1, (long int) rank + 1);
430*b1e83836Smrg }
431*b1e83836Smrg
432*b1e83836Smrg for (n = 0; n < dim; n++)
433*b1e83836Smrg {
434*b1e83836Smrg extent[n] = GFC_DESCRIPTOR_EXTENT(array,n);
435*b1e83836Smrg
436*b1e83836Smrg if (extent[n] <= 0)
437*b1e83836Smrg extent[n] = 0;
438*b1e83836Smrg }
439*b1e83836Smrg
440*b1e83836Smrg for (n = dim; n < rank; n++)
441*b1e83836Smrg {
442*b1e83836Smrg extent[n] =
443*b1e83836Smrg GFC_DESCRIPTOR_EXTENT(array,n + 1);
444*b1e83836Smrg
445*b1e83836Smrg if (extent[n] <= 0)
446*b1e83836Smrg extent[n] = 0;
447*b1e83836Smrg }
448*b1e83836Smrg
449*b1e83836Smrg if (retarray->base_addr == NULL)
450*b1e83836Smrg {
451*b1e83836Smrg size_t alloc_size, str;
452*b1e83836Smrg
453*b1e83836Smrg for (n = 0; n < rank; n++)
454*b1e83836Smrg {
455*b1e83836Smrg if (n == 0)
456*b1e83836Smrg str = 1;
457*b1e83836Smrg else
458*b1e83836Smrg str = GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1];
459*b1e83836Smrg
460*b1e83836Smrg GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str);
461*b1e83836Smrg
462*b1e83836Smrg }
463*b1e83836Smrg
464*b1e83836Smrg retarray->offset = 0;
465*b1e83836Smrg retarray->dtype.rank = rank;
466*b1e83836Smrg
467*b1e83836Smrg alloc_size = GFC_DESCRIPTOR_STRIDE(retarray,rank-1) * extent[rank-1];
468*b1e83836Smrg
469*b1e83836Smrg if (alloc_size == 0)
470*b1e83836Smrg {
471*b1e83836Smrg /* Make sure we have a zero-sized array. */
472*b1e83836Smrg GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1);
473*b1e83836Smrg return;
474*b1e83836Smrg }
475*b1e83836Smrg else
476*b1e83836Smrg retarray->base_addr = xmallocarray (alloc_size, sizeof (GFC_COMPLEX_17));
477*b1e83836Smrg }
478*b1e83836Smrg else
479*b1e83836Smrg {
480*b1e83836Smrg if (rank != GFC_DESCRIPTOR_RANK (retarray))
481*b1e83836Smrg runtime_error ("rank of return array incorrect in"
482*b1e83836Smrg " SUM intrinsic: is %ld, should be %ld",
483*b1e83836Smrg (long int) (GFC_DESCRIPTOR_RANK (retarray)),
484*b1e83836Smrg (long int) rank);
485*b1e83836Smrg
486*b1e83836Smrg if (unlikely (compile_options.bounds_check))
487*b1e83836Smrg {
488*b1e83836Smrg for (n=0; n < rank; n++)
489*b1e83836Smrg {
490*b1e83836Smrg index_type ret_extent;
491*b1e83836Smrg
492*b1e83836Smrg ret_extent = GFC_DESCRIPTOR_EXTENT(retarray,n);
493*b1e83836Smrg if (extent[n] != ret_extent)
494*b1e83836Smrg runtime_error ("Incorrect extent in return value of"
495*b1e83836Smrg " SUM intrinsic in dimension %ld:"
496*b1e83836Smrg " is %ld, should be %ld", (long int) n + 1,
497*b1e83836Smrg (long int) ret_extent, (long int) extent[n]);
498*b1e83836Smrg }
499*b1e83836Smrg }
500*b1e83836Smrg }
501*b1e83836Smrg
502*b1e83836Smrg for (n = 0; n < rank; n++)
503*b1e83836Smrg {
504*b1e83836Smrg count[n] = 0;
505*b1e83836Smrg dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n);
506*b1e83836Smrg }
507*b1e83836Smrg
508*b1e83836Smrg dest = retarray->base_addr;
509*b1e83836Smrg
510*b1e83836Smrg while(1)
511*b1e83836Smrg {
512*b1e83836Smrg *dest = 0;
513*b1e83836Smrg count[0]++;
514*b1e83836Smrg dest += dstride[0];
515*b1e83836Smrg n = 0;
516*b1e83836Smrg while (count[n] == extent[n])
517*b1e83836Smrg {
518*b1e83836Smrg /* When we get to the end of a dimension, reset it and increment
519*b1e83836Smrg the next dimension. */
520*b1e83836Smrg count[n] = 0;
521*b1e83836Smrg /* We could precalculate these products, but this is a less
522*b1e83836Smrg frequently used path so probably not worth it. */
523*b1e83836Smrg dest -= dstride[n] * extent[n];
524*b1e83836Smrg n++;
525*b1e83836Smrg if (n >= rank)
526*b1e83836Smrg return;
527*b1e83836Smrg else
528*b1e83836Smrg {
529*b1e83836Smrg count[n]++;
530*b1e83836Smrg dest += dstride[n];
531*b1e83836Smrg }
532*b1e83836Smrg }
533*b1e83836Smrg }
534*b1e83836Smrg }
535*b1e83836Smrg
536*b1e83836Smrg #endif
537