xref: /netbsd-src/external/gpl3/gcc/dist/libgfortran/generated/sum_c17.c (revision b1e838363e3c6fc78a55519254d99869742dd33c)
1*b1e83836Smrg /* Implementation of the SUM intrinsic
2*b1e83836Smrg    Copyright (C) 2002-2022 Free Software Foundation, Inc.
3*b1e83836Smrg    Contributed by Paul Brook <paul@nowt.org>
4*b1e83836Smrg 
5*b1e83836Smrg This file is part of the GNU Fortran 95 runtime library (libgfortran).
6*b1e83836Smrg 
7*b1e83836Smrg Libgfortran is free software; you can redistribute it and/or
8*b1e83836Smrg modify it under the terms of the GNU General Public
9*b1e83836Smrg License as published by the Free Software Foundation; either
10*b1e83836Smrg version 3 of the License, or (at your option) any later version.
11*b1e83836Smrg 
12*b1e83836Smrg Libgfortran is distributed in the hope that it will be useful,
13*b1e83836Smrg but WITHOUT ANY WARRANTY; without even the implied warranty of
14*b1e83836Smrg MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15*b1e83836Smrg GNU General Public License for more details.
16*b1e83836Smrg 
17*b1e83836Smrg Under Section 7 of GPL version 3, you are granted additional
18*b1e83836Smrg permissions described in the GCC Runtime Library Exception, version
19*b1e83836Smrg 3.1, as published by the Free Software Foundation.
20*b1e83836Smrg 
21*b1e83836Smrg You should have received a copy of the GNU General Public License and
22*b1e83836Smrg a copy of the GCC Runtime Library Exception along with this program;
23*b1e83836Smrg see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
24*b1e83836Smrg <http://www.gnu.org/licenses/>.  */
25*b1e83836Smrg 
26*b1e83836Smrg #include "libgfortran.h"
27*b1e83836Smrg 
28*b1e83836Smrg 
29*b1e83836Smrg #if defined (HAVE_GFC_COMPLEX_17) && defined (HAVE_GFC_COMPLEX_17)
30*b1e83836Smrg 
31*b1e83836Smrg 
32*b1e83836Smrg extern void sum_c17 (gfc_array_c17 * const restrict,
33*b1e83836Smrg 	gfc_array_c17 * const restrict, const index_type * const restrict);
34*b1e83836Smrg export_proto(sum_c17);
35*b1e83836Smrg 
36*b1e83836Smrg void
sum_c17(gfc_array_c17 * const restrict retarray,gfc_array_c17 * const restrict array,const index_type * const restrict pdim)37*b1e83836Smrg sum_c17 (gfc_array_c17 * const restrict retarray,
38*b1e83836Smrg 	gfc_array_c17 * const restrict array,
39*b1e83836Smrg 	const index_type * const restrict pdim)
40*b1e83836Smrg {
41*b1e83836Smrg   index_type count[GFC_MAX_DIMENSIONS];
42*b1e83836Smrg   index_type extent[GFC_MAX_DIMENSIONS];
43*b1e83836Smrg   index_type sstride[GFC_MAX_DIMENSIONS];
44*b1e83836Smrg   index_type dstride[GFC_MAX_DIMENSIONS];
45*b1e83836Smrg   const GFC_COMPLEX_17 * restrict base;
46*b1e83836Smrg   GFC_COMPLEX_17 * restrict dest;
47*b1e83836Smrg   index_type rank;
48*b1e83836Smrg   index_type n;
49*b1e83836Smrg   index_type len;
50*b1e83836Smrg   index_type delta;
51*b1e83836Smrg   index_type dim;
52*b1e83836Smrg   int continue_loop;
53*b1e83836Smrg 
54*b1e83836Smrg   /* Make dim zero based to avoid confusion.  */
55*b1e83836Smrg   rank = GFC_DESCRIPTOR_RANK (array) - 1;
56*b1e83836Smrg   dim = (*pdim) - 1;
57*b1e83836Smrg 
58*b1e83836Smrg   if (unlikely (dim < 0 || dim > rank))
59*b1e83836Smrg     {
60*b1e83836Smrg       runtime_error ("Dim argument incorrect in SUM intrinsic: "
61*b1e83836Smrg  		     "is %ld, should be between 1 and %ld",
62*b1e83836Smrg 		     (long int) dim + 1, (long int) rank + 1);
63*b1e83836Smrg     }
64*b1e83836Smrg 
65*b1e83836Smrg   len = GFC_DESCRIPTOR_EXTENT(array,dim);
66*b1e83836Smrg   if (len < 0)
67*b1e83836Smrg     len = 0;
68*b1e83836Smrg   delta = GFC_DESCRIPTOR_STRIDE(array,dim);
69*b1e83836Smrg 
70*b1e83836Smrg   for (n = 0; n < dim; n++)
71*b1e83836Smrg     {
72*b1e83836Smrg       sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n);
73*b1e83836Smrg       extent[n] = GFC_DESCRIPTOR_EXTENT(array,n);
74*b1e83836Smrg 
75*b1e83836Smrg       if (extent[n] < 0)
76*b1e83836Smrg 	extent[n] = 0;
77*b1e83836Smrg     }
78*b1e83836Smrg   for (n = dim; n < rank; n++)
79*b1e83836Smrg     {
80*b1e83836Smrg       sstride[n] = GFC_DESCRIPTOR_STRIDE(array, n + 1);
81*b1e83836Smrg       extent[n] = GFC_DESCRIPTOR_EXTENT(array, n + 1);
82*b1e83836Smrg 
83*b1e83836Smrg       if (extent[n] < 0)
84*b1e83836Smrg 	extent[n] = 0;
85*b1e83836Smrg     }
86*b1e83836Smrg 
87*b1e83836Smrg   if (retarray->base_addr == NULL)
88*b1e83836Smrg     {
89*b1e83836Smrg       size_t alloc_size, str;
90*b1e83836Smrg 
91*b1e83836Smrg       for (n = 0; n < rank; n++)
92*b1e83836Smrg 	{
93*b1e83836Smrg 	  if (n == 0)
94*b1e83836Smrg 	    str = 1;
95*b1e83836Smrg 	  else
96*b1e83836Smrg 	    str = GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1];
97*b1e83836Smrg 
98*b1e83836Smrg 	  GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str);
99*b1e83836Smrg 
100*b1e83836Smrg 	}
101*b1e83836Smrg 
102*b1e83836Smrg       retarray->offset = 0;
103*b1e83836Smrg       retarray->dtype.rank = rank;
104*b1e83836Smrg 
105*b1e83836Smrg       alloc_size = GFC_DESCRIPTOR_STRIDE(retarray,rank-1) * extent[rank-1];
106*b1e83836Smrg 
107*b1e83836Smrg       retarray->base_addr = xmallocarray (alloc_size, sizeof (GFC_COMPLEX_17));
108*b1e83836Smrg       if (alloc_size == 0)
109*b1e83836Smrg 	{
110*b1e83836Smrg 	  /* Make sure we have a zero-sized array.  */
111*b1e83836Smrg 	  GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1);
112*b1e83836Smrg 	  return;
113*b1e83836Smrg 
114*b1e83836Smrg 	}
115*b1e83836Smrg     }
116*b1e83836Smrg   else
117*b1e83836Smrg     {
118*b1e83836Smrg       if (rank != GFC_DESCRIPTOR_RANK (retarray))
119*b1e83836Smrg 	runtime_error ("rank of return array incorrect in"
120*b1e83836Smrg 		       " SUM intrinsic: is %ld, should be %ld",
121*b1e83836Smrg 		       (long int) (GFC_DESCRIPTOR_RANK (retarray)),
122*b1e83836Smrg 		       (long int) rank);
123*b1e83836Smrg 
124*b1e83836Smrg       if (unlikely (compile_options.bounds_check))
125*b1e83836Smrg 	bounds_ifunction_return ((array_t *) retarray, extent,
126*b1e83836Smrg 				 "return value", "SUM");
127*b1e83836Smrg     }
128*b1e83836Smrg 
129*b1e83836Smrg   for (n = 0; n < rank; n++)
130*b1e83836Smrg     {
131*b1e83836Smrg       count[n] = 0;
132*b1e83836Smrg       dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n);
133*b1e83836Smrg       if (extent[n] <= 0)
134*b1e83836Smrg 	return;
135*b1e83836Smrg     }
136*b1e83836Smrg 
137*b1e83836Smrg   base = array->base_addr;
138*b1e83836Smrg   dest = retarray->base_addr;
139*b1e83836Smrg 
140*b1e83836Smrg   continue_loop = 1;
141*b1e83836Smrg   while (continue_loop)
142*b1e83836Smrg     {
143*b1e83836Smrg       const GFC_COMPLEX_17 * restrict src;
144*b1e83836Smrg       GFC_COMPLEX_17 result;
145*b1e83836Smrg       src = base;
146*b1e83836Smrg       {
147*b1e83836Smrg 
148*b1e83836Smrg   result = 0;
149*b1e83836Smrg 	if (len <= 0)
150*b1e83836Smrg 	  *dest = 0;
151*b1e83836Smrg 	else
152*b1e83836Smrg 	  {
153*b1e83836Smrg #if ! defined HAVE_BACK_ARG
154*b1e83836Smrg 	    for (n = 0; n < len; n++, src += delta)
155*b1e83836Smrg 	      {
156*b1e83836Smrg #endif
157*b1e83836Smrg 
158*b1e83836Smrg   result += *src;
159*b1e83836Smrg 	      }
160*b1e83836Smrg 
161*b1e83836Smrg 	    *dest = result;
162*b1e83836Smrg 	  }
163*b1e83836Smrg       }
164*b1e83836Smrg       /* Advance to the next element.  */
165*b1e83836Smrg       count[0]++;
166*b1e83836Smrg       base += sstride[0];
167*b1e83836Smrg       dest += dstride[0];
168*b1e83836Smrg       n = 0;
169*b1e83836Smrg       while (count[n] == extent[n])
170*b1e83836Smrg 	{
171*b1e83836Smrg 	  /* When we get to the end of a dimension, reset it and increment
172*b1e83836Smrg 	     the next dimension.  */
173*b1e83836Smrg 	  count[n] = 0;
174*b1e83836Smrg 	  /* We could precalculate these products, but this is a less
175*b1e83836Smrg 	     frequently used path so probably not worth it.  */
176*b1e83836Smrg 	  base -= sstride[n] * extent[n];
177*b1e83836Smrg 	  dest -= dstride[n] * extent[n];
178*b1e83836Smrg 	  n++;
179*b1e83836Smrg 	  if (n >= rank)
180*b1e83836Smrg 	    {
181*b1e83836Smrg 	      /* Break out of the loop.  */
182*b1e83836Smrg 	      continue_loop = 0;
183*b1e83836Smrg 	      break;
184*b1e83836Smrg 	    }
185*b1e83836Smrg 	  else
186*b1e83836Smrg 	    {
187*b1e83836Smrg 	      count[n]++;
188*b1e83836Smrg 	      base += sstride[n];
189*b1e83836Smrg 	      dest += dstride[n];
190*b1e83836Smrg 	    }
191*b1e83836Smrg 	}
192*b1e83836Smrg     }
193*b1e83836Smrg }
194*b1e83836Smrg 
195*b1e83836Smrg 
196*b1e83836Smrg extern void msum_c17 (gfc_array_c17 * const restrict,
197*b1e83836Smrg 	gfc_array_c17 * const restrict, const index_type * const restrict,
198*b1e83836Smrg 	gfc_array_l1 * const restrict);
199*b1e83836Smrg export_proto(msum_c17);
200*b1e83836Smrg 
201*b1e83836Smrg void
msum_c17(gfc_array_c17 * const restrict retarray,gfc_array_c17 * const restrict array,const index_type * const restrict pdim,gfc_array_l1 * const restrict mask)202*b1e83836Smrg msum_c17 (gfc_array_c17 * const restrict retarray,
203*b1e83836Smrg 	gfc_array_c17 * const restrict array,
204*b1e83836Smrg 	const index_type * const restrict pdim,
205*b1e83836Smrg 	gfc_array_l1 * const restrict mask)
206*b1e83836Smrg {
207*b1e83836Smrg   index_type count[GFC_MAX_DIMENSIONS];
208*b1e83836Smrg   index_type extent[GFC_MAX_DIMENSIONS];
209*b1e83836Smrg   index_type sstride[GFC_MAX_DIMENSIONS];
210*b1e83836Smrg   index_type dstride[GFC_MAX_DIMENSIONS];
211*b1e83836Smrg   index_type mstride[GFC_MAX_DIMENSIONS];
212*b1e83836Smrg   GFC_COMPLEX_17 * restrict dest;
213*b1e83836Smrg   const GFC_COMPLEX_17 * restrict base;
214*b1e83836Smrg   const GFC_LOGICAL_1 * restrict mbase;
215*b1e83836Smrg   index_type rank;
216*b1e83836Smrg   index_type dim;
217*b1e83836Smrg   index_type n;
218*b1e83836Smrg   index_type len;
219*b1e83836Smrg   index_type delta;
220*b1e83836Smrg   index_type mdelta;
221*b1e83836Smrg   int mask_kind;
222*b1e83836Smrg 
223*b1e83836Smrg   if (mask == NULL)
224*b1e83836Smrg     {
225*b1e83836Smrg #ifdef HAVE_BACK_ARG
226*b1e83836Smrg       sum_c17 (retarray, array, pdim, back);
227*b1e83836Smrg #else
228*b1e83836Smrg       sum_c17 (retarray, array, pdim);
229*b1e83836Smrg #endif
230*b1e83836Smrg       return;
231*b1e83836Smrg     }
232*b1e83836Smrg 
233*b1e83836Smrg   dim = (*pdim) - 1;
234*b1e83836Smrg   rank = GFC_DESCRIPTOR_RANK (array) - 1;
235*b1e83836Smrg 
236*b1e83836Smrg 
237*b1e83836Smrg   if (unlikely (dim < 0 || dim > rank))
238*b1e83836Smrg     {
239*b1e83836Smrg       runtime_error ("Dim argument incorrect in SUM intrinsic: "
240*b1e83836Smrg  		     "is %ld, should be between 1 and %ld",
241*b1e83836Smrg 		     (long int) dim + 1, (long int) rank + 1);
242*b1e83836Smrg     }
243*b1e83836Smrg 
244*b1e83836Smrg   len = GFC_DESCRIPTOR_EXTENT(array,dim);
245*b1e83836Smrg   if (len <= 0)
246*b1e83836Smrg     return;
247*b1e83836Smrg 
248*b1e83836Smrg   mbase = mask->base_addr;
249*b1e83836Smrg 
250*b1e83836Smrg   mask_kind = GFC_DESCRIPTOR_SIZE (mask);
251*b1e83836Smrg 
252*b1e83836Smrg   if (mask_kind == 1 || mask_kind == 2 || mask_kind == 4 || mask_kind == 8
253*b1e83836Smrg #ifdef HAVE_GFC_LOGICAL_16
254*b1e83836Smrg       || mask_kind == 16
255*b1e83836Smrg #endif
256*b1e83836Smrg       )
257*b1e83836Smrg     mbase = GFOR_POINTER_TO_L1 (mbase, mask_kind);
258*b1e83836Smrg   else
259*b1e83836Smrg     runtime_error ("Funny sized logical array");
260*b1e83836Smrg 
261*b1e83836Smrg   delta = GFC_DESCRIPTOR_STRIDE(array,dim);
262*b1e83836Smrg   mdelta = GFC_DESCRIPTOR_STRIDE_BYTES(mask,dim);
263*b1e83836Smrg 
264*b1e83836Smrg   for (n = 0; n < dim; n++)
265*b1e83836Smrg     {
266*b1e83836Smrg       sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n);
267*b1e83836Smrg       mstride[n] = GFC_DESCRIPTOR_STRIDE_BYTES(mask,n);
268*b1e83836Smrg       extent[n] = GFC_DESCRIPTOR_EXTENT(array,n);
269*b1e83836Smrg 
270*b1e83836Smrg       if (extent[n] < 0)
271*b1e83836Smrg 	extent[n] = 0;
272*b1e83836Smrg 
273*b1e83836Smrg     }
274*b1e83836Smrg   for (n = dim; n < rank; n++)
275*b1e83836Smrg     {
276*b1e83836Smrg       sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n + 1);
277*b1e83836Smrg       mstride[n] = GFC_DESCRIPTOR_STRIDE_BYTES(mask, n + 1);
278*b1e83836Smrg       extent[n] = GFC_DESCRIPTOR_EXTENT(array, n + 1);
279*b1e83836Smrg 
280*b1e83836Smrg       if (extent[n] < 0)
281*b1e83836Smrg 	extent[n] = 0;
282*b1e83836Smrg     }
283*b1e83836Smrg 
284*b1e83836Smrg   if (retarray->base_addr == NULL)
285*b1e83836Smrg     {
286*b1e83836Smrg       size_t alloc_size, str;
287*b1e83836Smrg 
288*b1e83836Smrg       for (n = 0; n < rank; n++)
289*b1e83836Smrg 	{
290*b1e83836Smrg 	  if (n == 0)
291*b1e83836Smrg 	    str = 1;
292*b1e83836Smrg 	  else
293*b1e83836Smrg 	    str= GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1];
294*b1e83836Smrg 
295*b1e83836Smrg 	  GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str);
296*b1e83836Smrg 
297*b1e83836Smrg 	}
298*b1e83836Smrg 
299*b1e83836Smrg       alloc_size = GFC_DESCRIPTOR_STRIDE(retarray,rank-1) * extent[rank-1];
300*b1e83836Smrg 
301*b1e83836Smrg       retarray->offset = 0;
302*b1e83836Smrg       retarray->dtype.rank = rank;
303*b1e83836Smrg 
304*b1e83836Smrg       if (alloc_size == 0)
305*b1e83836Smrg 	{
306*b1e83836Smrg 	  /* Make sure we have a zero-sized array.  */
307*b1e83836Smrg 	  GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1);
308*b1e83836Smrg 	  return;
309*b1e83836Smrg 	}
310*b1e83836Smrg       else
311*b1e83836Smrg 	retarray->base_addr = xmallocarray (alloc_size, sizeof (GFC_COMPLEX_17));
312*b1e83836Smrg 
313*b1e83836Smrg     }
314*b1e83836Smrg   else
315*b1e83836Smrg     {
316*b1e83836Smrg       if (rank != GFC_DESCRIPTOR_RANK (retarray))
317*b1e83836Smrg 	runtime_error ("rank of return array incorrect in SUM intrinsic");
318*b1e83836Smrg 
319*b1e83836Smrg       if (unlikely (compile_options.bounds_check))
320*b1e83836Smrg 	{
321*b1e83836Smrg 	  bounds_ifunction_return ((array_t *) retarray, extent,
322*b1e83836Smrg 				   "return value", "SUM");
323*b1e83836Smrg 	  bounds_equal_extents ((array_t *) mask, (array_t *) array,
324*b1e83836Smrg 	  			"MASK argument", "SUM");
325*b1e83836Smrg 	}
326*b1e83836Smrg     }
327*b1e83836Smrg 
328*b1e83836Smrg   for (n = 0; n < rank; n++)
329*b1e83836Smrg     {
330*b1e83836Smrg       count[n] = 0;
331*b1e83836Smrg       dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n);
332*b1e83836Smrg       if (extent[n] <= 0)
333*b1e83836Smrg 	return;
334*b1e83836Smrg     }
335*b1e83836Smrg 
336*b1e83836Smrg   dest = retarray->base_addr;
337*b1e83836Smrg   base = array->base_addr;
338*b1e83836Smrg 
339*b1e83836Smrg   while (base)
340*b1e83836Smrg     {
341*b1e83836Smrg       const GFC_COMPLEX_17 * restrict src;
342*b1e83836Smrg       const GFC_LOGICAL_1 * restrict msrc;
343*b1e83836Smrg       GFC_COMPLEX_17 result;
344*b1e83836Smrg       src = base;
345*b1e83836Smrg       msrc = mbase;
346*b1e83836Smrg       {
347*b1e83836Smrg 
348*b1e83836Smrg   result = 0;
349*b1e83836Smrg 	for (n = 0; n < len; n++, src += delta, msrc += mdelta)
350*b1e83836Smrg 	  {
351*b1e83836Smrg 
352*b1e83836Smrg   if (*msrc)
353*b1e83836Smrg     result += *src;
354*b1e83836Smrg 	  }
355*b1e83836Smrg 	*dest = result;
356*b1e83836Smrg       }
357*b1e83836Smrg       /* Advance to the next element.  */
358*b1e83836Smrg       count[0]++;
359*b1e83836Smrg       base += sstride[0];
360*b1e83836Smrg       mbase += mstride[0];
361*b1e83836Smrg       dest += dstride[0];
362*b1e83836Smrg       n = 0;
363*b1e83836Smrg       while (count[n] == extent[n])
364*b1e83836Smrg 	{
365*b1e83836Smrg 	  /* When we get to the end of a dimension, reset it and increment
366*b1e83836Smrg 	     the next dimension.  */
367*b1e83836Smrg 	  count[n] = 0;
368*b1e83836Smrg 	  /* We could precalculate these products, but this is a less
369*b1e83836Smrg 	     frequently used path so probably not worth it.  */
370*b1e83836Smrg 	  base -= sstride[n] * extent[n];
371*b1e83836Smrg 	  mbase -= mstride[n] * extent[n];
372*b1e83836Smrg 	  dest -= dstride[n] * extent[n];
373*b1e83836Smrg 	  n++;
374*b1e83836Smrg 	  if (n >= rank)
375*b1e83836Smrg 	    {
376*b1e83836Smrg 	      /* Break out of the loop.  */
377*b1e83836Smrg 	      base = NULL;
378*b1e83836Smrg 	      break;
379*b1e83836Smrg 	    }
380*b1e83836Smrg 	  else
381*b1e83836Smrg 	    {
382*b1e83836Smrg 	      count[n]++;
383*b1e83836Smrg 	      base += sstride[n];
384*b1e83836Smrg 	      mbase += mstride[n];
385*b1e83836Smrg 	      dest += dstride[n];
386*b1e83836Smrg 	    }
387*b1e83836Smrg 	}
388*b1e83836Smrg     }
389*b1e83836Smrg }
390*b1e83836Smrg 
391*b1e83836Smrg 
392*b1e83836Smrg extern void ssum_c17 (gfc_array_c17 * const restrict,
393*b1e83836Smrg 	gfc_array_c17 * const restrict, const index_type * const restrict,
394*b1e83836Smrg 	GFC_LOGICAL_4 *);
395*b1e83836Smrg export_proto(ssum_c17);
396*b1e83836Smrg 
397*b1e83836Smrg void
ssum_c17(gfc_array_c17 * const restrict retarray,gfc_array_c17 * const restrict array,const index_type * const restrict pdim,GFC_LOGICAL_4 * mask)398*b1e83836Smrg ssum_c17 (gfc_array_c17 * const restrict retarray,
399*b1e83836Smrg 	gfc_array_c17 * const restrict array,
400*b1e83836Smrg 	const index_type * const restrict pdim,
401*b1e83836Smrg 	GFC_LOGICAL_4 * mask)
402*b1e83836Smrg {
403*b1e83836Smrg   index_type count[GFC_MAX_DIMENSIONS];
404*b1e83836Smrg   index_type extent[GFC_MAX_DIMENSIONS];
405*b1e83836Smrg   index_type dstride[GFC_MAX_DIMENSIONS];
406*b1e83836Smrg   GFC_COMPLEX_17 * restrict dest;
407*b1e83836Smrg   index_type rank;
408*b1e83836Smrg   index_type n;
409*b1e83836Smrg   index_type dim;
410*b1e83836Smrg 
411*b1e83836Smrg 
412*b1e83836Smrg   if (mask == NULL || *mask)
413*b1e83836Smrg     {
414*b1e83836Smrg #ifdef HAVE_BACK_ARG
415*b1e83836Smrg       sum_c17 (retarray, array, pdim, back);
416*b1e83836Smrg #else
417*b1e83836Smrg       sum_c17 (retarray, array, pdim);
418*b1e83836Smrg #endif
419*b1e83836Smrg       return;
420*b1e83836Smrg     }
421*b1e83836Smrg   /* Make dim zero based to avoid confusion.  */
422*b1e83836Smrg   dim = (*pdim) - 1;
423*b1e83836Smrg   rank = GFC_DESCRIPTOR_RANK (array) - 1;
424*b1e83836Smrg 
425*b1e83836Smrg   if (unlikely (dim < 0 || dim > rank))
426*b1e83836Smrg     {
427*b1e83836Smrg       runtime_error ("Dim argument incorrect in SUM intrinsic: "
428*b1e83836Smrg  		     "is %ld, should be between 1 and %ld",
429*b1e83836Smrg 		     (long int) dim + 1, (long int) rank + 1);
430*b1e83836Smrg     }
431*b1e83836Smrg 
432*b1e83836Smrg   for (n = 0; n < dim; n++)
433*b1e83836Smrg     {
434*b1e83836Smrg       extent[n] = GFC_DESCRIPTOR_EXTENT(array,n);
435*b1e83836Smrg 
436*b1e83836Smrg       if (extent[n] <= 0)
437*b1e83836Smrg 	extent[n] = 0;
438*b1e83836Smrg     }
439*b1e83836Smrg 
440*b1e83836Smrg   for (n = dim; n < rank; n++)
441*b1e83836Smrg     {
442*b1e83836Smrg       extent[n] =
443*b1e83836Smrg 	GFC_DESCRIPTOR_EXTENT(array,n + 1);
444*b1e83836Smrg 
445*b1e83836Smrg       if (extent[n] <= 0)
446*b1e83836Smrg 	extent[n] = 0;
447*b1e83836Smrg     }
448*b1e83836Smrg 
449*b1e83836Smrg   if (retarray->base_addr == NULL)
450*b1e83836Smrg     {
451*b1e83836Smrg       size_t alloc_size, str;
452*b1e83836Smrg 
453*b1e83836Smrg       for (n = 0; n < rank; n++)
454*b1e83836Smrg 	{
455*b1e83836Smrg 	  if (n == 0)
456*b1e83836Smrg 	    str = 1;
457*b1e83836Smrg 	  else
458*b1e83836Smrg 	    str = GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1];
459*b1e83836Smrg 
460*b1e83836Smrg 	  GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str);
461*b1e83836Smrg 
462*b1e83836Smrg 	}
463*b1e83836Smrg 
464*b1e83836Smrg       retarray->offset = 0;
465*b1e83836Smrg       retarray->dtype.rank = rank;
466*b1e83836Smrg 
467*b1e83836Smrg       alloc_size = GFC_DESCRIPTOR_STRIDE(retarray,rank-1) * extent[rank-1];
468*b1e83836Smrg 
469*b1e83836Smrg       if (alloc_size == 0)
470*b1e83836Smrg 	{
471*b1e83836Smrg 	  /* Make sure we have a zero-sized array.  */
472*b1e83836Smrg 	  GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1);
473*b1e83836Smrg 	  return;
474*b1e83836Smrg 	}
475*b1e83836Smrg       else
476*b1e83836Smrg 	retarray->base_addr = xmallocarray (alloc_size, sizeof (GFC_COMPLEX_17));
477*b1e83836Smrg     }
478*b1e83836Smrg   else
479*b1e83836Smrg     {
480*b1e83836Smrg       if (rank != GFC_DESCRIPTOR_RANK (retarray))
481*b1e83836Smrg 	runtime_error ("rank of return array incorrect in"
482*b1e83836Smrg 		       " SUM intrinsic: is %ld, should be %ld",
483*b1e83836Smrg 		       (long int) (GFC_DESCRIPTOR_RANK (retarray)),
484*b1e83836Smrg 		       (long int) rank);
485*b1e83836Smrg 
486*b1e83836Smrg       if (unlikely (compile_options.bounds_check))
487*b1e83836Smrg 	{
488*b1e83836Smrg 	  for (n=0; n < rank; n++)
489*b1e83836Smrg 	    {
490*b1e83836Smrg 	      index_type ret_extent;
491*b1e83836Smrg 
492*b1e83836Smrg 	      ret_extent = GFC_DESCRIPTOR_EXTENT(retarray,n);
493*b1e83836Smrg 	      if (extent[n] != ret_extent)
494*b1e83836Smrg 		runtime_error ("Incorrect extent in return value of"
495*b1e83836Smrg 			       " SUM intrinsic in dimension %ld:"
496*b1e83836Smrg 			       " is %ld, should be %ld", (long int) n + 1,
497*b1e83836Smrg 			       (long int) ret_extent, (long int) extent[n]);
498*b1e83836Smrg 	    }
499*b1e83836Smrg 	}
500*b1e83836Smrg     }
501*b1e83836Smrg 
502*b1e83836Smrg   for (n = 0; n < rank; n++)
503*b1e83836Smrg     {
504*b1e83836Smrg       count[n] = 0;
505*b1e83836Smrg       dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n);
506*b1e83836Smrg     }
507*b1e83836Smrg 
508*b1e83836Smrg   dest = retarray->base_addr;
509*b1e83836Smrg 
510*b1e83836Smrg   while(1)
511*b1e83836Smrg     {
512*b1e83836Smrg       *dest = 0;
513*b1e83836Smrg       count[0]++;
514*b1e83836Smrg       dest += dstride[0];
515*b1e83836Smrg       n = 0;
516*b1e83836Smrg       while (count[n] == extent[n])
517*b1e83836Smrg 	{
518*b1e83836Smrg 	  /* When we get to the end of a dimension, reset it and increment
519*b1e83836Smrg 	     the next dimension.  */
520*b1e83836Smrg 	  count[n] = 0;
521*b1e83836Smrg 	  /* We could precalculate these products, but this is a less
522*b1e83836Smrg 	     frequently used path so probably not worth it.  */
523*b1e83836Smrg 	  dest -= dstride[n] * extent[n];
524*b1e83836Smrg 	  n++;
525*b1e83836Smrg 	  if (n >= rank)
526*b1e83836Smrg 	    return;
527*b1e83836Smrg 	  else
528*b1e83836Smrg 	    {
529*b1e83836Smrg 	      count[n]++;
530*b1e83836Smrg 	      dest += dstride[n];
531*b1e83836Smrg 	    }
532*b1e83836Smrg       	}
533*b1e83836Smrg     }
534*b1e83836Smrg }
535*b1e83836Smrg 
536*b1e83836Smrg #endif
537