xref: /netbsd-src/external/gpl3/gcc.old/dist/libgfortran/generated/norm2_r4.c (revision 4c3eb207d36f67d31994830c0a694161fc1ca39b)
1627f7eb2Smrg /* Implementation of the NORM2 intrinsic
2*4c3eb207Smrg    Copyright (C) 2010-2020 Free Software Foundation, Inc.
3627f7eb2Smrg    Contributed by Tobias Burnus  <burnus@net-b.de>
4627f7eb2Smrg 
5627f7eb2Smrg This file is part of the GNU Fortran runtime library (libgfortran).
6627f7eb2Smrg 
7627f7eb2Smrg Libgfortran is free software; you can redistribute it and/or
8627f7eb2Smrg modify it under the terms of the GNU General Public
9627f7eb2Smrg License as published by the Free Software Foundation; either
10627f7eb2Smrg version 3 of the License, or (at your option) any later version.
11627f7eb2Smrg 
12627f7eb2Smrg Libgfortran is distributed in the hope that it will be useful,
13627f7eb2Smrg but WITHOUT ANY WARRANTY; without even the implied warranty of
14627f7eb2Smrg MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15627f7eb2Smrg GNU General Public License for more details.
16627f7eb2Smrg 
17627f7eb2Smrg Under Section 7 of GPL version 3, you are granted additional
18627f7eb2Smrg permissions described in the GCC Runtime Library Exception, version
19627f7eb2Smrg 3.1, as published by the Free Software Foundation.
20627f7eb2Smrg 
21627f7eb2Smrg You should have received a copy of the GNU General Public License and
22627f7eb2Smrg a copy of the GCC Runtime Library Exception along with this program;
23627f7eb2Smrg see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
24627f7eb2Smrg <http://www.gnu.org/licenses/>.  */
25627f7eb2Smrg 
26627f7eb2Smrg #include "libgfortran.h"
27627f7eb2Smrg 
28627f7eb2Smrg 
29627f7eb2Smrg 
30627f7eb2Smrg #if defined (HAVE_GFC_REAL_4) && defined (HAVE_GFC_REAL_4) && defined (HAVE_SQRTF) && defined (HAVE_FABSF)
31627f7eb2Smrg 
32627f7eb2Smrg #define MATHFUNC(funcname) funcname ## f
33627f7eb2Smrg 
34627f7eb2Smrg 
35627f7eb2Smrg extern void norm2_r4 (gfc_array_r4 * const restrict,
36627f7eb2Smrg 	gfc_array_r4 * const restrict, const index_type * const restrict);
37627f7eb2Smrg export_proto(norm2_r4);
38627f7eb2Smrg 
39627f7eb2Smrg void
norm2_r4(gfc_array_r4 * const restrict retarray,gfc_array_r4 * const restrict array,const index_type * const restrict pdim)40627f7eb2Smrg norm2_r4 (gfc_array_r4 * const restrict retarray,
41627f7eb2Smrg 	gfc_array_r4 * const restrict array,
42627f7eb2Smrg 	const index_type * const restrict pdim)
43627f7eb2Smrg {
44627f7eb2Smrg   index_type count[GFC_MAX_DIMENSIONS];
45627f7eb2Smrg   index_type extent[GFC_MAX_DIMENSIONS];
46627f7eb2Smrg   index_type sstride[GFC_MAX_DIMENSIONS];
47627f7eb2Smrg   index_type dstride[GFC_MAX_DIMENSIONS];
48627f7eb2Smrg   const GFC_REAL_4 * restrict base;
49627f7eb2Smrg   GFC_REAL_4 * restrict dest;
50627f7eb2Smrg   index_type rank;
51627f7eb2Smrg   index_type n;
52627f7eb2Smrg   index_type len;
53627f7eb2Smrg   index_type delta;
54627f7eb2Smrg   index_type dim;
55627f7eb2Smrg   int continue_loop;
56627f7eb2Smrg 
57627f7eb2Smrg   /* Make dim zero based to avoid confusion.  */
58627f7eb2Smrg   rank = GFC_DESCRIPTOR_RANK (array) - 1;
59627f7eb2Smrg   dim = (*pdim) - 1;
60627f7eb2Smrg 
61627f7eb2Smrg   if (unlikely (dim < 0 || dim > rank))
62627f7eb2Smrg     {
63627f7eb2Smrg       runtime_error ("Dim argument incorrect in NORM intrinsic: "
64627f7eb2Smrg  		     "is %ld, should be between 1 and %ld",
65627f7eb2Smrg 		     (long int) dim + 1, (long int) rank + 1);
66627f7eb2Smrg     }
67627f7eb2Smrg 
68627f7eb2Smrg   len = GFC_DESCRIPTOR_EXTENT(array,dim);
69627f7eb2Smrg   if (len < 0)
70627f7eb2Smrg     len = 0;
71627f7eb2Smrg   delta = GFC_DESCRIPTOR_STRIDE(array,dim);
72627f7eb2Smrg 
73627f7eb2Smrg   for (n = 0; n < dim; n++)
74627f7eb2Smrg     {
75627f7eb2Smrg       sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n);
76627f7eb2Smrg       extent[n] = GFC_DESCRIPTOR_EXTENT(array,n);
77627f7eb2Smrg 
78627f7eb2Smrg       if (extent[n] < 0)
79627f7eb2Smrg 	extent[n] = 0;
80627f7eb2Smrg     }
81627f7eb2Smrg   for (n = dim; n < rank; n++)
82627f7eb2Smrg     {
83627f7eb2Smrg       sstride[n] = GFC_DESCRIPTOR_STRIDE(array, n + 1);
84627f7eb2Smrg       extent[n] = GFC_DESCRIPTOR_EXTENT(array, n + 1);
85627f7eb2Smrg 
86627f7eb2Smrg       if (extent[n] < 0)
87627f7eb2Smrg 	extent[n] = 0;
88627f7eb2Smrg     }
89627f7eb2Smrg 
90627f7eb2Smrg   if (retarray->base_addr == NULL)
91627f7eb2Smrg     {
92627f7eb2Smrg       size_t alloc_size, str;
93627f7eb2Smrg 
94627f7eb2Smrg       for (n = 0; n < rank; n++)
95627f7eb2Smrg 	{
96627f7eb2Smrg 	  if (n == 0)
97627f7eb2Smrg 	    str = 1;
98627f7eb2Smrg 	  else
99627f7eb2Smrg 	    str = GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1];
100627f7eb2Smrg 
101627f7eb2Smrg 	  GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str);
102627f7eb2Smrg 
103627f7eb2Smrg 	}
104627f7eb2Smrg 
105627f7eb2Smrg       retarray->offset = 0;
106627f7eb2Smrg       retarray->dtype.rank = rank;
107627f7eb2Smrg 
108627f7eb2Smrg       alloc_size = GFC_DESCRIPTOR_STRIDE(retarray,rank-1) * extent[rank-1];
109627f7eb2Smrg 
110627f7eb2Smrg       retarray->base_addr = xmallocarray (alloc_size, sizeof (GFC_REAL_4));
111627f7eb2Smrg       if (alloc_size == 0)
112627f7eb2Smrg 	{
113627f7eb2Smrg 	  /* Make sure we have a zero-sized array.  */
114627f7eb2Smrg 	  GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1);
115627f7eb2Smrg 	  return;
116627f7eb2Smrg 
117627f7eb2Smrg 	}
118627f7eb2Smrg     }
119627f7eb2Smrg   else
120627f7eb2Smrg     {
121627f7eb2Smrg       if (rank != GFC_DESCRIPTOR_RANK (retarray))
122627f7eb2Smrg 	runtime_error ("rank of return array incorrect in"
123627f7eb2Smrg 		       " NORM intrinsic: is %ld, should be %ld",
124627f7eb2Smrg 		       (long int) (GFC_DESCRIPTOR_RANK (retarray)),
125627f7eb2Smrg 		       (long int) rank);
126627f7eb2Smrg 
127627f7eb2Smrg       if (unlikely (compile_options.bounds_check))
128627f7eb2Smrg 	bounds_ifunction_return ((array_t *) retarray, extent,
129627f7eb2Smrg 				 "return value", "NORM");
130627f7eb2Smrg     }
131627f7eb2Smrg 
132627f7eb2Smrg   for (n = 0; n < rank; n++)
133627f7eb2Smrg     {
134627f7eb2Smrg       count[n] = 0;
135627f7eb2Smrg       dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n);
136627f7eb2Smrg       if (extent[n] <= 0)
137627f7eb2Smrg 	return;
138627f7eb2Smrg     }
139627f7eb2Smrg 
140627f7eb2Smrg   base = array->base_addr;
141627f7eb2Smrg   dest = retarray->base_addr;
142627f7eb2Smrg 
143627f7eb2Smrg   continue_loop = 1;
144627f7eb2Smrg   while (continue_loop)
145627f7eb2Smrg     {
146627f7eb2Smrg       const GFC_REAL_4 * restrict src;
147627f7eb2Smrg       GFC_REAL_4 result;
148627f7eb2Smrg       src = base;
149627f7eb2Smrg       {
150627f7eb2Smrg 
151627f7eb2Smrg 	GFC_REAL_4 scale;
152627f7eb2Smrg 	result = 0;
153627f7eb2Smrg 	scale = 1;
154627f7eb2Smrg 	if (len <= 0)
155627f7eb2Smrg 	  *dest = 0;
156627f7eb2Smrg 	else
157627f7eb2Smrg 	  {
158627f7eb2Smrg #if ! defined HAVE_BACK_ARG
159627f7eb2Smrg 	    for (n = 0; n < len; n++, src += delta)
160627f7eb2Smrg 	      {
161627f7eb2Smrg #endif
162627f7eb2Smrg 
163627f7eb2Smrg 	  if (*src != 0)
164627f7eb2Smrg 	    {
165627f7eb2Smrg 	      GFC_REAL_4 absX, val;
166627f7eb2Smrg 	      absX = MATHFUNC(fabs) (*src);
167627f7eb2Smrg 	      if (scale < absX)
168627f7eb2Smrg 		{
169627f7eb2Smrg 		  val = scale / absX;
170627f7eb2Smrg 		  result = 1 + result * val * val;
171627f7eb2Smrg 		  scale = absX;
172627f7eb2Smrg 		}
173627f7eb2Smrg 	      else
174627f7eb2Smrg 		{
175627f7eb2Smrg 		  val = absX / scale;
176627f7eb2Smrg 		  result += val * val;
177627f7eb2Smrg 		}
178627f7eb2Smrg 	    }
179627f7eb2Smrg 	      }
180627f7eb2Smrg 	    result = scale * MATHFUNC(sqrt) (result);
181627f7eb2Smrg 	    *dest = result;
182627f7eb2Smrg 	  }
183627f7eb2Smrg       }
184627f7eb2Smrg       /* Advance to the next element.  */
185627f7eb2Smrg       count[0]++;
186627f7eb2Smrg       base += sstride[0];
187627f7eb2Smrg       dest += dstride[0];
188627f7eb2Smrg       n = 0;
189627f7eb2Smrg       while (count[n] == extent[n])
190627f7eb2Smrg 	{
191627f7eb2Smrg 	  /* When we get to the end of a dimension, reset it and increment
192627f7eb2Smrg 	     the next dimension.  */
193627f7eb2Smrg 	  count[n] = 0;
194627f7eb2Smrg 	  /* We could precalculate these products, but this is a less
195627f7eb2Smrg 	     frequently used path so probably not worth it.  */
196627f7eb2Smrg 	  base -= sstride[n] * extent[n];
197627f7eb2Smrg 	  dest -= dstride[n] * extent[n];
198627f7eb2Smrg 	  n++;
199627f7eb2Smrg 	  if (n >= rank)
200627f7eb2Smrg 	    {
201627f7eb2Smrg 	      /* Break out of the loop.  */
202627f7eb2Smrg 	      continue_loop = 0;
203627f7eb2Smrg 	      break;
204627f7eb2Smrg 	    }
205627f7eb2Smrg 	  else
206627f7eb2Smrg 	    {
207627f7eb2Smrg 	      count[n]++;
208627f7eb2Smrg 	      base += sstride[n];
209627f7eb2Smrg 	      dest += dstride[n];
210627f7eb2Smrg 	    }
211627f7eb2Smrg 	}
212627f7eb2Smrg     }
213627f7eb2Smrg }
214627f7eb2Smrg 
215627f7eb2Smrg #endif
216