1627f7eb2Smrg /* Implementation of the NORM2 intrinsic
2*4c3eb207Smrg Copyright (C) 2010-2020 Free Software Foundation, Inc.
3627f7eb2Smrg Contributed by Tobias Burnus <burnus@net-b.de>
4627f7eb2Smrg
5627f7eb2Smrg This file is part of the GNU Fortran runtime library (libgfortran).
6627f7eb2Smrg
7627f7eb2Smrg Libgfortran is free software; you can redistribute it and/or
8627f7eb2Smrg modify it under the terms of the GNU General Public
9627f7eb2Smrg License as published by the Free Software Foundation; either
10627f7eb2Smrg version 3 of the License, or (at your option) any later version.
11627f7eb2Smrg
12627f7eb2Smrg Libgfortran is distributed in the hope that it will be useful,
13627f7eb2Smrg but WITHOUT ANY WARRANTY; without even the implied warranty of
14627f7eb2Smrg MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15627f7eb2Smrg GNU General Public License for more details.
16627f7eb2Smrg
17627f7eb2Smrg Under Section 7 of GPL version 3, you are granted additional
18627f7eb2Smrg permissions described in the GCC Runtime Library Exception, version
19627f7eb2Smrg 3.1, as published by the Free Software Foundation.
20627f7eb2Smrg
21627f7eb2Smrg You should have received a copy of the GNU General Public License and
22627f7eb2Smrg a copy of the GCC Runtime Library Exception along with this program;
23627f7eb2Smrg see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
24627f7eb2Smrg <http://www.gnu.org/licenses/>. */
25627f7eb2Smrg
26627f7eb2Smrg #include "libgfortran.h"
27627f7eb2Smrg
28627f7eb2Smrg
29627f7eb2Smrg
30627f7eb2Smrg #if defined (HAVE_GFC_REAL_4) && defined (HAVE_GFC_REAL_4) && defined (HAVE_SQRTF) && defined (HAVE_FABSF)
31627f7eb2Smrg
32627f7eb2Smrg #define MATHFUNC(funcname) funcname ## f
33627f7eb2Smrg
34627f7eb2Smrg
35627f7eb2Smrg extern void norm2_r4 (gfc_array_r4 * const restrict,
36627f7eb2Smrg gfc_array_r4 * const restrict, const index_type * const restrict);
37627f7eb2Smrg export_proto(norm2_r4);
38627f7eb2Smrg
39627f7eb2Smrg void
norm2_r4(gfc_array_r4 * const restrict retarray,gfc_array_r4 * const restrict array,const index_type * const restrict pdim)40627f7eb2Smrg norm2_r4 (gfc_array_r4 * const restrict retarray,
41627f7eb2Smrg gfc_array_r4 * const restrict array,
42627f7eb2Smrg const index_type * const restrict pdim)
43627f7eb2Smrg {
44627f7eb2Smrg index_type count[GFC_MAX_DIMENSIONS];
45627f7eb2Smrg index_type extent[GFC_MAX_DIMENSIONS];
46627f7eb2Smrg index_type sstride[GFC_MAX_DIMENSIONS];
47627f7eb2Smrg index_type dstride[GFC_MAX_DIMENSIONS];
48627f7eb2Smrg const GFC_REAL_4 * restrict base;
49627f7eb2Smrg GFC_REAL_4 * restrict dest;
50627f7eb2Smrg index_type rank;
51627f7eb2Smrg index_type n;
52627f7eb2Smrg index_type len;
53627f7eb2Smrg index_type delta;
54627f7eb2Smrg index_type dim;
55627f7eb2Smrg int continue_loop;
56627f7eb2Smrg
57627f7eb2Smrg /* Make dim zero based to avoid confusion. */
58627f7eb2Smrg rank = GFC_DESCRIPTOR_RANK (array) - 1;
59627f7eb2Smrg dim = (*pdim) - 1;
60627f7eb2Smrg
61627f7eb2Smrg if (unlikely (dim < 0 || dim > rank))
62627f7eb2Smrg {
63627f7eb2Smrg runtime_error ("Dim argument incorrect in NORM intrinsic: "
64627f7eb2Smrg "is %ld, should be between 1 and %ld",
65627f7eb2Smrg (long int) dim + 1, (long int) rank + 1);
66627f7eb2Smrg }
67627f7eb2Smrg
68627f7eb2Smrg len = GFC_DESCRIPTOR_EXTENT(array,dim);
69627f7eb2Smrg if (len < 0)
70627f7eb2Smrg len = 0;
71627f7eb2Smrg delta = GFC_DESCRIPTOR_STRIDE(array,dim);
72627f7eb2Smrg
73627f7eb2Smrg for (n = 0; n < dim; n++)
74627f7eb2Smrg {
75627f7eb2Smrg sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n);
76627f7eb2Smrg extent[n] = GFC_DESCRIPTOR_EXTENT(array,n);
77627f7eb2Smrg
78627f7eb2Smrg if (extent[n] < 0)
79627f7eb2Smrg extent[n] = 0;
80627f7eb2Smrg }
81627f7eb2Smrg for (n = dim; n < rank; n++)
82627f7eb2Smrg {
83627f7eb2Smrg sstride[n] = GFC_DESCRIPTOR_STRIDE(array, n + 1);
84627f7eb2Smrg extent[n] = GFC_DESCRIPTOR_EXTENT(array, n + 1);
85627f7eb2Smrg
86627f7eb2Smrg if (extent[n] < 0)
87627f7eb2Smrg extent[n] = 0;
88627f7eb2Smrg }
89627f7eb2Smrg
90627f7eb2Smrg if (retarray->base_addr == NULL)
91627f7eb2Smrg {
92627f7eb2Smrg size_t alloc_size, str;
93627f7eb2Smrg
94627f7eb2Smrg for (n = 0; n < rank; n++)
95627f7eb2Smrg {
96627f7eb2Smrg if (n == 0)
97627f7eb2Smrg str = 1;
98627f7eb2Smrg else
99627f7eb2Smrg str = GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1];
100627f7eb2Smrg
101627f7eb2Smrg GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str);
102627f7eb2Smrg
103627f7eb2Smrg }
104627f7eb2Smrg
105627f7eb2Smrg retarray->offset = 0;
106627f7eb2Smrg retarray->dtype.rank = rank;
107627f7eb2Smrg
108627f7eb2Smrg alloc_size = GFC_DESCRIPTOR_STRIDE(retarray,rank-1) * extent[rank-1];
109627f7eb2Smrg
110627f7eb2Smrg retarray->base_addr = xmallocarray (alloc_size, sizeof (GFC_REAL_4));
111627f7eb2Smrg if (alloc_size == 0)
112627f7eb2Smrg {
113627f7eb2Smrg /* Make sure we have a zero-sized array. */
114627f7eb2Smrg GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1);
115627f7eb2Smrg return;
116627f7eb2Smrg
117627f7eb2Smrg }
118627f7eb2Smrg }
119627f7eb2Smrg else
120627f7eb2Smrg {
121627f7eb2Smrg if (rank != GFC_DESCRIPTOR_RANK (retarray))
122627f7eb2Smrg runtime_error ("rank of return array incorrect in"
123627f7eb2Smrg " NORM intrinsic: is %ld, should be %ld",
124627f7eb2Smrg (long int) (GFC_DESCRIPTOR_RANK (retarray)),
125627f7eb2Smrg (long int) rank);
126627f7eb2Smrg
127627f7eb2Smrg if (unlikely (compile_options.bounds_check))
128627f7eb2Smrg bounds_ifunction_return ((array_t *) retarray, extent,
129627f7eb2Smrg "return value", "NORM");
130627f7eb2Smrg }
131627f7eb2Smrg
132627f7eb2Smrg for (n = 0; n < rank; n++)
133627f7eb2Smrg {
134627f7eb2Smrg count[n] = 0;
135627f7eb2Smrg dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n);
136627f7eb2Smrg if (extent[n] <= 0)
137627f7eb2Smrg return;
138627f7eb2Smrg }
139627f7eb2Smrg
140627f7eb2Smrg base = array->base_addr;
141627f7eb2Smrg dest = retarray->base_addr;
142627f7eb2Smrg
143627f7eb2Smrg continue_loop = 1;
144627f7eb2Smrg while (continue_loop)
145627f7eb2Smrg {
146627f7eb2Smrg const GFC_REAL_4 * restrict src;
147627f7eb2Smrg GFC_REAL_4 result;
148627f7eb2Smrg src = base;
149627f7eb2Smrg {
150627f7eb2Smrg
151627f7eb2Smrg GFC_REAL_4 scale;
152627f7eb2Smrg result = 0;
153627f7eb2Smrg scale = 1;
154627f7eb2Smrg if (len <= 0)
155627f7eb2Smrg *dest = 0;
156627f7eb2Smrg else
157627f7eb2Smrg {
158627f7eb2Smrg #if ! defined HAVE_BACK_ARG
159627f7eb2Smrg for (n = 0; n < len; n++, src += delta)
160627f7eb2Smrg {
161627f7eb2Smrg #endif
162627f7eb2Smrg
163627f7eb2Smrg if (*src != 0)
164627f7eb2Smrg {
165627f7eb2Smrg GFC_REAL_4 absX, val;
166627f7eb2Smrg absX = MATHFUNC(fabs) (*src);
167627f7eb2Smrg if (scale < absX)
168627f7eb2Smrg {
169627f7eb2Smrg val = scale / absX;
170627f7eb2Smrg result = 1 + result * val * val;
171627f7eb2Smrg scale = absX;
172627f7eb2Smrg }
173627f7eb2Smrg else
174627f7eb2Smrg {
175627f7eb2Smrg val = absX / scale;
176627f7eb2Smrg result += val * val;
177627f7eb2Smrg }
178627f7eb2Smrg }
179627f7eb2Smrg }
180627f7eb2Smrg result = scale * MATHFUNC(sqrt) (result);
181627f7eb2Smrg *dest = result;
182627f7eb2Smrg }
183627f7eb2Smrg }
184627f7eb2Smrg /* Advance to the next element. */
185627f7eb2Smrg count[0]++;
186627f7eb2Smrg base += sstride[0];
187627f7eb2Smrg dest += dstride[0];
188627f7eb2Smrg n = 0;
189627f7eb2Smrg while (count[n] == extent[n])
190627f7eb2Smrg {
191627f7eb2Smrg /* When we get to the end of a dimension, reset it and increment
192627f7eb2Smrg the next dimension. */
193627f7eb2Smrg count[n] = 0;
194627f7eb2Smrg /* We could precalculate these products, but this is a less
195627f7eb2Smrg frequently used path so probably not worth it. */
196627f7eb2Smrg base -= sstride[n] * extent[n];
197627f7eb2Smrg dest -= dstride[n] * extent[n];
198627f7eb2Smrg n++;
199627f7eb2Smrg if (n >= rank)
200627f7eb2Smrg {
201627f7eb2Smrg /* Break out of the loop. */
202627f7eb2Smrg continue_loop = 0;
203627f7eb2Smrg break;
204627f7eb2Smrg }
205627f7eb2Smrg else
206627f7eb2Smrg {
207627f7eb2Smrg count[n]++;
208627f7eb2Smrg base += sstride[n];
209627f7eb2Smrg dest += dstride[n];
210627f7eb2Smrg }
211627f7eb2Smrg }
212627f7eb2Smrg }
213627f7eb2Smrg }
214627f7eb2Smrg
215627f7eb2Smrg #endif
216