]>
Commit | Line | Data |
---|---|---|
6de9cd9a | 1 | /* Implementation of the SUM intrinsic |
748086b7 | 2 | Copyright 2002, 2007, 2009 Free Software Foundation, Inc. |
6de9cd9a DN |
3 | Contributed by Paul Brook <paul@nowt.org> |
4 | ||
57dea9f6 | 5 | This file is part of the GNU Fortran 95 runtime library (libgfortran). |
6de9cd9a DN |
6 | |
7 | Libgfortran is free software; you can redistribute it and/or | |
57dea9f6 | 8 | modify it under the terms of the GNU General Public |
6de9cd9a | 9 | License as published by the Free Software Foundation; either |
748086b7 | 10 | version 3 of the License, or (at your option) any later version. |
6de9cd9a DN |
11 | |
12 | Libgfortran is distributed in the hope that it will be useful, | |
13 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
14 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
57dea9f6 | 15 | GNU General Public License for more details. |
6de9cd9a | 16 | |
748086b7 JJ |
17 | Under Section 7 of GPL version 3, you are granted additional |
18 | permissions described in the GCC Runtime Library Exception, version | |
19 | 3.1, as published by the Free Software Foundation. | |
20 | ||
21 | You should have received a copy of the GNU General Public License and | |
22 | a copy of the GCC Runtime Library Exception along with this program; | |
23 | see the files COPYING3 and COPYING.RUNTIME respectively. If not, see | |
24 | <http://www.gnu.org/licenses/>. */ | |
6de9cd9a | 25 | |
36ae8a61 | 26 | #include "libgfortran.h" |
6de9cd9a DN |
27 | #include <stdlib.h> |
28 | #include <assert.h> | |
6de9cd9a | 29 | |
7d7b8bfe | 30 | |
644cb69f FXC |
31 | #if defined (HAVE_GFC_INTEGER_4) && defined (HAVE_GFC_INTEGER_4) |
32 | ||
33 | ||
64acfd99 JB |
34 | extern void sum_i4 (gfc_array_i4 * const restrict, |
35 | gfc_array_i4 * const restrict, const index_type * const restrict); | |
7f68c75f | 36 | export_proto(sum_i4); |
7d7b8bfe | 37 | |
6de9cd9a | 38 | void |
64acfd99 JB |
39 | sum_i4 (gfc_array_i4 * const restrict retarray, |
40 | gfc_array_i4 * const restrict array, | |
41 | const index_type * const restrict pdim) | |
6de9cd9a | 42 | { |
e33e218b TK |
43 | index_type count[GFC_MAX_DIMENSIONS]; |
44 | index_type extent[GFC_MAX_DIMENSIONS]; | |
45 | index_type sstride[GFC_MAX_DIMENSIONS]; | |
46 | index_type dstride[GFC_MAX_DIMENSIONS]; | |
64acfd99 JB |
47 | const GFC_INTEGER_4 * restrict base; |
48 | GFC_INTEGER_4 * restrict dest; | |
6de9cd9a DN |
49 | index_type rank; |
50 | index_type n; | |
51 | index_type len; | |
52 | index_type delta; | |
53 | index_type dim; | |
da96f5ab | 54 | int continue_loop; |
6de9cd9a DN |
55 | |
56 | /* Make dim zero based to avoid confusion. */ | |
57 | dim = (*pdim) - 1; | |
58 | rank = GFC_DESCRIPTOR_RANK (array) - 1; | |
e33e218b | 59 | |
dfb55fdc | 60 | len = GFC_DESCRIPTOR_EXTENT(array,dim); |
da96f5ab TK |
61 | if (len < 0) |
62 | len = 0; | |
dfb55fdc | 63 | delta = GFC_DESCRIPTOR_STRIDE(array,dim); |
6de9cd9a DN |
64 | |
65 | for (n = 0; n < dim; n++) | |
66 | { | |
dfb55fdc TK |
67 | sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n); |
68 | extent[n] = GFC_DESCRIPTOR_EXTENT(array,n); | |
80ee04b9 TK |
69 | |
70 | if (extent[n] < 0) | |
71 | extent[n] = 0; | |
6de9cd9a DN |
72 | } |
73 | for (n = dim; n < rank; n++) | |
74 | { | |
dfb55fdc TK |
75 | sstride[n] = GFC_DESCRIPTOR_STRIDE(array, n + 1); |
76 | extent[n] = GFC_DESCRIPTOR_EXTENT(array, n + 1); | |
80ee04b9 TK |
77 | |
78 | if (extent[n] < 0) | |
79 | extent[n] = 0; | |
6de9cd9a DN |
80 | } |
81 | ||
6c167c45 VL |
82 | if (retarray->data == NULL) |
83 | { | |
dfb55fdc | 84 | size_t alloc_size, str; |
80ee04b9 | 85 | |
6c167c45 VL |
86 | for (n = 0; n < rank; n++) |
87 | { | |
6c167c45 | 88 | if (n == 0) |
dfb55fdc | 89 | str = 1; |
6c167c45 | 90 | else |
dfb55fdc TK |
91 | str = GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1]; |
92 | ||
93 | GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str); | |
94 | ||
6c167c45 VL |
95 | } |
96 | ||
efd4dc1a | 97 | retarray->offset = 0; |
50dd63a9 | 98 | retarray->dtype = (array->dtype & ~GFC_DTYPE_RANK_MASK) | rank; |
80ee04b9 | 99 | |
dfb55fdc | 100 | alloc_size = sizeof (GFC_INTEGER_4) * GFC_DESCRIPTOR_STRIDE(retarray,rank-1) |
80ee04b9 TK |
101 | * extent[rank-1]; |
102 | ||
103 | if (alloc_size == 0) | |
104 | { | |
105 | /* Make sure we have a zero-sized array. */ | |
dfb55fdc | 106 | GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1); |
80ee04b9 | 107 | return; |
dfb55fdc | 108 | |
80ee04b9 TK |
109 | } |
110 | else | |
111 | retarray->data = internal_malloc_size (alloc_size); | |
6c167c45 | 112 | } |
50dd63a9 TK |
113 | else |
114 | { | |
50dd63a9 | 115 | if (rank != GFC_DESCRIPTOR_RANK (retarray)) |
fd6590f8 | 116 | runtime_error ("rank of return array incorrect in" |
ccacefc7 TK |
117 | " SUM intrinsic: is %ld, should be %ld", |
118 | (long int) (GFC_DESCRIPTOR_RANK (retarray)), | |
119 | (long int) rank); | |
fd6590f8 | 120 | |
9731c4a3 | 121 | if (unlikely (compile_options.bounds_check)) |
16bff921 TK |
122 | bounds_ifunction_return ((array_t *) retarray, extent, |
123 | "return value", "SUM"); | |
50dd63a9 TK |
124 | } |
125 | ||
6de9cd9a DN |
126 | for (n = 0; n < rank; n++) |
127 | { | |
128 | count[n] = 0; | |
dfb55fdc | 129 | dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n); |
6de9cd9a DN |
130 | if (extent[n] <= 0) |
131 | len = 0; | |
132 | } | |
133 | ||
134 | base = array->data; | |
135 | dest = retarray->data; | |
136 | ||
da96f5ab TK |
137 | continue_loop = 1; |
138 | while (continue_loop) | |
6de9cd9a | 139 | { |
64acfd99 | 140 | const GFC_INTEGER_4 * restrict src; |
6de9cd9a DN |
141 | GFC_INTEGER_4 result; |
142 | src = base; | |
143 | { | |
144 | ||
145 | result = 0; | |
146 | if (len <= 0) | |
147 | *dest = 0; | |
148 | else | |
149 | { | |
150 | for (n = 0; n < len; n++, src += delta) | |
151 | { | |
152 | ||
153 | result += *src; | |
154 | } | |
155 | *dest = result; | |
156 | } | |
157 | } | |
158 | /* Advance to the next element. */ | |
159 | count[0]++; | |
160 | base += sstride[0]; | |
161 | dest += dstride[0]; | |
162 | n = 0; | |
163 | while (count[n] == extent[n]) | |
164 | { | |
165 | /* When we get to the end of a dimension, reset it and increment | |
166 | the next dimension. */ | |
167 | count[n] = 0; | |
168 | /* We could precalculate these products, but this is a less | |
5d7adf7a | 169 | frequently used path so probably not worth it. */ |
6de9cd9a DN |
170 | base -= sstride[n] * extent[n]; |
171 | dest -= dstride[n] * extent[n]; | |
172 | n++; | |
173 | if (n == rank) | |
174 | { | |
175 | /* Break out of the look. */ | |
da96f5ab TK |
176 | continue_loop = 0; |
177 | break; | |
6de9cd9a DN |
178 | } |
179 | else | |
180 | { | |
181 | count[n]++; | |
182 | base += sstride[n]; | |
183 | dest += dstride[n]; | |
184 | } | |
185 | } | |
186 | } | |
187 | } | |
188 | ||
7d7b8bfe | 189 | |
64acfd99 JB |
190 | extern void msum_i4 (gfc_array_i4 * const restrict, |
191 | gfc_array_i4 * const restrict, const index_type * const restrict, | |
28dc6b33 | 192 | gfc_array_l1 * const restrict); |
7f68c75f | 193 | export_proto(msum_i4); |
7d7b8bfe | 194 | |
6de9cd9a | 195 | void |
64acfd99 JB |
196 | msum_i4 (gfc_array_i4 * const restrict retarray, |
197 | gfc_array_i4 * const restrict array, | |
198 | const index_type * const restrict pdim, | |
28dc6b33 | 199 | gfc_array_l1 * const restrict mask) |
6de9cd9a | 200 | { |
e33e218b TK |
201 | index_type count[GFC_MAX_DIMENSIONS]; |
202 | index_type extent[GFC_MAX_DIMENSIONS]; | |
203 | index_type sstride[GFC_MAX_DIMENSIONS]; | |
204 | index_type dstride[GFC_MAX_DIMENSIONS]; | |
205 | index_type mstride[GFC_MAX_DIMENSIONS]; | |
64acfd99 JB |
206 | GFC_INTEGER_4 * restrict dest; |
207 | const GFC_INTEGER_4 * restrict base; | |
28dc6b33 | 208 | const GFC_LOGICAL_1 * restrict mbase; |
6de9cd9a DN |
209 | int rank; |
210 | int dim; | |
211 | index_type n; | |
212 | index_type len; | |
213 | index_type delta; | |
214 | index_type mdelta; | |
28dc6b33 | 215 | int mask_kind; |
6de9cd9a DN |
216 | |
217 | dim = (*pdim) - 1; | |
218 | rank = GFC_DESCRIPTOR_RANK (array) - 1; | |
e33e218b | 219 | |
dfb55fdc | 220 | len = GFC_DESCRIPTOR_EXTENT(array,dim); |
6de9cd9a DN |
221 | if (len <= 0) |
222 | return; | |
28dc6b33 TK |
223 | |
224 | mbase = mask->data; | |
225 | ||
226 | mask_kind = GFC_DESCRIPTOR_SIZE (mask); | |
227 | ||
228 | if (mask_kind == 1 || mask_kind == 2 || mask_kind == 4 || mask_kind == 8 | |
229 | #ifdef HAVE_GFC_LOGICAL_16 | |
230 | || mask_kind == 16 | |
231 | #endif | |
232 | ) | |
233 | mbase = GFOR_POINTER_TO_L1 (mbase, mask_kind); | |
234 | else | |
235 | runtime_error ("Funny sized logical array"); | |
236 | ||
dfb55fdc TK |
237 | delta = GFC_DESCRIPTOR_STRIDE(array,dim); |
238 | mdelta = GFC_DESCRIPTOR_STRIDE_BYTES(mask,dim); | |
6de9cd9a DN |
239 | |
240 | for (n = 0; n < dim; n++) | |
241 | { | |
dfb55fdc TK |
242 | sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n); |
243 | mstride[n] = GFC_DESCRIPTOR_STRIDE_BYTES(mask,n); | |
244 | extent[n] = GFC_DESCRIPTOR_EXTENT(array,n); | |
80ee04b9 TK |
245 | |
246 | if (extent[n] < 0) | |
247 | extent[n] = 0; | |
248 | ||
6de9cd9a DN |
249 | } |
250 | for (n = dim; n < rank; n++) | |
251 | { | |
dfb55fdc TK |
252 | sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n + 1); |
253 | mstride[n] = GFC_DESCRIPTOR_STRIDE_BYTES(mask, n + 1); | |
254 | extent[n] = GFC_DESCRIPTOR_EXTENT(array, n + 1); | |
80ee04b9 TK |
255 | |
256 | if (extent[n] < 0) | |
257 | extent[n] = 0; | |
6de9cd9a DN |
258 | } |
259 | ||
50dd63a9 TK |
260 | if (retarray->data == NULL) |
261 | { | |
dfb55fdc | 262 | size_t alloc_size, str; |
80ee04b9 | 263 | |
50dd63a9 TK |
264 | for (n = 0; n < rank; n++) |
265 | { | |
50dd63a9 | 266 | if (n == 0) |
dfb55fdc | 267 | str = 1; |
50dd63a9 | 268 | else |
dfb55fdc TK |
269 | str= GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1]; |
270 | ||
271 | GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str); | |
272 | ||
50dd63a9 TK |
273 | } |
274 | ||
dfb55fdc | 275 | alloc_size = sizeof (GFC_INTEGER_4) * GFC_DESCRIPTOR_STRIDE(retarray,rank-1) |
80ee04b9 TK |
276 | * extent[rank-1]; |
277 | ||
efd4dc1a | 278 | retarray->offset = 0; |
50dd63a9 | 279 | retarray->dtype = (array->dtype & ~GFC_DTYPE_RANK_MASK) | rank; |
80ee04b9 TK |
280 | |
281 | if (alloc_size == 0) | |
282 | { | |
283 | /* Make sure we have a zero-sized array. */ | |
dfb55fdc | 284 | GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1); |
80ee04b9 TK |
285 | return; |
286 | } | |
287 | else | |
288 | retarray->data = internal_malloc_size (alloc_size); | |
289 | ||
50dd63a9 TK |
290 | } |
291 | else | |
292 | { | |
50dd63a9 | 293 | if (rank != GFC_DESCRIPTOR_RANK (retarray)) |
fd6590f8 TK |
294 | runtime_error ("rank of return array incorrect in SUM intrinsic"); |
295 | ||
9731c4a3 | 296 | if (unlikely (compile_options.bounds_check)) |
fd6590f8 | 297 | { |
16bff921 TK |
298 | bounds_ifunction_return ((array_t *) retarray, extent, |
299 | "return value", "SUM"); | |
300 | bounds_equal_extents ((array_t *) mask, (array_t *) array, | |
301 | "MASK argument", "SUM"); | |
fd6590f8 | 302 | } |
50dd63a9 TK |
303 | } |
304 | ||
6de9cd9a DN |
305 | for (n = 0; n < rank; n++) |
306 | { | |
307 | count[n] = 0; | |
dfb55fdc | 308 | dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n); |
6de9cd9a DN |
309 | if (extent[n] <= 0) |
310 | return; | |
311 | } | |
312 | ||
313 | dest = retarray->data; | |
314 | base = array->data; | |
6de9cd9a DN |
315 | |
316 | while (base) | |
317 | { | |
64acfd99 | 318 | const GFC_INTEGER_4 * restrict src; |
28dc6b33 | 319 | const GFC_LOGICAL_1 * restrict msrc; |
6de9cd9a DN |
320 | GFC_INTEGER_4 result; |
321 | src = base; | |
322 | msrc = mbase; | |
323 | { | |
324 | ||
325 | result = 0; | |
326 | if (len <= 0) | |
327 | *dest = 0; | |
328 | else | |
329 | { | |
330 | for (n = 0; n < len; n++, src += delta, msrc += mdelta) | |
331 | { | |
332 | ||
333 | if (*msrc) | |
334 | result += *src; | |
335 | } | |
336 | *dest = result; | |
337 | } | |
338 | } | |
339 | /* Advance to the next element. */ | |
340 | count[0]++; | |
341 | base += sstride[0]; | |
342 | mbase += mstride[0]; | |
343 | dest += dstride[0]; | |
344 | n = 0; | |
345 | while (count[n] == extent[n]) | |
346 | { | |
347 | /* When we get to the end of a dimension, reset it and increment | |
348 | the next dimension. */ | |
349 | count[n] = 0; | |
350 | /* We could precalculate these products, but this is a less | |
5d7adf7a | 351 | frequently used path so probably not worth it. */ |
6de9cd9a DN |
352 | base -= sstride[n] * extent[n]; |
353 | mbase -= mstride[n] * extent[n]; | |
354 | dest -= dstride[n] * extent[n]; | |
355 | n++; | |
356 | if (n == rank) | |
357 | { | |
358 | /* Break out of the look. */ | |
359 | base = NULL; | |
360 | break; | |
361 | } | |
362 | else | |
363 | { | |
364 | count[n]++; | |
365 | base += sstride[n]; | |
366 | mbase += mstride[n]; | |
367 | dest += dstride[n]; | |
368 | } | |
369 | } | |
370 | } | |
371 | } | |
644cb69f | 372 | |
97a62038 TK |
373 | |
374 | extern void ssum_i4 (gfc_array_i4 * const restrict, | |
375 | gfc_array_i4 * const restrict, const index_type * const restrict, | |
376 | GFC_LOGICAL_4 *); | |
377 | export_proto(ssum_i4); | |
378 | ||
379 | void | |
380 | ssum_i4 (gfc_array_i4 * const restrict retarray, | |
381 | gfc_array_i4 * const restrict array, | |
382 | const index_type * const restrict pdim, | |
383 | GFC_LOGICAL_4 * mask) | |
384 | { | |
802367d7 TK |
385 | index_type count[GFC_MAX_DIMENSIONS]; |
386 | index_type extent[GFC_MAX_DIMENSIONS]; | |
387 | index_type sstride[GFC_MAX_DIMENSIONS]; | |
388 | index_type dstride[GFC_MAX_DIMENSIONS]; | |
389 | GFC_INTEGER_4 * restrict dest; | |
97a62038 TK |
390 | index_type rank; |
391 | index_type n; | |
802367d7 TK |
392 | index_type dim; |
393 | ||
97a62038 TK |
394 | |
395 | if (*mask) | |
396 | { | |
397 | sum_i4 (retarray, array, pdim); | |
398 | return; | |
399 | } | |
802367d7 TK |
400 | /* Make dim zero based to avoid confusion. */ |
401 | dim = (*pdim) - 1; | |
402 | rank = GFC_DESCRIPTOR_RANK (array) - 1; | |
403 | ||
404 | for (n = 0; n < dim; n++) | |
405 | { | |
dfb55fdc TK |
406 | sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n); |
407 | extent[n] = GFC_DESCRIPTOR_EXTENT(array,n); | |
802367d7 TK |
408 | |
409 | if (extent[n] <= 0) | |
410 | extent[n] = 0; | |
411 | } | |
412 | ||
413 | for (n = dim; n < rank; n++) | |
414 | { | |
dfb55fdc | 415 | sstride[n] = GFC_DESCRIPTOR_STRIDE(array,n + 1); |
802367d7 | 416 | extent[n] = |
dfb55fdc | 417 | GFC_DESCRIPTOR_EXTENT(array,n + 1); |
802367d7 TK |
418 | |
419 | if (extent[n] <= 0) | |
420 | extent[n] = 0; | |
421 | } | |
97a62038 TK |
422 | |
423 | if (retarray->data == NULL) | |
424 | { | |
dfb55fdc | 425 | size_t alloc_size, str; |
802367d7 TK |
426 | |
427 | for (n = 0; n < rank; n++) | |
428 | { | |
802367d7 | 429 | if (n == 0) |
dfb55fdc | 430 | str = 1; |
802367d7 | 431 | else |
dfb55fdc TK |
432 | str = GFC_DESCRIPTOR_STRIDE(retarray,n-1) * extent[n-1]; |
433 | ||
434 | GFC_DIMENSION_SET(retarray->dim[n], 0, extent[n] - 1, str); | |
435 | ||
802367d7 TK |
436 | } |
437 | ||
97a62038 | 438 | retarray->offset = 0; |
802367d7 TK |
439 | retarray->dtype = (array->dtype & ~GFC_DTYPE_RANK_MASK) | rank; |
440 | ||
dfb55fdc | 441 | alloc_size = sizeof (GFC_INTEGER_4) * GFC_DESCRIPTOR_STRIDE(retarray,rank-1) |
802367d7 TK |
442 | * extent[rank-1]; |
443 | ||
444 | if (alloc_size == 0) | |
445 | { | |
446 | /* Make sure we have a zero-sized array. */ | |
dfb55fdc | 447 | GFC_DIMENSION_SET(retarray->dim[0], 0, -1, 1); |
802367d7 TK |
448 | return; |
449 | } | |
450 | else | |
451 | retarray->data = internal_malloc_size (alloc_size); | |
97a62038 TK |
452 | } |
453 | else | |
454 | { | |
802367d7 TK |
455 | if (rank != GFC_DESCRIPTOR_RANK (retarray)) |
456 | runtime_error ("rank of return array incorrect in" | |
457 | " SUM intrinsic: is %ld, should be %ld", | |
458 | (long int) (GFC_DESCRIPTOR_RANK (retarray)), | |
459 | (long int) rank); | |
460 | ||
9731c4a3 | 461 | if (unlikely (compile_options.bounds_check)) |
fd6590f8 | 462 | { |
802367d7 TK |
463 | for (n=0; n < rank; n++) |
464 | { | |
465 | index_type ret_extent; | |
97a62038 | 466 | |
dfb55fdc | 467 | ret_extent = GFC_DESCRIPTOR_EXTENT(retarray,n); |
802367d7 TK |
468 | if (extent[n] != ret_extent) |
469 | runtime_error ("Incorrect extent in return value of" | |
470 | " SUM intrinsic in dimension %ld:" | |
471 | " is %ld, should be %ld", (long int) n + 1, | |
472 | (long int) ret_extent, (long int) extent[n]); | |
473 | } | |
fd6590f8 TK |
474 | } |
475 | } | |
97a62038 | 476 | |
802367d7 TK |
477 | for (n = 0; n < rank; n++) |
478 | { | |
479 | count[n] = 0; | |
dfb55fdc | 480 | dstride[n] = GFC_DESCRIPTOR_STRIDE(retarray,n); |
802367d7 TK |
481 | } |
482 | ||
483 | dest = retarray->data; | |
484 | ||
485 | while(1) | |
486 | { | |
487 | *dest = 0; | |
488 | count[0]++; | |
489 | dest += dstride[0]; | |
490 | n = 0; | |
491 | while (count[n] == extent[n]) | |
492 | { | |
493 | /* When we get to the end of a dimension, reset it and increment | |
494 | the next dimension. */ | |
495 | count[n] = 0; | |
496 | /* We could precalculate these products, but this is a less | |
497 | frequently used path so probably not worth it. */ | |
498 | dest -= dstride[n] * extent[n]; | |
499 | n++; | |
500 | if (n == rank) | |
501 | return; | |
502 | else | |
503 | { | |
504 | count[n]++; | |
505 | dest += dstride[n]; | |
506 | } | |
507 | } | |
508 | } | |
97a62038 TK |
509 | } |
510 | ||
644cb69f | 511 | #endif |