summaryrefslogtreecommitdiff
path: root/usr/src/libm/src/mvec/vrhypotf_.c
blob: 5af9ad6de7c70db493bfda49c93e8c04c5c18fdc (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

/*
 * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

#pragma ident	"@(#)vrhypotf_.c	1.4	06/01/31 SMI"

/*
 * Serial vector routine; only declared here, defined elsewhere.  As it is
 * called in this file the arguments are: the element count, followed by a
 * (pointer, stride) pair for each of the three float vectors x, y and z.
 */
extern void __vrhypotf( int, float *, int, float *, int, float *, int );

/* Make vrhypotf_ a weak alias for the __vrhypotf_ wrapper defined below. */
#pragma weak vrhypotf_ = __vrhypotf_

#ifndef LIBMTSK_BASED

/*
 * Serial build (LIBMTSK_BASED not defined).
 *
 * By-reference wrapper around __vrhypotf: the count and the three strides
 * arrive as pointers, are read once, and are forwarded by value together
 * with the vector pointers x, y and z.  No other work is done here.
 */
void
__vrhypotf_( int *n, float *x, int *stridex, float *y, int *stridey,
	float *z, int *stridez )
{
	const int count = *n;
	const int incx = *stridex;
	const int incy = *stridey;
	const int incz = *stridez;

	__vrhypotf( count, x, incx, y, incy, z, incz );
}

#else

#include <stddef.h>

#include "mtsk.h"

/*
 * Argument hand-off between __vrhypotf_ and __vrhypotf_mfunc.  The wrapper
 * stores the vector base pointers (xp, yp, zp) and their strides
 * (sx, sy, sz) here before starting the parallel run; the m-function reads
 * them back to locate its slice of each vector.
 */
static float *xp, *yp, *zp;
static int sx, sy, sz;

/*
 * m-function for parallel vrhypotf.
 *
 * Handles the elements with indices LowerBound..UpperBound (inclusive) by
 * calling the serial __vrhypotf on that sub-range.  The vector base
 * pointers (xp, yp, zp) and strides (sx, sy, sz) come from the file-scope
 * variables that __vrhypotf_ fills in before it starts the parallel run.
 * MFunctionBlockPtr and Step are not used here.
 *
 * The element offsets are computed in ptrdiff_t rather than int, so that
 * stride * LowerBound cannot overflow int for very large strided vectors
 * on platforms where pointers are wider than int.
 */
void
__vrhypotf_mfunc( struct MFunctionBlock *MFunctionBlockPtr, int LowerBound,
	int UpperBound, int Step )
{
	/* widen once; each stride * first below is then done in ptrdiff_t */
	ptrdiff_t first = LowerBound;

	__vrhypotf( UpperBound - LowerBound + 1, xp + sx * first, sx,
		yp + sy * first, sy, zp + sz * first, sz );
}

/*
 * Parallel build (LIBMTSK_BASED defined).
 *
 * By-reference wrapper around __vrhypotf that splits the work across
 * processors when that looks worthwhile.  The call is forwarded unchanged
 * to the serial routine when any of the following holds:
 *   - fewer than two CPUs are reported by __mt_getncpus_(),
 *   - the vector has fewer than 8 elements per CPU,
 *   - __mt_inepc_() or __mt_inapc_() is nonzero (already inside a
 *     parallel construct).
 * Otherwise the arguments are stored in the file-scope hand-off variables
 * and __mt_dopar_vfun_ is asked to run __vrhypotf_mfunc over the index
 * range 0 .. *n - 1 with step 1.
 */
void
__vrhypotf_( int *n, float *x, int *stridex, float *y, int *stridey,
	float *z, int *stridez )
{
	struct MFunctionBlock m;
	int ncpus;
	int run_serial;

	ncpus = __mt_getncpus_();

	/* cheap tests first; the runtime is only queried if they pass */
	run_serial = ( ncpus < 2 || *n < ( ncpus << 3 ) );
	if ( !run_serial )
		run_serial = ( __mt_inepc_() || __mt_inapc_() );

	if ( run_serial )
	{
		__vrhypotf( *n, x, *stridex, y, *stridey, z, *stridez );
		return;
	}

	/*
	 * Not inside a parallel region at this point, so writing the shared
	 * hand-off variables is expected to be safe.
	 */
	sx = *stridex;
	sy = *stridey;
	sz = *stridez;
	xp = x;
	yp = y;
	zp = z;

	/* describe the iteration space: indices 0 .. *n - 1, step 1 */
	m.Step = 1;
	m.LowerBound = 0;
	m.UpperBound = *n - 1;
	m.MFunctionPtr = &__vrhypotf_mfunc;
	__mt_dopar_vfun_( m.MFunctionPtr, m.LowerBound, m.UpperBound, m.Step );
}

#endif