blob: 1cbf68fa4da5a5655223c846ac20fc721cc58fb0 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
|
# Copyright 1999-2015 Gentoo Foundation
# Distributed under the terms of the GNU General Public License v2
# $Id$
EAPI=5
PYTHON_COMPAT=( python2_7 )
FORTRAN_STANDARD="77 90"
inherit cuda eutils flag-o-matic fortran-2 multilib toolchain-funcs versionator python-any-r1
DESCRIPTION="Matrix Algebra on GPU and Multicore Architectures"
HOMEPAGE="http://icl.cs.utk.edu/magma/"
SRC_URI="http://icl.cs.utk.edu/projectsfiles/${PN}/downloads/${P}.tar.gz"
LICENSE="BSD"
SLOT="0"
KEYWORDS="~amd64 ~x86 ~amd64-linux ~x86-linux"
IUSE="fermi kepler static-libs test"
REQUIRED_USE="?? ( fermi kepler )"
RDEPEND="
dev-util/nvidia-cuda-toolkit
virtual/cblas
virtual/fortran
virtual/lapack"
DEPEND="${RDEPEND}
virtual/pkgconfig
test? ( ${PYTHON_DEPS} )"
# We have to have write acccess /dev/nvidia0 and /dev/nvidiactl and the portage
# user is (usually) not in the video group
RESTRICT="userpriv"
pkg_setup() {
fortran-2_pkg_setup
use test && python-any-r1_pkg_setup
}
src_prepare() {
# distributed pc file not so useful so replace it
cat <<-EOF > ${PN}.pc
prefix=${EPREFIX}/usr
libdir=\${prefix}/$(get_libdir)
includedir=\${prefix}/include/${PN}
Name: ${PN}
Description: ${DESCRIPTION}
Version: ${PV}
URL: ${HOMEPAGE}
Libs: -L\${libdir} -lmagma
Libs.private: -lm -lpthread -ldl -lcublas -lcudart
Cflags: -I\${includedir}
Requires: cblas lapack
EOF
if [[ $(tc-getCC) =~ gcc ]]; then
local eopenmp=-fopenmp
elif [[ $(tc-getCC) =~ icc ]]; then
local eopenmp=-openmp
else
elog "Cannot detect compiler type so not setting openmp support"
fi
append-flags -fPIC ${eopenmp}
append-ldflags -Wl,-soname,lib${PN}.so.1.4 ${eopenmp}
cuda_src_prepare
}
src_configure() {
cat <<-EOF > make.inc
ARCH = $(tc-getAR)
ARCHFLAGS = cr
RANLIB = $(tc-getRANLIB)
NVCC = nvcc
CC = $(tc-getCXX)
FORT = $(tc-getFC)
INC = -I"${EPREFIX}/opt/cuda/include" -DADD_ -DCUBLAS_GFORTRAN
OPTS = ${CFLAGS} -fPIC
FOPTS = ${FFLAGS} -fPIC -x f95-cpp-input
F77OPTS = ${FFLAGS} -fPIC
NVOPTS = -DADD_ -DUNIX ${NVCCFLAGS}
LDOPTS = ${LDFLAGS}
LOADER = $(tc-getFC)
LIBBLAS = $($(tc-getPKG_CONFIG) --libs cblas)
LIBLAPACK = $($(tc-getPKG_CONFIG) --libs lapack)
CUDADIR = ${EPREFIX}/opt/cuda
LIBCUDA = -L\$(CUDADIR)/$(get_libdir) -lcublas -lcudart
LIB = -pthread -lm -ldl \$(LIBCUDA) \$(LIBBLAS) \$(LIBLAPACK) -lstdc++
EOF
if use kepler; then
echo >> make.inc "GPU_TARGET = Kepler"
elif use fermi; then
echo >> make.inc "GPU_TARGET = Fermi"
else # See http://icl.cs.utk.edu/magma/forum/viewtopic.php?f=2&t=227
echo >> make.inc "GPU_TARGET = Tesla"
fi
}
src_compile() {
emake lib
emake shared
mv lib/lib${PN}.so{,.1.4} || die
ln -sf lib${PN}.so.1.4 lib/lib${PN}.so.1 || die
ln -sf lib${PN}.so.1.4 lib/lib${PN}.so || die
}
src_test() {
emake test lapacktest
cd testing/lin || die
# we need to access this while running the tests
addwrite /dev/nvidiactl
addwrite /dev/nvidia0
LD_LIBRARY_PATH="${S}"/lib ${EPYTHON} lapack_testing.py || die
}
src_install() {
dolib.so lib/lib*$(get_libname)*
use static-libs && dolib.a lib/lib*.a
insinto /usr/include/${PN}
doins include/*.h
insinto /usr/$(get_libdir)/pkgconfig
doins ${PN}.pc
dodoc README ReleaseNotes
}
|