Skip to content

Commit a131985

Browse files
committed
Various enhancements
* MPICH: Configure --with-device=ch4:ofi,ucx * Remove references to source/build directories
1 parent eaf7bc2 commit a131985

File tree

7 files changed

+302
-30
lines changed

7 files changed

+302
-30
lines changed

.github/workflows/cd-wheel.yml

+1-1
Original file line numberDiff line numberDiff line change
@@ -174,7 +174,7 @@ jobs:
174174
CIBW_REPAIR_WHEEL_COMMAND_MACOS: >
175175
delocate-wheel
176176
--ignore-missing-dependencies
177-
--exclude libmpi --exclude libpmpi
177+
--exclude libmpi --exclude libpmpi --exclude libfabric
178178
--require-archs {delocate_archs}
179179
-w {dest_dir} -v {wheel}
180180

bootstrap.sh

+29
Original file line numberDiff line numberDiff line change
@@ -38,6 +38,35 @@ if test ! -d "$SOURCE"; then
3838
if test -f "$patch"; then
3939
patch -p1 -i "$patch" -d "$SOURCE"
4040
fi
41+
if test "$mpiname" = "mpich"; then
42+
if test "${version}" \> "4.2.2"; then
43+
conf_args='s/\(ofi_subdir_args\)=\("--enable-embedded"\)/\1=""/'
44+
configure="$SOURCE"/configure
45+
sed -i.orig "$conf_args" "$configure"
46+
fi
47+
if test "${version}" \< "4.2.0"; then
48+
disable_doc='s/^\(install-data-local:\s\+\)\$/\1#\$/'
49+
Makefile="$SOURCE"/Makefile.in
50+
sed -i.orig "$disable_doc" "$Makefile"
51+
fi
52+
fi
53+
if test "$mpiname" = "openmpi"; then
54+
makefiles=(
55+
"$SOURCE"/3rd-party/openpmix/src/util/keyval/Makefile.in
56+
"$SOURCE"/3rd-party/prrte/src/mca/rmaps/rank_file/Makefile.in
57+
"$SOURCE"/3rd-party/prrte/src/util/hostfile/Makefile.in
58+
)
59+
variables=(
60+
PRTE_CFLAGS_BEFORE_PICKY
61+
PMIX_CFLAGS_BEFORE_PICKY
62+
)
63+
for makefile in "${makefiles[@]}"; do
64+
test -f "$makefile" || continue
65+
for variable in "${variables[@]}"; do
66+
echo "$variable = @CFLAGS@" >> "$makefile"
67+
done
68+
done
69+
fi
4170
if test "$mpiname-$(uname)" = "openmpi-Darwin"; then
4271
if test -d "$SOURCE"/3rd-party; then
4372
cd "$SOURCE"/3rd-party

build-wheel.sh

+3-3
Original file line numberDiff line numberDiff line change
@@ -13,14 +13,14 @@ export CIBW_ARCHS=$ARCHLIST
1313
export CIBW_BEFORE_ALL='bash {project}/cibw-build-mpi.sh'
1414
export CIBW_TEST_COMMAND='bash {project}/cibw-check-mpi.sh'
1515
export CIBW_ENVIRONMENT_PASS='MPINAME RELEASE SOURCE WORKDIR DESTDIR'
16-
export CIBW_REPAIR_WHEEL_COMMAND_MACOS='delocate-wheel --ignore-missing-dependencies --exclude libmpi --exclude libpmpi --require-archs {delocate_archs -w {dest_dir} -v {wheel}'
16+
export CIBW_REPAIR_WHEEL_COMMAND_MACOS='delocate-wheel --ignore-missing-dependencies --exclude libmpi --exclude libpmpi --exclude libfabric --require-archs {delocate_archs -w {dest_dir} -v {wheel}'
1717

1818
if test "$(uname)" = Linux; then
1919
containerengine=$(basename "$(command -v podman || command -v docker)")
2020
export CIBW_CONTAINER_ENGINE=$containerengine
2121
export SOURCE="/project/$SOURCE"
22-
export WORKDIR="/host/$PWD/$WORKDIR"
23-
export DESTDIR="/host/$PWD/$DESTDIR"
22+
export WORKDIR="/host$PWD/$WORKDIR"
23+
export DESTDIR="/host$PWD/$DESTDIR"
2424
platform=linux
2525
fi
2626
if test "$(uname)" = Darwin; then

check-wheel.sh

+26-5
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,9 @@ unzip -qq "$wheelfile" -d "$workdir"
1616
cd "$workdir"
1717

1818
whlname=$(basename "$wheelfile")
19-
pkgname=${whlname%%-*}
19+
whlinfo=${whlname%%-py*}
20+
pkgname=${whlinfo%%-*}
21+
version=${whlinfo##*-}
2022
mpiname=${pkgname}
2123

2224
data=$(ls -d "$pkgname"-*.data/data)
@@ -29,6 +31,9 @@ if test "$(uname)" = Linux; then
2931
libsdir=.libs
3032
print-runpath() { patchelf --print-rpath "$1"; }
3133
print-needed() { patchelf --print-needed "$1"; }
34+
if test -f "$data"/lib/libfabric.so; then
35+
runlibs=$runlibs'|libfabric'$soregex
36+
fi
3237
if test -f "$data"/lib/libucp.so; then
3338
runlibs=$runlibs'|libuc(m|p|s|t)'$soregex
3439
fi
@@ -41,6 +46,9 @@ if test "$(uname)" = Darwin; then
4146
libsdir=.dylibs
4247
print-runpath() { otool -l "$1" | sed -n '/RPATH/{n;n;p;}'; }
4348
print-needed() { otool -L "$1" | sed 1,1d; }
49+
if test -f "$data"/lib/libfabric.dylib; then
50+
runlibs=$runlibs'|libfabric'$soregex
51+
fi
4452
if test -f "$data"/lib/libucp.dylib; then
4553
runlibs=$runlibs'|libuc(m|p|s|t)'$soregex
4654
fi
@@ -67,7 +75,12 @@ if test "$mpiname" = "mpich"; then
6775
libraries=(
6876
"$data"/lib/libmpi.*
6977
)
70-
if test -d "$data"/lib/ucx; then
78+
if ls "$data"/lib/libfabric.* > /dev/null 2>&1; then
79+
libraries+=(
80+
"$data"/lib/libfabric.*
81+
)
82+
fi
83+
if ls "$data"/lib/libuct.* > /dev/null 2>&1; then
7184
libraries+=(
7285
"$data"/lib/libuc[mpst]*.*
7386
"$data"/lib/ucx/libuc*.*
@@ -96,14 +109,22 @@ if test "$mpiname" = "openmpi"; then
96109
"$data"/lib/libmpi.*
97110
"$data"/lib/libopen-*.*
98111
)
112+
if test "${version%%.*}" -ge 5; then
113+
libraries+=(
114+
"$data"/lib/libevent*.*
115+
"$data"/lib/libhwloc.*
116+
"$data"/lib/libpmix.*
117+
"$data"/lib/libprrte.*
118+
)
119+
fi
99120
runlibs+='|lib(z|util|event.*|hwloc)'$soregex
100121
runlibs+='|lib(open-(pal|rte)|pmix|prrte)'$soregex
101122
fi
102123

103124
check-binary() {
104125
local dso=$1 out1="" out2=""
105126
echo checking "$dso"...
106-
test -f "$dso" || printf "ERROR: file not found\n"
127+
test -f "$dso" || (printf "ERROR: file not found\n"; exit 1)
107128
out1="$(print-runpath "$dso" | grep -vE "$runpath" || true)"
108129
test -z "$out1" || printf "ERROR: RUNPATH\n%s\n" "$out1"
109130
out2="$(print-needed "$dso" | grep -vE "$runlibs" || true)"
@@ -114,15 +135,15 @@ check-binary() {
114135
for header in "${headers[@]-}"; do
115136
test -n "$header" || break
116137
echo checking "$header"...
117-
test -f "$header"
138+
test -f "$header" || (printf "ERROR: file not found\n"; exit 1)
118139
out=$(grep -E '^#include\s+"mpicxx\.h"' "$header" || true)
119140
test -z "$out" || printf "ERROR: include\n%s\n" "$out"
120141
test -z "$out"
121142
done
122143
for script in "${scripts[@]-}"; do
123144
test -n "$script" || break
124145
echo checking "$script"...
125-
test -f "$script"
146+
test -f "$script" || (printf "ERROR: file not found\n"; exit 1)
126147
out=$(grep -E "/opt/$mpiname" "$script" || true)
127148
test -z "$out" || printf "ERROR: prefix\n%s\n" "$out"
128149
test -z "$out"

cibw-build-mpi.sh

+108-21
Original file line numberDiff line numberDiff line change
@@ -11,13 +11,31 @@ WORKDIR=${WORKDIR:-$PACKAGE/workdir}
1111
DESTDIR=${DESTDIR:-$PACKAGE/install}
1212
PREFIX=${PREFIX:-"/opt/$mpiname"}
1313

14+
case $(uname) in
15+
Linux) njobs=$(nproc);;
16+
Darwin) njobs=$(sysctl -n hw.physicalcpu);;
17+
esac
18+
19+
if test "$(uname)" = Darwin; then
20+
export MACOSX_DEPLOYMENT_TARGET="11.0"
21+
if test "$(uname -m)" = x86_64; then
22+
export MACOSX_DEPLOYMENT_TARGET="10.9"
23+
export ac_cv_func_aligned_alloc="no" # macOS>=10.15
24+
fi
25+
fi
26+
1427
if test "$mpiname" = "mpich"; then
1528
version=$(sed -n 's/MPICH_VERSION=\(.*\)/\1/p' "$SOURCE"/maint/Version)
29+
case $(uname)-$(uname -m) in
30+
Linux-x86_64) netmod=ofi,ucx ;;
31+
Linux-aarch64) netmod=ofi,ucx ;;
32+
*) netmod=ofi ;;
33+
esac
1634
options=(
1735
CC=cc
1836
CXX=c++
1937
--prefix="$PREFIX"
20-
--with-device=ch4:"${variant:-ofi}"
38+
--with-device="ch4:$netmod"
2139
--with-pm=hydra:gforker
2240
--with-libfabric=embedded
2341
--with-ucx=embedded
@@ -40,11 +58,16 @@ if test "$mpiname" = "mpich"; then
4058
export MPICH_MPICXX_LDFLAGS="-Wl,-rpath,$PREFIX/lib"
4159
export MPICH_MPIFORT_LDFLAGS="-Wl,-rpath,$PREFIX/lib"
4260
fi
43-
disable_doc='s/^\(install-data-local:\s\+\)\$/\1#\$/'
44-
sed -i.orig "$disable_doc" "$SOURCE"/Makefile.in
61+
generated_files+=(src/include/mpichinfo.h)
62+
generated_files+=(src/pm/hydra/hydra_config.h)
63+
file_prefix_map+=("-ffile-prefix-map=$SOURCE=$mpiname-$version")
64+
file_prefix_map+=("-ffile-prefix-map=$WORKDIR=$mpiname-$version")
65+
export MPICHLIB_CFLAGS="${file_prefix_map[*]}"
4566
fi
4667

4768
if test "$mpiname" = "openmpi"; then
69+
# shellcheck disable=SC1091,SC2154
70+
version=$(source "$SOURCE"/VERSION && echo "$major.$minor.$release")
4871
options=(
4972
CC=cc
5073
CXX=c++
@@ -67,27 +90,50 @@ if test "$mpiname" = "openmpi"; then
6790
--enable-mpi-fortran=mpifh
6891
--disable-dependency-tracking
6992
)
93+
generated_files+=(ompi/tools/ompi_info/Makefile)
94+
generated_files+=(oshmem/tools/oshmem_info/Makefile)
95+
generated_files+=(3rd-party/openpmix/src/tools/*/Makefile)
96+
generated_files+=(3rd-party/prrte/src/tools/*/Makefile)
97+
generated_files+=(opal/include/opal_config.h)
98+
generated_files+=(3rd-party/openpmix/src/include/pmix_config.h)
99+
generated_files+=(3rd-party/prrte/src/include/prte_config.h)
100+
file_prefix_map+=("-ffile-prefix-map=$SOURCE=$mpiname-$version")
101+
file_prefix_map+=("-ffile-prefix-map=$WORKDIR=$mpiname-$version")
102+
export CFLAGS="${file_prefix_map[*]}"
70103
fi
71104

72-
if test "$(uname)" = Darwin; then
73-
export MACOSX_DEPLOYMENT_TARGET="11.0"
74-
if test "$(uname -m)" = x86_64; then
75-
export MACOSX_DEPLOYMENT_TARGET="10.9"
76-
export ac_cv_func_aligned_alloc="no" # macOS>=10.15
77-
fi
78-
fi
79-
80-
case $(uname) in
81-
Linux) njobs=$(nproc);;
82-
Darwin) njobs=$(sysctl -n hw.physicalcpu);;
83-
esac
84-
85-
mkdir -p "$WORKDIR"
86-
cd "$WORKDIR"
105+
mkdir -p "$WORKDIR" && cd "$WORKDIR"
87106

88107
echo running configure
89108
"$SOURCE"/configure "${options[@]}" || cat config.log
90109

110+
# shellcheck disable=SC2206
111+
generated_files=(${generated_files[@]:-})
112+
for filename in "${generated_files[@]}"; do
113+
test -n "$filename" || continue
114+
test -f "$filename" || continue
115+
cflags="s|\s*${file_prefix_map[*]}\s*| |g"
116+
source="s|$SOURCE|$mpiname-$version|g"
117+
workdir="s|$WORKDIR|$mpiname-$version|g"
118+
if test "$(basename "$filename")" = "Makefile"; then
119+
echo removing CFLAGS from "$filename"
120+
sed -i.orig "/-D.*_BUILD_CFLAGS=/$cflags" "$filename"
121+
echo replacing SOURCE in "$filename"
122+
sed -i.orig "/-D.*_BUILD_CPPFLAGS=/$source" "$filename"
123+
sed -i.orig "/-D.*_BUILD_LIBS=/$source" "$filename"
124+
echo replacing WORKDIR in "$filename"
125+
sed -i.orig "/-D.*_BUILD_CPPFLAGS=/$workdir" "$filename"
126+
sed -i.orig "/-D.*_BUILD_LIBS=/$workdir" "$filename"
127+
else
128+
echo removing CFLAGS from "$filename"
129+
sed -i.orig "$cflags" "$filename"
130+
echo replacing SOURCE in "$filename"
131+
sed -i.orig "$source" "$filename"
132+
echo replacing WORKDIR in "$filename"
133+
sed -i.orig "$workdir" "$filename"
134+
fi
135+
done
136+
91137
echo running make with "${njobs:-1}" jobs
92138
make -j "${njobs:-1}" install DESTDIR="$DESTDIR"
93139

@@ -97,7 +143,6 @@ cd "${DESTDIR}${PREFIX}"
97143
rm -f include/*cxx.h
98144
rm -f include/*.mod
99145
rm -f include/*f.h
100-
rm -fr include/rdma
101146
rm -f bin/mpif77
102147
rm -f bin/mpif90
103148
rm -f bin/mpifort
@@ -112,6 +157,12 @@ rm -f lib/lib*mpifort.*
112157
rm -fr lib/pkgconfig
113158
rm -fr share
114159

160+
cd "${DESTDIR}${PREFIX}"
161+
rm -fr include/rdma
162+
rm -f bin/fi_*
163+
rm -f lib/libfabric.a
164+
rm -f lib/libfabric.la
165+
115166
cd "${DESTDIR}${PREFIX}"
116167
rm -f bin/io_demo
117168
rm -f bin/ucx_read_profile
@@ -134,6 +185,7 @@ for script in "${scripts[@]}"; do
134185
test ! -L "$script" || continue
135186
# shellcheck disable=SC2016
136187
topdir='$(CDPATH= cd -- "$(dirname -- "${BASH_SOURCE:-$0}")/.." \&\& pwd)'
188+
sed -i.orig s:"\s$WORKDIR/.*/lib\(.*\)\.la":" -l\1":g "$script"
137189
sed -i.orig s@^prefix=.*@prefix="$topdir"@ "$script"
138190
sed -i.orig s:"$PREFIX":\"\$\{prefix\}\":g "$script"
139191
sed -i.orig s:-Wl,-commons,use_dylibs::g "$script"
@@ -153,6 +205,19 @@ if test "$(uname)" = Linux; then
153205
mv "$(readlink "$libmpi")" "$libmpi"
154206
ln -sf "$libmpi" "${libmpi%.*}"
155207
fi
208+
if test -f libfabric.so; then
209+
patchelf --set-rpath "\$ORIGIN" "$libmpi"
210+
for lib in libfabric.so.?; do
211+
if test -f "$lib".*.*; then
212+
mv "$(readlink "$lib")" "$lib"
213+
ln -sf "$lib" "${lib%.*}"
214+
fi
215+
patchelf --set-rpath "\$ORIGIN" "$lib"
216+
for exe in "${executables[@]}"; do
217+
patchelf --remove-needed "$lib" "../bin/$exe"
218+
done
219+
done
220+
fi
156221
if test -f libucp.so; then
157222
patchelf --set-rpath "\$ORIGIN" "$libmpi"
158223
for lib in libuc[mpst]*.so.?; do
@@ -182,16 +247,31 @@ if test "$(uname)" = Darwin; then
182247
libpmpi="libpmpi.12.dylib"
183248
cd "${DESTDIR}${PREFIX}/bin"
184249
for exe in "${executables[@]}"; do
185-
install_name_tool -change "$libdir/$libmpi" "@rpath/$libmpi" "$exe"
186-
install_name_tool -change "$libdir/$libpmpi" "@rpath/$libpmpi" "$exe"
187250
install_name_tool -add_rpath "@executable_path/../lib/" "$exe"
251+
for lib in "$libmpi" "$libpmpi"; do
252+
install_name_tool -change "$libdir/$lib" "@rpath/$lib" "$exe"
253+
done
188254
done
189255
cd "${DESTDIR}${PREFIX}/lib"
190256
for lib in "$libmpi" "$libpmpi"; do
191257
install_name_tool -id "@rpath/$lib" "$lib"
192258
install_name_tool -add_rpath "@loader_path/" "$lib"
193259
done
194260
install_name_tool -change "$libdir/$libpmpi" "@rpath/$libpmpi" "$libmpi"
261+
libfabric="libfabric.1.dylib"
262+
if test -f "$libfabric"; then
263+
install_name_tool -id "@rpath/$libfabric" "$libfabric"
264+
install_name_tool -add_rpath "@loader_path/" "$libfabric"
265+
oldname="$libdir/$libfabric"; newname="@rpath/$libfabric";
266+
cd "${DESTDIR}${PREFIX}/bin"
267+
for exe in "${executables[@]}"; do
268+
install_name_tool -change "$oldname" "$newname" "$exe"
269+
done
270+
cd "${DESTDIR}${PREFIX}/lib"
271+
for lib in "$libmpi" "$libpmpi"; do
272+
install_name_tool -change "$oldname" "$newname" "$lib"
273+
done
274+
fi
195275
fi
196276

197277
} # fixup-mpich()
@@ -365,3 +445,10 @@ done
365445

366446
echo fixing install tree
367447
fixup-"$mpiname"
448+
449+
echo checking install tree
450+
cd "${DESTDIR}${PREFIX}"
451+
echo cheking files with SOURCE
452+
! grep -lr "$SOURCE"
453+
echo cheking files with WORKDIR
454+
! grep -lr "$WORKDIR"

cibw-check-mpi.sh

+19
Original file line numberDiff line numberDiff line change
@@ -68,3 +68,22 @@ RUN mpicxx helloworld.cxx -o helloworld-cxx
6868
RUN command -v mpiexec
6969
RUN mpiexec -n 3 ./helloworld-c
7070
RUN mpiexec -n 3 ./helloworld-cxx
71+
72+
if test "$mpiname" = "mpich"; then
73+
case $(uname)-$(uname -m) in
74+
Linux-x86_64) ch4netmods=(ofi ucx) ;;
75+
Linux-aarch64) ch4netmods=(ofi ucx) ;;
76+
*) ch4netmods=(ofi) ;;
77+
esac
78+
export MPICH_CH4_OFI_CAPABILITY_DEBUG=1
79+
export MPICH_CH4_UCX_CAPABILITY_DEBUG=1
80+
for netmod in "${ch4netmods[@]}"; do
81+
printf "testing ch4:%s ... " "$netmod"
82+
export MPICH_CH4_NETMOD="$netmod"
83+
./helloworld-c | grep -i "$netmod" > /dev/null
84+
printf "OK\n"
85+
done
86+
unset MPICH_CH4_OFI_CAPABILITY_DEBUG
87+
unset MPICH_CH4_UCX_CAPABILITY_DEBUG
88+
unset MPICH_CH4_NETMOD
89+
fi

0 commit comments

Comments
 (0)