WIP: Testing with automatic fetching

This commit is contained in:
Rodrigo Arias 2020-10-26 19:43:02 +01:00
parent 59346fa97e
commit 3bd4e61f3f
7 changed files with 149 additions and 20 deletions

View File

@ -25,7 +25,7 @@ let
gitBranch = "garlic/mpi+send"; gitBranch = "garlic/mpi+send";
# Repeat the execution of each unit 30 times # Repeat the execution of each unit 30 times
loops = 30; loops = 10;
# Resources # Resources
qos = "debug"; qos = "debug";
@ -34,6 +34,10 @@ let
time = "02:00:00"; time = "02:00:00";
cpuBind = "sockets,verbose"; cpuBind = "sockets,verbose";
jobName = "nbody-bs-${toString blocksize}-${gitBranch}"; jobName = "nbody-bs-${toString blocksize}-${gitBranch}";
# Experiment revision: this allows a user to run again a experiment already
# executed
rev = 0;
}; };
# Compute the array of configurations # Compute the array of configurations
@ -47,10 +51,11 @@ let
}; };
program = {nextStage, conf, ...}: with conf; program = {nextStage, conf, ...}: with conf;
let # FIXME: This is becoming very slow:
customPkgs = stdexp.replaceMpi conf.mpi; #let
in # customPkgs = stdexp.replaceMpi conf.mpi;
customPkgs.apps.nbody.override { #in
bsc.garlic.apps.nbody.override {
inherit cc blocksize mpi gitBranch; inherit cc blocksize mpi gitBranch;
}; };

33
garlic/pp/check.nix Normal file
View File

@ -0,0 +1,33 @@
{
stdenv
}:
resultTree:
stdenv.mkDerivation {
name = "check";
preferLocalBuild = true;
phases = [ "installPhase" ];
installPhase = ''
echo "checking result tree: ${resultTree}"
cd ${resultTree}
for exp in *-experiment; do
cd ${resultTree}/$exp
echo "$exp: checking units"
for unit in *-unit; do
cd ${resultTree}/$exp/$unit
if [ ! -e status ]; then
echo "missing $unit/status file, aborting"
exit 1
fi
st=$(cat status)
if [ "$st" != "completed" ]; then
echo "unit $unit is not complete yet, aborting"
exit 1
fi
done
echo "$exp: execution complete"
done
ln -s $out ${resultTree}
'';
}

View File

@ -31,14 +31,17 @@ in
name = "fetch"; name = "fetch";
preferLocalBuild = true; preferLocalBuild = true;
buildInputs = [ rsync openssh curl ]; buildInputs = [ rsync openssh curl nix ];
phases = [ "installPhase" ]; phases = [ "installPhase" ];
# This doesn't work when multiple users have different directories where the
# results are stored.
#src = /. + "${prefix}${experimentName}";
installPhase = '' installPhase = ''
cat > $out << EOF cat > $out << EOF
#!/bin/sh -e #!/bin/sh -e
mkdir -p ${garlicTemp} mkdir -p ${garlicTemp}
export PATH=${rsync}/bin:${openssh}/bin:${nix}/bin export PATH=$PATH
rsync -av \ rsync -av \
--copy-links \ --copy-links \
${rsyncFilter} \ ${rsyncFilter} \
@ -50,8 +53,11 @@ in
garlicTemp = "${garlicTemp}"; \ garlicTemp = "${garlicTemp}"; \
})') })')
rm -rf ${garlicTemp}/${experimentName}
echo "The results for experiment ${experimentName} are at:" echo "The results for experiment ${experimentName} are at:"
echo " \$res" echo " \$res"
EOF EOF
chmod +x $out chmod +x $out
''; '';

81
garlic/pp/result2.nix Normal file
View File

@ -0,0 +1,81 @@
{
stdenv
, garlicTools
}:
{
trebuchetStage
, experimentStage
, garlicTemp
}:
with garlicTools;
let
experimentName = baseNameOf (toString experimentStage);
garlicOut = "/mnt/garlic-out";
in
stdenv.mkDerivation {
name = "result";
preferLocalBuild = true;
__noChroot = true;
phases = [ "installPhase" ];
installPhase = ''
expList=$(find ${garlicOut} -maxdepth 2 -name ${experimentName})
if [ -z "$expList" ]; then
echo "ERROR: missing results for ${experimentName}"
echo "Execute it by running:"
echo
echo -e " \e[30;48;5;2m${trebuchetStage}\e[0m"
echo
echo "cannot continue building $out, aborting"
exit 1
fi
N=$(echo $expList | wc -l)
echo "Found $N results: $expList"
if [ $N -gt 1 ]; then
echo
echo "ERROR: multiple results for ${experimentName}:"
echo "$expList"
echo
echo "cannot continue building $out, aborting"
exit 1
fi
exp=$expList
repeat=1
while [ 1 ]; do
repeat=0
cd $exp
echo "$exp: checking units"
for unit in *-unit; do
cd $exp/$unit
if [ ! -e status ]; then
echo "$unit: no status"
repeat=1
else
st=$(cat status)
echo "$unit: $st"
if [ "$st" != "completed" ]; then
repeat=1
fi
fi
done
if [ $repeat -eq 0 ]; then
break
fi
echo "waiting 10 seconds to try again"
sleep 10
done
echo "$exp: execution complete"
mkdir -p $out
cp -aL $exp $out
'';
}

View File

@ -38,7 +38,7 @@ stdenv.mkDerivation {
export GARLIC_EXPERIMENT=$(basename $out) export GARLIC_EXPERIMENT=$(basename $out)
if [ -e "\$GARLIC_EXPERIMENT" ]; then if [ -e "\$GARLIC_EXPERIMENT" ]; then
>&2 echo "skipping, experiment path already exists: \$GARLIC_EXPERIMENT" >&2 echo "skipping, path exists: \$(pwd)/\$GARLIC_EXPERIMENT"
exit 0 exit 0
fi fi

View File

@ -5,13 +5,13 @@ if [ -e /nix ]; then
exit 1 exit 1
fi fi
>&2 echo Running runexp for MN4 #>&2 echo Running runexp for MN4
>&2 echo PATH=$PATH #>&2 echo PATH=$PATH
user=$(id -un) user=$(id -un)
group=$(id -gn) group=$(id -gn)
export GARLIC_OUT="/gpfs/projects/$group/$user/garlic-out" export GARLIC_OUT="/gpfs/projects/bsc15/garlic/out/$user"
mkdir -p "$GARLIC_OUT" mkdir -p "$GARLIC_OUT"
cd "$GARLIC_OUT" cd "$GARLIC_OUT"

View File

@ -314,15 +314,14 @@ let
# Post processing tools # Post processing tools
pp = rec { pp = rec {
getExpResult = callPackage ./garlic/pp/result.nix { getExpResult = callPackage ./garlic/pp/result2.nix {
inherit fetchExperiment;
}; };
resultFromTrebuchet = trebuchetStage: getExpResult { resultFromTrebuchet = trebuchetStage: (getExpResult {
garlicTemp = "/tmp/garlic-temp"; garlicTemp = "/tmp/garlic-temp";
inherit trebuchetStage; inherit trebuchetStage;
experimentStage = with self.bsc.garlicTools; experimentStage = with self.bsc.garlicTools;
getExperimentStage trebuchetStage; getExperimentStage trebuchetStage;
}; });
fetchExperiment = callPackage ./garlic/pp/fetch.nix { }; fetchExperiment = callPackage ./garlic/pp/fetch.nix { };
timetable = callPackage ./garlic/pp/timetable.nix { }; timetable = callPackage ./garlic/pp/timetable.nix { };
rPlot = callPackage ./garlic/pp/rplot.nix { }; rPlot = callPackage ./garlic/pp/rplot.nix { };
@ -337,11 +336,16 @@ let
# Datasets used in the figures # Datasets used in the figures
ds = with self.bsc.garlic; with pp; { ds = with self.bsc.garlic; with pp; {
nbody = with exp.nbody; { nbody = with exp.nbody; {
test = merge [ baseline ]; test = merge [ test ];
baseline = merge [ baseline ];
jemalloc = merge [ jemalloc ];
freeCpu = merge [ freeCpu ];
cmp = {
jemalloc = merge [ baseline jemalloc ]; jemalloc = merge [ baseline jemalloc ];
freeCpu = merge [ baseline freeCpu ]; freeCpu = merge [ baseline freeCpu ];
}; };
}; };
};
# Figures generated from the experiments # Figures generated from the experiments
fig = with self.bsc.garlic; { fig = with self.bsc.garlic; {