2020-11-05 19:56:26 +01:00
|
|
|
{
|
|
|
|
stdenv
|
|
|
|
, stdexp
|
|
|
|
, bsc
|
|
|
|
, targetMachine
|
|
|
|
, stages
|
2021-03-05 16:18:51 +01:00
|
|
|
, garlicTools
|
2021-03-09 18:45:33 +01:00
|
|
|
, enablePerf ? false
|
2021-03-12 12:13:10 +01:00
|
|
|
, enableCTF ? false
|
2020-11-05 19:56:26 +01:00
|
|
|
}:
|
|
|
|
|
|
|
|
with stdenv.lib;
|
2021-03-05 16:18:51 +01:00
|
|
|
with garlicTools;
|
2020-11-05 19:56:26 +01:00
|
|
|
|
|
|
|
let
|
|
|
|
# Variable part of the configuration: the candidate column (cbs) and row
# (rbs) block sizes. genConf reads one cbs and one rbs value per unit.
varConf = with bsc;
  let
    # range2 is found through the enclosing `with` scopes (presumably
    # garlicTools; presumably yields powers of two from 32 up to 4096 --
    # TODO confirm). Both block dimensions use the same candidates.
    blockSizes = range2 32 4096;
  in {
    cbs = blockSizes;
    rbs = blockSizes;

    # Alternative value sets kept for reference:
    #cbs = [ 64 256 1024 4096 ];
    #rbs = [ 32 128 512 1024 ];
    #cbs = [ 4096 ];
    #rbs = [ 512 ];
  };
|
|
|
|
|
|
|
|
# Configuration of the target machine; genConf takes `hw` from it
machineConfig = targetMachine.config;
|
|
|
|
|
|
|
|
# Generate the complete configuration for each unit: the target machine
# configuration, extended (and overridden on name clashes) by the
# attributes below. `c` carries the cbs and rbs values of the unit
# (presumably one combination of the varConf lists, as handed over by
# stdexp.buildConfigs).
genConf = c: machineConfig // rec {
  expName = "heat";
  # The block sizes are part of the name, e.g. heat.cbs-64.rbs-32
  unitName = "${expName}.cbs-${toString cbs}.rbs-${toString rbs}";

  # Bring hw into the rec scope so cpusPerTask below can refer to it
  inherit (machineConfig) hw;

  # heat options
  timesteps = 10;
  cols = 1024 * 16; # Columns
  rows = 1024 * 16; # Rows
  inherit (c) cbs rbs;
  gitBranch = "garlic/tampi+isend+oss+task";

  # Number of times the execution of each unit is repeated
  loops = 1;

  # Resources
  qos = "debug";
  ntasksPerNode = 1;
  nodes = 1;
  time = "02:00:00";
  # Assign one socket to each task (only one process)
  cpusPerTask = hw.cpusPerSocket;
  jobName = unitName;
};
|
|
|
|
|
|
|
|
# Array of unit configurations, built by stdexp.buildConfigs from the
# variable part (varConf) and the per-unit generator (genConf)
configs = stdexp.buildConfigs { inherit varConf genConf; };
|
|
|
|
|
2021-03-09 18:45:33 +01:00
|
|
|
# Optional stage (see enablePerf): wraps the next stage with stages.perf.
# The options are those of `perf stat`: output to .garlic/perf.csv (-o),
# "," as field separator (-x) and the list of events to count (-e).
perf = {nextStage, conf, ...}:
  let
    events = "cycles,instructions,cache-references,cache-misses";
  in stages.perf {
    inherit nextStage;
    perfOptions = "stat -o .garlic/perf.csv -x , -e ${events}";
  };
|
|
|
|
|
2021-03-12 12:13:10 +01:00
|
|
|
# Optional stage (see enableCTF): selects the ctf instrumentation of
# Nanos6 for the next stage through NANOS6_CONFIG_OVERRIDE and, once it
# has finished, post-processes every trace_* directory with the cn6 tools.
ctf = {nextStage, conf, ...}: stages.exec {
  inherit nextStage;

  # The value is kept on a single line so that it cannot pick up stray
  # whitespace from the indentation of a continuation line
  env = ''
    export NANOS6_CONFIG_OVERRIDE="version.instrument=ctf,instrument.ctf.converter.enabled=false"
  '';

  # Only the process with SLURM_PROCID 0 converts and reduces the traces.
  # For each trace, the events between the start_time and end_time lines
  # of stdout.log are kept, and the durations reported by `dur` for event
  # 6400025 with values 0, 1 and 3 are summed into the dead, runtime and
  # task CSV files respectively.
  post = ''
    if [ "$SLURM_PROCID" = 0 ]; then
      sleep 2

      # The time window comes from stdout.log and is the same for all traces
      start_time=$(awk '/^start_time / {print $2}' stdout.log)
      end_time=$(awk '/^end_time / {print $2}' stdout.log)

      for tracedir in trace_*; do
        # The pattern is left as is when no trace matches it
        [ -e "$tracedir" ] || continue

        offset=$(grep 'offset =' "$tracedir/ctf/ust/uid/1000/64-bit/metadata" | \
          grep -o '[0-9]*')
        echo "offset = $offset"

        begin=$(awk "BEGIN{print $start_time*1e9 - $offset}")
        end=$(awk "BEGIN{print $end_time*1e9 - $offset}")

        echo "only events between $begin and $end"

        ${bsc.cn6}/bin/cn6 -s "$tracedir"

        ${bsc.cn6}/bin/cut $begin $end < "$tracedir/prv/trace.prv" |\
          ${bsc.cn6}/bin/hcut 1 ${toString conf.cpusPerTask} \
          > "$tracedir/prv/trace-cut.prv"

        ${bsc.cn6}/bin/dur 6400025 0 < "$tracedir/prv/trace-cut.prv" |\
          awk '{s+=$1} END {print s}' >> .garlic/time_mode_dead.csv &

        ${bsc.cn6}/bin/dur 6400025 1 < "$tracedir/prv/trace-cut.prv" |\
          awk '{s+=$1} END {print s}' >> .garlic/time_mode_runtime.csv &

        ${bsc.cn6}/bin/dur 6400025 3 < "$tracedir/prv/trace-cut.prv" |\
          awk '{s+=$1} END {print s}' >> .garlic/time_mode_task.csv &

        wait

        # Remove the traces at the end, as they are huge
        rm -rf "$tracedir"
      done
    fi
  '';
};
|
|
|
|
|
2021-03-05 16:18:51 +01:00
|
|
|
# Stage that passes the heat command line to stages.exec: problem size,
# block sizes and number of timesteps, all read from the unit configuration
exec = {nextStage, conf, ...}:
  let
    inherit (conf) rows cols rbs cbs timesteps;
  in stages.exec {
    inherit nextStage;

    argv = [
      "--rows"      rows
      "--cols"      cols
      "--rbs"       rbs
      "--cbs"       cbs
      "--timesteps" timesteps
    ];

    # nextStage is the program, so its etc/heat.conf is linked into the
    # working directory; a failing link is ignored
    env = ''
      ln -sf ${nextStage}/etc/heat.conf heat.conf || true
    '';
  };
|
|
|
|
|
2021-03-05 16:18:51 +01:00
|
|
|
# Last stage: the heat application, overridden to use the git branch
# selected in the unit configuration
program = {nextStage, conf, ...}:
  bsc.garlic.apps.heat.override { gitBranch = conf.gitBranch; };
|
2020-11-05 19:56:26 +01:00
|
|
|
|
2021-03-09 18:45:33 +01:00
|
|
|
# Stage pipeline: the standard stages, then the instrumentation stages
# that were enabled, then the execution of the program itself
pipeline =
  let
    # Each one contributes a stage only when its flag is true
    instrumentation = optional enablePerf perf ++ optional enableCTF ctf;
  in
    stdexp.stdPipeline ++ instrumentation ++ [ exec program ];
|
2020-11-05 19:56:26 +01:00
|
|
|
|
|
|
|
in
|
|
|
|
|
|
|
|
# Result of the file: the experiment generated from the unit
# configurations and the stage pipeline defined above
stdexp.genExperiment { inherit configs pipeline; }
|