forked from rarias/jungle
		
	nbody: add ctf tests
This commit is contained in:
		
							parent
							
								
									b8a1ea3f72
								
							
						
					
					
						commit
						bdaadd4ef7
					
				
							
								
								
									
										110
									
								
								garlic/exp/nbody/nblocks.nix
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										110
									
								
								garlic/exp/nbody/nblocks.nix
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,110 @@ | |||||||
|  | { | ||||||
|  |   stdenv | ||||||
|  | , stdexp | ||||||
|  | , bsc | ||||||
|  | , targetMachine | ||||||
|  | , stages | ||||||
|  | , garlicTools | ||||||
|  | 
 | ||||||
|  | # Options for the experiment | ||||||
|  | , enableJemalloc ? false | ||||||
|  | , enableCTF ? false | ||||||
|  | # Number of cases tested | ||||||
|  | , steps ? 7 | ||||||
|  | # nbody iterations | ||||||
|  | , timesteps ? 10 | ||||||
|  | # nbody total number of particles | ||||||
|  | , particles ? null | ||||||
|  | , gitBranch ? "garlic/tampi+send+oss+task" | ||||||
|  | , loops ? 10 | ||||||
|  | , nblocks0 ? null | ||||||
|  | }: | ||||||
|  | 
 | ||||||
|  | with stdenv.lib; | ||||||
|  | with garlicTools; | ||||||
|  | 
 | ||||||
|  | let | ||||||
|  | 
 | ||||||
|  |   defaultOpt = var: def: if (var != null) then var else def; | ||||||
|  | 
 | ||||||
|  |   machineConfig = targetMachine.config; | ||||||
|  |   inherit (machineConfig) hw; | ||||||
|  | 
 | ||||||
|  |   # Initial variable configuration | ||||||
|  |   varConf = with bsc; { | ||||||
|  |     # Create a list with values 2^n with n from 0 to (steps - 1) inclusive | ||||||
|  |     i = expRange 2 0 (steps - 1); | ||||||
|  |   }; | ||||||
|  | 
 | ||||||
|  |   # Generate the complete configuration for each unit | ||||||
|  |   genConf = var: fix (self: var // targetMachine.config // { | ||||||
|  |     expName = "nbody-nblocks"; | ||||||
|  |     unitName = "${self.expName}${toString self.nblocks}"; | ||||||
|  | 
 | ||||||
|  |     inherit (machineConfig) hw; | ||||||
|  | 
 | ||||||
|  |     # nbody options | ||||||
|  |     particles = defaultOpt particles (4096 * self.hw.cpusPerSocket); | ||||||
|  |     nblocks0 = defaultOpt nblocks0 (self.hw.cpusPerSocket / 2); | ||||||
|  |     # The number of blocks is then computed from the multiplier "i" and | ||||||
|  |     # the initial number of blocks "nblocks0" | ||||||
|  |     nblocks = self.i * self.nblocks0; | ||||||
|  | 
 | ||||||
|  |     totalTasks = self.ntasksPerNode * self.nodes; | ||||||
|  |     particlesPerTask = self.particles / self.totalTasks; | ||||||
|  |     blocksize = self.particlesPerTask / self.nblocks; | ||||||
|  |     cc = bsc.icc; | ||||||
|  |     mpi = bsc.impi; | ||||||
|  |     cflags = "-g"; | ||||||
|  |     inherit timesteps gitBranch enableJemalloc enableCTF loops; | ||||||
|  | 
 | ||||||
|  |     # Resources | ||||||
|  |     qos = "debug"; | ||||||
|  |     cpusPerTask = self.hw.cpusPerSocket; | ||||||
|  |     ntasksPerNode = self.hw.socketsPerNode; | ||||||
|  |     nodes = 1; | ||||||
|  |     jobName = self.unitName; | ||||||
|  |   }); | ||||||
|  | 
 | ||||||
|  |   # Compute the array of configurations | ||||||
|  |   configs = stdexp.buildConfigs { | ||||||
|  |     inherit varConf genConf; | ||||||
|  |   }; | ||||||
|  | 
 | ||||||
|  |   perf = {nextStage, conf, ...}: with conf; stages.perf { | ||||||
|  |     inherit nextStage; | ||||||
|  |     perfOptions = "record --call-graph dwarf -o \\$\\$.perf"; | ||||||
|  |   }; | ||||||
|  | 
 | ||||||
|  |   ctf = {nextStage, conf, ...}: with conf; stages.exec { | ||||||
|  |     inherit nextStage; | ||||||
|  |     env = optionalString (conf.enableCTF) '' | ||||||
|  |       export NANOS6_CONFIG_OVERRIDE="version.instrument=ctf,\ | ||||||
|  |         instrument.ctf.conversor.enabled=false" | ||||||
|  |     ''; | ||||||
|  |   }; | ||||||
|  | 
 | ||||||
|  |   exec = {nextStage, conf, ...}: with conf; stages.exec { | ||||||
|  |     inherit nextStage; | ||||||
|  |     argv = [ "-t" timesteps "-p" particles ]; | ||||||
|  |   }; | ||||||
|  | 
 | ||||||
|  |   program = {nextStage, conf, ...}: with conf; | ||||||
|  |     let | ||||||
|  |       /* These changes are propagated to all dependencies. For example, | ||||||
|  |       when changing nanos6+jemalloc, we will get tampi built with | ||||||
|  |       nanos6+jemalloc as well. */ | ||||||
|  |       customPkgs = bsc.extend (self: super: { | ||||||
|  |         mpi = conf.mpi; | ||||||
|  |         nanos6 = self.nanos6.override { inherit enableJemalloc; }; | ||||||
|  |       }); | ||||||
|  |     in | ||||||
|  |       customPkgs.apps.nbody.override ({ | ||||||
|  |         inherit cc blocksize mpi gitBranch cflags; | ||||||
|  |       }); | ||||||
|  | 
 | ||||||
|  |   pipeline = stdexp.stdPipeline ++ [ ctf exec program ]; | ||||||
|  | 
 | ||||||
|  | in | ||||||
|  |   | ||||||
|  |   stdexp.genExperiment { inherit configs pipeline; } | ||||||
| @ -1,101 +0,0 @@ | |||||||
| { |  | ||||||
|   stdenv |  | ||||||
| , stdexp |  | ||||||
| , bsc |  | ||||||
| , targetMachine |  | ||||||
| , stages |  | ||||||
| , garlicTools |  | ||||||
| , enableJemalloc ? false |  | ||||||
| , particles ? null |  | ||||||
| }: |  | ||||||
| 
 |  | ||||||
| with stdenv.lib; |  | ||||||
| with garlicTools; |  | ||||||
| 
 |  | ||||||
| let |  | ||||||
| 
 |  | ||||||
|   machineConfig = targetMachine.config; |  | ||||||
|   inherit (machineConfig) hw; |  | ||||||
| 
 |  | ||||||
|   # Number of cases tested |  | ||||||
|   steps = 7; |  | ||||||
| 
 |  | ||||||
|   # First value for nblocks: we want to begin by using 1/2 blocks/cpu so we set |  | ||||||
|   # the first number of blocks to cpusPerSocket / 2 |  | ||||||
|   nblocks0 = hw.cpusPerSocket / 2; |  | ||||||
| 
 |  | ||||||
|   # Initial variable configuration |  | ||||||
|   varConf = with bsc; { |  | ||||||
|     # Create a list with values 2^n with n from 0 to (steps - 1) inclusive |  | ||||||
|     i = expRange 2 0 (steps - 1); |  | ||||||
|   }; |  | ||||||
| 
 |  | ||||||
|   # Set here the particles, so we don't have an infinite recursion in the |  | ||||||
|   # genConf attrset. |  | ||||||
|   _particles = if (particles != null) |  | ||||||
|     then particles |  | ||||||
|     else 4096 * hw.cpusPerSocket; |  | ||||||
| 
 |  | ||||||
|   # Generate the complete configuration for each unit |  | ||||||
|   genConf = with bsc; c: targetMachine.config // rec { |  | ||||||
|     expName = "nbody-nblocks"; |  | ||||||
|     unitName = "${expName}${toString nblocks}"; |  | ||||||
| 
 |  | ||||||
|     inherit (machineConfig) hw; |  | ||||||
|     # nbody options |  | ||||||
|     particles = _particles; |  | ||||||
|     timesteps = 10; |  | ||||||
|     nblocks = c.i * nblocks0; |  | ||||||
|     totalTasks = ntasksPerNode * nodes; |  | ||||||
|     particlesPerTask = particles / totalTasks; |  | ||||||
|     blocksize = particlesPerTask / nblocks; |  | ||||||
|     cc = icc; |  | ||||||
|     mpi = impi; |  | ||||||
|     gitBranch = "garlic/tampi+send+oss+task"; |  | ||||||
|     cflags = "-g"; |  | ||||||
|     inherit enableJemalloc; |  | ||||||
|      |  | ||||||
|     # Repeat the execution of each unit 10 times |  | ||||||
|     loops = 10; |  | ||||||
| 
 |  | ||||||
|     # Resources |  | ||||||
|     qos = "debug"; |  | ||||||
|     cpusPerTask = hw.cpusPerSocket; |  | ||||||
|     ntasksPerNode = hw.socketsPerNode; |  | ||||||
|     nodes = 1; |  | ||||||
| 
 |  | ||||||
|     jobName = unitName; |  | ||||||
|   }; |  | ||||||
| 
 |  | ||||||
|   # Compute the array of configurations |  | ||||||
|   configs = stdexp.buildConfigs { |  | ||||||
|     inherit varConf genConf; |  | ||||||
|   }; |  | ||||||
| 
 |  | ||||||
|   perf = {nextStage, conf, ...}: with conf; stages.perf { |  | ||||||
|     inherit nextStage; |  | ||||||
|     perfOptions = "record --call-graph dwarf -o \\$\\$.perf"; |  | ||||||
|   }; |  | ||||||
| 
 |  | ||||||
|   exec = {nextStage, conf, ...}: with conf; stages.exec { |  | ||||||
|     inherit nextStage; |  | ||||||
|     argv = [ "-t" timesteps "-p" particles ]; |  | ||||||
|   }; |  | ||||||
| 
 |  | ||||||
|   program = {nextStage, conf, ...}: with conf; |  | ||||||
|   let |  | ||||||
|     customPkgs = stdexp.replaceMpi conf.mpi; |  | ||||||
|   in |  | ||||||
|     customPkgs.apps.nbody.override ({ |  | ||||||
|       inherit cc blocksize mpi gitBranch cflags; |  | ||||||
|     } // optionalAttrs enableJemalloc { |  | ||||||
|       mcxx = bsc.mcxx.override { |  | ||||||
|         nanos6 = bsc.nanos6Jemalloc; |  | ||||||
|       }; |  | ||||||
|     }); |  | ||||||
| 
 |  | ||||||
|   pipeline = stdexp.stdPipeline ++ [ exec program ]; |  | ||||||
| 
 |  | ||||||
| in |  | ||||||
|   |  | ||||||
|   stdexp.genExperiment { inherit configs pipeline; } |  | ||||||
							
								
								
									
										27
									
								
								overlay.nix
									
									
									
									
									
								
							
							
						
						
									
										27
									
								
								overlay.nix
									
									
									
									
									
								
							| @ -372,14 +372,30 @@ let | |||||||
|       # Experiments |       # Experiments | ||||||
|       exp = { |       exp = { | ||||||
|         nbody = rec { |         nbody = rec { | ||||||
|           tampi = callPackage ./garlic/exp/nbody/tampi.nix { }; |           baseline = callPackage ./garlic/exp/nbody/nblocks.nix { }; | ||||||
| 
 | 
 | ||||||
|           # Experiment variants |           # Experiment variants | ||||||
|           baseline = tampi; |           small = baseline.override { | ||||||
|           small = baseline.override { particles = 12 * 4096; }; |             particles = 12 * 4096; | ||||||
|  |           }; | ||||||
|           # TODO: Update freeCpu using a non-standard pipeline |           # TODO: Update freeCpu using a non-standard pipeline | ||||||
|           #freeCpu = baseline.override { freeCpu = true; }; |           #freeCpu = baseline.override { freeCpu = true; }; | ||||||
|           jemalloc = baseline.override { enableJemalloc = true; }; |           jemalloc = baseline.override { enableJemalloc = true; }; | ||||||
|  | 
 | ||||||
|  |           # Some experiments with traces | ||||||
|  |           trace = { | ||||||
|  |             # Only one unit repeated 30 times | ||||||
|  |             baseline = small.override { | ||||||
|  |               enableCTF = true; | ||||||
|  |               loops = 30; | ||||||
|  |               steps = 1; | ||||||
|  |             }; | ||||||
|  | 
 | ||||||
|  |             # Same but with jemalloc enabled | ||||||
|  |             jemalloc = trace.baseline.override { | ||||||
|  |               enableJemalloc = true; | ||||||
|  |             }; | ||||||
|  |           }; | ||||||
|         }; |         }; | ||||||
| 
 | 
 | ||||||
|         saiph = { |         saiph = { | ||||||
| @ -450,6 +466,7 @@ let | |||||||
|           small = merge [ small ]; |           small = merge [ small ]; | ||||||
|           jemalloc = merge [ baseline jemalloc ]; |           jemalloc = merge [ baseline jemalloc ]; | ||||||
|           #freeCpu  = merge [ baseline freeCpu ]; |           #freeCpu  = merge [ baseline freeCpu ]; | ||||||
|  |           ctf = merge [ ctf ]; | ||||||
|         }; |         }; | ||||||
| 
 | 
 | ||||||
|         hpcg = with exp.hpcg; { |         hpcg = with exp.hpcg; { | ||||||
| @ -490,6 +507,10 @@ let | |||||||
|           #  script = ./garlic/fig/nbody/freeCpu.R; |           #  script = ./garlic/fig/nbody/freeCpu.R; | ||||||
|           #  dataset = ds.nbody.freeCpu; |           #  dataset = ds.nbody.freeCpu; | ||||||
|           #}; |           #}; | ||||||
|  |           ctf = pp.rPlot { | ||||||
|  |             script = ./garlic/fig/nbody/baseline.R; | ||||||
|  |             dataset = ds.nbody.ctf; | ||||||
|  |           }; | ||||||
|         }; |         }; | ||||||
| 
 | 
 | ||||||
|         hpcg = { |         hpcg = { | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user