forked from rarias/bscpkgs
		
	hpcg: add strongscaling
HPCG rounds problem size axis when its value is < 16
This commit is contained in:
		
							parent
							
								
									b60a46b683
								
							
						
					
					
						commit
						cb6577b439
					
				
							
								
								
									
										112
									
								
								garlic/exp/hpcg/oss.slices.strongscaling.nix
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										112
									
								
								garlic/exp/hpcg/oss.slices.strongscaling.nix
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,112 @@ | |||||||
|  | { | ||||||
|  |   stdenv | ||||||
|  | , stdexp | ||||||
|  | , bsc | ||||||
|  | , targetMachine | ||||||
|  | , stages | ||||||
|  | , genInput | ||||||
|  | }: | ||||||
|  | 
 | ||||||
|  | with stdenv.lib; | ||||||
|  | 
 | ||||||
|  | let | ||||||
|  |   # Initial variable configuration | ||||||
|  |   varConf = { | ||||||
|  |     n = [ | ||||||
|  |         { x = 192; y = 192; z = 16 * 192; } | ||||||
|  |     ]; | ||||||
|  |     nprocs = [ | ||||||
|  |         # { x = 2; y = 1; z = 1; } | ||||||
|  |         # { x = 4; y = 1; z = 1; } | ||||||
|  |         # { x = 8; y = 1; z = 1; } | ||||||
|  |         # { x = 16; y = 1; z = 1; } | ||||||
|  |         # { x = 32; y = 1; z = 1; } | ||||||
|  | 
 | ||||||
|  |         # { x = 1; y = 2; z = 1; } | ||||||
|  |         # { x = 1; y = 4; z = 1; } | ||||||
|  |         # { x = 1; y = 8; z = 1; } | ||||||
|  |         # { x = 1; y = 16; z = 1; } | ||||||
|  |         # { x = 1; y = 32; z = 1; } | ||||||
|  | 
 | ||||||
|  |         { x = 1; y = 1; z = 2; } | ||||||
|  |         { x = 1; y = 1; z = 4; } | ||||||
|  |         { x = 1; y = 1; z = 8; } | ||||||
|  |         { x = 1; y = 1; z = 16; } | ||||||
|  |         { x = 1; y = 1; z = 32; } | ||||||
|  | 
 | ||||||
|  |     ]; | ||||||
|  |     # nblocks = [ 12 24 48 96 192 384 768 1536 ]; | ||||||
|  |     nblocks = [ 24 48 96 192 ]; | ||||||
|  |     ncommblocks = [ 1 ]; | ||||||
|  |     # nodes = [ 1 ]; | ||||||
|  |     # nodes = [ 1 2 4 8 16 ]; | ||||||
|  |   }; | ||||||
|  | 
 | ||||||
|  |   # Generate the complete configuration for each unit | ||||||
|  |   genConf = c: targetMachine.config // rec { | ||||||
|  |     expName = "hpcg.oss"; | ||||||
|  |     unitName = "${expName}.nb${toString nblocks}"; | ||||||
|  | 
 | ||||||
|  |     inherit (targetMachine.config) hw; | ||||||
|  | 
 | ||||||
|  |     # hpcg options | ||||||
|  |     inherit (c) nprocs nblocks ncommblocks; | ||||||
|  | 
 | ||||||
|  |     n = { | ||||||
|  |         x = c.n.x / nprocs.x; | ||||||
|  |         y = c.n.y / nprocs.y; | ||||||
|  |         z = c.n.z / nprocs.z; | ||||||
|  |     }; | ||||||
|  | 
 | ||||||
|  |     gitBranch = "garlic/tampi+isend+oss+task"; | ||||||
|  | 
 | ||||||
|  |     # Repeat the execution of each unit 30 times | ||||||
|  |     loops = 1; | ||||||
|  | 
 | ||||||
|  |     disableAspectRatio = true; | ||||||
|  | 
 | ||||||
|  |     # Resources | ||||||
|  |     qos = "debug"; | ||||||
|  |     ntasksPerNode = hw.socketsPerNode; | ||||||
|  |     time = "02:00:00"; | ||||||
|  |     # task in one socket | ||||||
|  |     cpusPerTask = hw.cpusPerSocket; | ||||||
|  |     nodes = (nprocs.x * nprocs.y * nprocs.z) / ntasksPerNode; | ||||||
|  |     jobName = "hpcg-${toString n.x}-${toString n.y}-${toString n.z}-${gitBranch}"; | ||||||
|  |   }; | ||||||
|  | 
 | ||||||
|  |   # Compute the array of configurations | ||||||
|  |   configs = stdexp.buildConfigs { | ||||||
|  |     inherit varConf genConf; | ||||||
|  |   }; | ||||||
|  | 
 | ||||||
|  |   input = genInput configs; | ||||||
|  | 
 | ||||||
|  |   exec = {nextStage, conf, ...}: stages.exec { | ||||||
|  |     inherit nextStage; | ||||||
|  |     argv = [ | ||||||
|  |       "--nx=${toString conf.n.x}" | ||||||
|  |       "--ny=${toString conf.n.y}" | ||||||
|  |       "--nz=${toString conf.n.z}" | ||||||
|  |       # Distribute all processes in X axis | ||||||
|  |       "--npx=${toString conf.nprocs.x}" | ||||||
|  |       "--npy=${toString conf.nprocs.y}" | ||||||
|  |       "--npz=${toString conf.nprocs.z}" | ||||||
|  |       "--nblocks=${toString conf.nblocks}" | ||||||
|  |       "--ncomms=${toString conf.ncommblocks}" | ||||||
|  |       # The input symlink is generated by the input stage, which is generated by | ||||||
|  |       # the genInput function. | ||||||
|  |       "--load=input" | ||||||
|  |       # Disable HPCG Aspect Ratio to run any mpi layout | ||||||
|  |     ] ++ optional (conf.disableAspectRatio) "--no-ar=1"; | ||||||
|  |   }; | ||||||
|  | 
 | ||||||
|  |   program = {nextStage, conf, ...}: bsc.apps.hpcg.override { | ||||||
|  |     inherit (conf) gitBranch; | ||||||
|  |   }; | ||||||
|  | 
 | ||||||
|  |   pipeline = stdexp.stdPipeline ++ [ input exec program ]; | ||||||
|  | 
 | ||||||
|  | in | ||||||
|  | 
 | ||||||
|  |   stdexp.genExperiment { inherit configs pipeline; } | ||||||
| @ -72,6 +72,9 @@ | |||||||
|     ossSlicesWeakscaling = callPackage ./hpcg/oss.slices.weakscaling.nix { |     ossSlicesWeakscaling = callPackage ./hpcg/oss.slices.weakscaling.nix { | ||||||
|       inherit genInput; |       inherit genInput; | ||||||
|     }; |     }; | ||||||
|  |     ossSlicesStrongscaling = callPackage ./hpcg/oss.slices.strongscaling.nix { | ||||||
|  |       inherit genInput; | ||||||
|  |     }; | ||||||
|   }; |   }; | ||||||
| 
 | 
 | ||||||
|   heat = rec { |   heat = rec { | ||||||
|  | |||||||
							
								
								
									
										109
									
								
								garlic/fig/hpcg/oss.slices.strongscaling.R
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										109
									
								
								garlic/fig/hpcg/oss.slices.strongscaling.R
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,109 @@ | |||||||
|  | # This R program takes as argument the dataset that contains the results of the | ||||||
|  | # execution of the heat example experiment and produces some plots. All the | ||||||
|  | # knowledge to understand how this script works is covered by this nice R book: | ||||||
|  | # | ||||||
|  | # Winston Chang, R Graphics Cookbook: Practical Recipes for Visualizing Data, | ||||||
|  | # O’Reilly Media (2020). 2nd edition | ||||||
|  | # | ||||||
|  | # Which can be freely read it online here: https://r-graphics.org/ | ||||||
|  | # | ||||||
|  | # Please, search in this book before copying some random (and probably oudated) | ||||||
|  | # reply on stack overflow. | ||||||
|  | 
 | ||||||
|  | # We load some R packages to import the required functions. We mainly use the | ||||||
|  | # tidyverse packages, which are very good for ploting data, | ||||||
|  | library(ggplot2) | ||||||
|  | library(dplyr, warn.conflicts = FALSE) | ||||||
|  | library(scales) | ||||||
|  | library(jsonlite) | ||||||
|  | library(viridis, warn.conflicts = FALSE) | ||||||
|  | 
 | ||||||
|  | # Here we simply load the arguments to find the input dataset. If nothing is | ||||||
|  | # specified we use the file named `input` in the current directory. | ||||||
|  | # We can run this script directly using: | ||||||
|  | # Rscript <path-to-this-script> <input-dataset> | ||||||
|  | 
 | ||||||
|  | # Load the arguments (argv) | ||||||
|  | args = commandArgs(trailingOnly=TRUE) | ||||||
|  | 
 | ||||||
|  | # Set the input dataset if given in argv[1], or use "input" as default | ||||||
|  | if (length(args)>0) { input_file = args[1] } else { input_file = "input" } | ||||||
|  | 
 | ||||||
|  | df = jsonlite::stream_in(file(input_file), verbose=FALSE) %>% | ||||||
|  | 
 | ||||||
|  |   # Then we flatten it, as it may contain dictionaries inside the columns | ||||||
|  |   jsonlite::flatten() %>% | ||||||
|  | 
 | ||||||
|  |   # Now the dataframe contains all the configuration of the units inside the | ||||||
|  |   # columns named `config.*`, for example `config.cbs`. We first select only | ||||||
|  |   # the columns that we need: | ||||||
|  |   select(config.nblocks, | ||||||
|  |          config.ncommblocks, | ||||||
|  |          config.hw.cpusPerSocket, | ||||||
|  |          config.nodes, | ||||||
|  |          config.nprocs.x, | ||||||
|  |          config.nprocs.y, | ||||||
|  |          config.nprocs.z, | ||||||
|  |          unit, | ||||||
|  |          time | ||||||
|  |          ) %>% | ||||||
|  | 
 | ||||||
|  |   # And then we rename those columns to something shorter: | ||||||
|  |   rename(nblocks=config.nblocks, | ||||||
|  |          ncommblocks=config.ncommblocks, | ||||||
|  |          cpusPerSocket=config.hw.cpusPerSocket, | ||||||
|  |          nodes=config.nodes, | ||||||
|  |          npx=config.nprocs.x, | ||||||
|  |          npy=config.nprocs.y, | ||||||
|  |          npz=config.nprocs.z | ||||||
|  |          ) %>% | ||||||
|  | 
 | ||||||
|  |   mutate(axisColor=as.factor(ifelse(npx != 1, "X", ifelse(npy != 1, "Y", "Z")))) %>% | ||||||
|  | 
 | ||||||
|  |   mutate(blocksPerCpu = nblocks / cpusPerSocket) %>% | ||||||
|  | 
 | ||||||
|  |   mutate(nblocks = as.factor(nblocks)) %>% | ||||||
|  |   mutate(blocksPerCpu = as.factor(blocksPerCpu)) %>% | ||||||
|  |   mutate(nodes = as.factor(nodes)) %>% | ||||||
|  |   mutate(unit = as.factor(unit)) %>% | ||||||
|  | 
 | ||||||
|  |   mutate(timePerNprocs = time * npz) %>% | ||||||
|  | 
 | ||||||
|  |   group_by(unit) %>% | ||||||
|  | 
 | ||||||
|  |   # And compute some metrics which are applied to each group. For example we | ||||||
|  |   # compute the median time within the runs of a unit: | ||||||
|  |   mutate(median.time = median(time)) %>% | ||||||
|  |   mutate(normalized.time = time / median.time - 1) %>% | ||||||
|  |   mutate(log.median.time = log(median.time)) %>% | ||||||
|  | 
 | ||||||
|  |   # Then, we remove the grouping. This step is very important, otherwise the | ||||||
|  |   # plotting functions get confused: | ||||||
|  |   ungroup() | ||||||
|  | 
 | ||||||
|  | dpi=300 | ||||||
|  | h=5 | ||||||
|  | w=5 | ||||||
|  | 
 | ||||||
|  | # We plot the time of each run as we vary the block size | ||||||
|  | p = ggplot(df, aes(x=nodes, y=timePerNprocs, color=blocksPerCpu)) + | ||||||
|  | 
 | ||||||
|  |   # We add a points (scatter plot) using circles (shape=21) a bit larger | ||||||
|  |   # than the default (size=3) | ||||||
|  |   geom_point(shape=21, size=3) + | ||||||
|  | 
 | ||||||
|  |   # The bw theme is recommended for publications | ||||||
|  |   theme_bw() + | ||||||
|  | 
 | ||||||
|  |   # Here we add the title and the labels of the axes | ||||||
|  |   labs(x="Nodes", y="Time * Num Procs", title="HPCG strong scalability: Z axis", | ||||||
|  |     color="Blocks Per CPU", | ||||||
|  |     subtitle=input_file) + | ||||||
|  | 
 | ||||||
|  |   # And set the subtitle font size a bit smaller, so it fits nicely | ||||||
|  |   theme(plot.subtitle=element_text(size=8)) | ||||||
|  | 
 | ||||||
|  | # Then, we save the plot both in png and pdf | ||||||
|  | ggsave("time.png", plot=p, width=w, height=h, dpi=dpi) | ||||||
|  | ggsave("time.pdf", plot=p, width=w, height=h, dpi=dpi) | ||||||
|  | 
 | ||||||
| @ -45,6 +45,9 @@ in | |||||||
| 
 | 
 | ||||||
|     # /nix/store/a3x76fbnfbacn2xhz3q65fklfp0qbb6p-plot |     # /nix/store/a3x76fbnfbacn2xhz3q65fklfp0qbb6p-plot | ||||||
|     ossWeakscalingPerAxisPerBlock = stdPlot ./hpcg/oss.slices.weakscaling.R [ ossSlicesWeakscaling ]; |     ossWeakscalingPerAxisPerBlock = stdPlot ./hpcg/oss.slices.weakscaling.R [ ossSlicesWeakscaling ]; | ||||||
|  | 
 | ||||||
|  |     # /nix/store/pxf41v2c37h5fh5x8hm6dv297hkdka04-plot | ||||||
|  |     ossStrongscalingPerBlock = stdPlot ./hpcg/oss.slices.strongscaling.R [ ossSlicesStrongscaling ]; | ||||||
|   }; |   }; | ||||||
| 
 | 
 | ||||||
|   saiph = with exp.saiph; { |   saiph = with exp.saiph; { | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user
	 Raúl Peñacoba
						Raúl Peñacoba