Rodrigo Arias Mallo
121030537d
The loom name "loom.xyz.123" will produce the hostname "xyz", so Nanos6 programs can use the ovnisync tool too. Also, sort the loom array directly, so we avoid potential problems by sorting the loom and the hostnames individually (when there are repeated entries).
594 lines
12 KiB
C
594 lines
12 KiB
C
/*
|
|
* Copyright (c) 2021 Barcelona Supercomputing Center (BSC)
|
|
*
|
|
* This program is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#ifndef OVNI_EMU_H
|
|
#define OVNI_EMU_H
|
|
|
|
#include <stdio.h>
|
|
|
|
#include "common.h"
|
|
#include "ovni.h"
|
|
#include "uthash.h"
|
|
#include "parson.h"
|
|
#include "heap.h"
|
|
#include "pcf.h"
|
|
|
|
/* Emulated thread runtime status */
|
|
enum ethread_state {
|
|
TH_ST_UNKNOWN,
|
|
TH_ST_RUNNING,
|
|
TH_ST_PAUSED,
|
|
TH_ST_DEAD,
|
|
TH_ST_COOLING,
|
|
TH_ST_WARMING,
|
|
};
|
|
|
|
enum task_state {
|
|
TASK_ST_CREATED,
|
|
TASK_ST_RUNNING,
|
|
TASK_ST_PAUSED,
|
|
TASK_ST_DEAD,
|
|
};
|
|
|
|
enum ovni_state {
|
|
ST_OVNI_FLUSHING = 1,
|
|
};
|
|
|
|
enum error_values {
|
|
ST_BAD = 666,
|
|
ST_TOO_MANY_TH = 777,
|
|
};
|
|
|
|
enum nosv_ss_values {
|
|
ST_NULL = 0,
|
|
ST_NOSV_SCHED_HUNGRY = 6,
|
|
ST_NOSV_SCHED_SERVING,
|
|
ST_NOSV_SCHED_SUBMITTING,
|
|
ST_NOSV_MEM_ALLOCATING,
|
|
ST_NOSV_MEM_FREEING,
|
|
ST_NOSV_TASK_RUNNING,
|
|
ST_NOSV_API_SUBMIT,
|
|
ST_NOSV_API_PAUSE,
|
|
ST_NOSV_API_YIELD,
|
|
ST_NOSV_API_WAITFOR,
|
|
ST_NOSV_API_SCHEDPOINT,
|
|
ST_NOSV_ATTACH,
|
|
ST_NOSV_WORKER,
|
|
ST_NOSV_DELEGATE,
|
|
|
|
EV_NOSV_SCHED_RECV,
|
|
EV_NOSV_SCHED_SEND,
|
|
EV_NOSV_SCHED_SELF,
|
|
};
|
|
|
|
enum tampi_state {
|
|
ST_TAMPI_SEND = 1,
|
|
ST_TAMPI_RECV = 2,
|
|
ST_TAMPI_ISEND = 3,
|
|
ST_TAMPI_IRECV = 4,
|
|
ST_TAMPI_WAIT = 5,
|
|
ST_TAMPI_WAITALL = 6,
|
|
};
|
|
|
|
enum openmp_state {
|
|
ST_OPENMP_TASK = 1,
|
|
ST_OPENMP_PARALLEL = 2,
|
|
};
|
|
|
|
enum nodes_state {
|
|
ST_NODES_REGISTER = 1,
|
|
ST_NODES_UNREGISTER = 2,
|
|
ST_NODES_IF0_WAIT = 3,
|
|
ST_NODES_IF0_INLINE = 4,
|
|
ST_NODES_TASKWAIT = 5,
|
|
ST_NODES_CREATE = 6,
|
|
ST_NODES_SUBMIT = 7,
|
|
ST_NODES_SPAWN = 8,
|
|
};
|
|
|
|
/* The values of nanos6_ss_state are synced to the previous
|
|
* CTF implementation. */
|
|
enum nanos6_ss_state {
|
|
ST_NANOS6_TASK_BODY = 1,
|
|
ST_NANOS6_TASK_CREATING,
|
|
ST_NANOS6_TASK_SUBMIT,
|
|
ST_NANOS6_TASK_SPAWNING,
|
|
ST_NANOS6_TASK_FOR,
|
|
ST_NANOS6_SCHED_ADDING,
|
|
ST_NANOS6_SCHED_PROCESSING,
|
|
ST_NANOS6_SCHED_SERVING,
|
|
ST_NANOS6_DEP_REG,
|
|
ST_NANOS6_DEP_UNREG,
|
|
ST_NANOS6_BLK_TASKWAIT,
|
|
ST_NANOS6_BLK_WAITFOR,
|
|
ST_NANOS6_BLK_BLOCKING,
|
|
ST_NANOS6_BLK_UNBLOCKING,
|
|
ST_NANOS6_ALLOCATING,
|
|
ST_NANOS6_FREEING,
|
|
ST_NANOS6_HANDLING_TASK,
|
|
ST_NANOS6_WORKER_LOOP,
|
|
ST_NANOS6_SWITCH_TO,
|
|
ST_NANOS6_MIGRATE,
|
|
ST_NANOS6_SUSPEND,
|
|
ST_NANOS6_RESUME,
|
|
|
|
/* Value 51 is broken in old Paraver */
|
|
EV_NANOS6_SCHED_RECV = 60,
|
|
EV_NANOS6_SCHED_SEND,
|
|
EV_NANOS6_SCHED_SELF,
|
|
EV_NANOS6_CPU_IDLE,
|
|
EV_NANOS6_CPU_ACTIVE,
|
|
EV_NANOS6_SIGNAL,
|
|
};
|
|
|
|
enum nanos6_thread_type {
|
|
ST_NANOS6_TH_LEADER = 1,
|
|
ST_NANOS6_TH_MAIN = 2,
|
|
ST_NANOS6_TH_WORKER = 3,
|
|
ST_NANOS6_TH_EXTERNAL = 4,
|
|
};
|
|
|
|
enum kernel_cs_state {
|
|
ST_KERNEL_CSOUT = 3,
|
|
};
|
|
|
|
struct ovni_ethread;
|
|
struct ovni_eproc;
|
|
|
|
struct task_type {
|
|
uint32_t id; /* Per-process task identifier */
|
|
uint32_t gid; /* Global identifier computed from the label */
|
|
char label[MAX_PCF_LABEL];
|
|
UT_hash_handle hh;
|
|
};
|
|
|
|
struct task {
|
|
uint32_t id;
|
|
struct task_type *type;
|
|
|
|
/* The thread that has began to execute the task. It cannot
|
|
* change after being set, even if the task ends. */
|
|
struct ovni_ethread *thread;
|
|
enum task_state state;
|
|
UT_hash_handle hh;
|
|
|
|
/* List handle for nested task support */
|
|
struct task *next;
|
|
struct task *prev;
|
|
};
|
|
|
|
struct task_info {
|
|
/* Both hash maps of all known tasks and types */
|
|
struct task_type *types;
|
|
struct task *tasks;
|
|
};
|
|
|
|
struct task_stack {
|
|
union {
|
|
struct task *top; /* Synctactic sugar */
|
|
struct task *tasks;
|
|
};
|
|
struct ovni_ethread *thread;
|
|
};
|
|
|
|
#define MAX_CHAN_STACK 512
|
|
|
|
enum chan_track {
|
|
/* The channel is manually controlled. */
|
|
CHAN_TRACK_NONE = 0,
|
|
|
|
/* Enables the channel when the thread is running only. */
|
|
CHAN_TRACK_TH_RUNNING,
|
|
|
|
/* The thread active tracking mode a enables the channel when
|
|
* the thread is running, cooling or warming. Otherwise the
|
|
* channel is disabled. */
|
|
CHAN_TRACK_TH_ACTIVE,
|
|
};
|
|
|
|
enum chan {
|
|
CHAN_OVNI_PID,
|
|
CHAN_OVNI_TID,
|
|
CHAN_OVNI_NRTHREADS,
|
|
CHAN_OVNI_STATE,
|
|
CHAN_OVNI_APPID,
|
|
CHAN_OVNI_CPU,
|
|
CHAN_OVNI_FLUSH,
|
|
|
|
CHAN_NOSV_TASKID,
|
|
CHAN_NOSV_TYPE,
|
|
CHAN_NOSV_APPID,
|
|
CHAN_NOSV_SUBSYSTEM,
|
|
CHAN_NOSV_RANK,
|
|
|
|
CHAN_TAMPI_MODE,
|
|
CHAN_OPENMP_MODE,
|
|
CHAN_NODES_SUBSYSTEM,
|
|
|
|
CHAN_NANOS6_TASKID,
|
|
CHAN_NANOS6_TYPE,
|
|
CHAN_NANOS6_SUBSYSTEM,
|
|
CHAN_NANOS6_RANK,
|
|
CHAN_NANOS6_THREAD,
|
|
|
|
CHAN_KERNEL_CS,
|
|
|
|
CHAN_MAX
|
|
};
|
|
|
|
enum chan_type {
|
|
CHAN_TH = 0,
|
|
CHAN_CPU = 1,
|
|
CHAN_MAXTYPE = 2,
|
|
};
|
|
|
|
enum chan_dirty {
|
|
CHAN_CLEAN = 0,
|
|
|
|
/* The channel is dirty because it has been enabled or disabled */
|
|
CHAN_DIRTY_ACTIVE = 1,
|
|
|
|
/* The channel is dirty because it changed the state */
|
|
CHAN_DIRTY_VALUE = 2,
|
|
};
|
|
|
|
static const int chan_to_prvtype[CHAN_MAX] = {
|
|
[CHAN_OVNI_PID] = 1,
|
|
[CHAN_OVNI_TID] = 2,
|
|
[CHAN_OVNI_NRTHREADS] = 3,
|
|
[CHAN_OVNI_STATE] = 4,
|
|
[CHAN_OVNI_APPID] = 5, /* Not used */
|
|
[CHAN_OVNI_CPU] = 6,
|
|
[CHAN_OVNI_FLUSH] = 7,
|
|
[CHAN_NOSV_TASKID] = 10,
|
|
[CHAN_NOSV_TYPE] = 11,
|
|
[CHAN_NOSV_APPID] = 12,
|
|
[CHAN_NOSV_SUBSYSTEM] = 13,
|
|
[CHAN_NOSV_RANK] = 14,
|
|
[CHAN_TAMPI_MODE] = 20,
|
|
[CHAN_OPENMP_MODE] = 25,
|
|
[CHAN_NODES_SUBSYSTEM] = 30,
|
|
[CHAN_NANOS6_TASKID] = 35,
|
|
[CHAN_NANOS6_TYPE] = 36,
|
|
[CHAN_NANOS6_SUBSYSTEM] = 37,
|
|
[CHAN_NANOS6_RANK] = 38,
|
|
[CHAN_NANOS6_THREAD] = 39,
|
|
[CHAN_KERNEL_CS] = 45,
|
|
};
|
|
|
|
struct ovni_chan {
|
|
/* Channel id */
|
|
enum chan id;
|
|
|
|
/* Number of states in the stack */
|
|
int n;
|
|
|
|
/* Stack of states */
|
|
int stack[MAX_CHAN_STACK];
|
|
|
|
/* 1 if enabled, 0 if not. */
|
|
int enabled;
|
|
|
|
/* What state should be shown in errors */
|
|
int badst;
|
|
|
|
/* Last state emitted (-1 otherwise) */
|
|
int lastst;
|
|
|
|
/* Punctual event: -1 if not used */
|
|
int ev;
|
|
|
|
/* Emit events of this type */
|
|
int type;
|
|
|
|
/* A pointer to a clock to sample the time */
|
|
int64_t *clock;
|
|
|
|
/* The time of the last state or event */
|
|
int64_t t;
|
|
|
|
/* Paraver row */
|
|
int row;
|
|
|
|
/* Type of dirty */
|
|
enum chan_dirty dirty;
|
|
|
|
/* Where should the events be written to? */
|
|
FILE *prv;
|
|
|
|
/* What should cause the channel to become disabled? */
|
|
enum chan_track track;
|
|
|
|
/* The thread associated with the channel if any */
|
|
struct ovni_ethread *thread;
|
|
|
|
/* The CPU associated with the channel if any */
|
|
struct ovni_cpu *cpu;
|
|
|
|
struct ovni_chan **update_list;
|
|
|
|
/* Used when the channel is a list */
|
|
struct ovni_chan *prev;
|
|
struct ovni_chan *next;
|
|
};
|
|
|
|
#define MAX_BURSTS 100
|
|
|
|
/* State of each emulated thread */
|
|
struct ovni_ethread {
|
|
/* Emulated thread tid */
|
|
pid_t tid;
|
|
|
|
int index;
|
|
int gindex;
|
|
|
|
/* The process associated with this thread */
|
|
struct ovni_eproc *proc;
|
|
|
|
enum ethread_state state;
|
|
int is_running;
|
|
int is_active;
|
|
|
|
/* Thread stream */
|
|
struct ovni_stream *stream;
|
|
|
|
/* Current cpu */
|
|
struct ovni_cpu *cpu;
|
|
|
|
/* FIXME: Use a table with registrable pointers to custom data
|
|
* structures */
|
|
|
|
/* Task stacks, top ones are the tasks currently runnable. */
|
|
struct task_stack nosv_task_stack;
|
|
struct task_stack nanos6_task_stack;
|
|
|
|
/* Channels are used to output the emulator state in PRV */
|
|
struct ovni_chan chan[CHAN_MAX];
|
|
|
|
/* Burst times */
|
|
int nbursts;
|
|
int64_t burst_time[MAX_BURSTS];
|
|
|
|
/* These pointers keep a linked list of threads in each CPU */
|
|
struct ovni_ethread *prev;
|
|
struct ovni_ethread *next;
|
|
|
|
/* Trace file path */
|
|
char tracefile[PATH_MAX];
|
|
};
|
|
|
|
/* State of each emulated process */
|
|
struct ovni_eproc {
|
|
int pid;
|
|
int index;
|
|
int gindex;
|
|
int appid;
|
|
int rank;
|
|
|
|
/* The loom of the current process */
|
|
struct ovni_loom *loom;
|
|
|
|
/* Path of the process tracedir */
|
|
char dir[PATH_MAX];
|
|
|
|
/* Threads */
|
|
size_t nthreads;
|
|
struct ovni_ethread *thread;
|
|
|
|
JSON_Value *meta;
|
|
|
|
/* ------ Subsystem specific data --------*/
|
|
/* TODO: Use dynamic allocation */
|
|
|
|
struct task_info nosv_task_info;
|
|
struct task_info nanos6_task_info;
|
|
};
|
|
|
|
|
|
/* ------------------ emulation ---------------- */
|
|
|
|
enum ovni_cpu_type {
|
|
CPU_REAL,
|
|
CPU_VIRTUAL,
|
|
};
|
|
|
|
enum ovni_cpu_state {
|
|
CPU_ST_UNKNOWN,
|
|
CPU_ST_READY,
|
|
};
|
|
|
|
#define MAX_CPU_NAME 32
|
|
|
|
struct ovni_cpu {
|
|
/* Logical index: 0 to ncpus - 1 */
|
|
int i;
|
|
|
|
/* Physical id: as reported by lscpu(1) */
|
|
int phyid;
|
|
|
|
/* Global index for all CPUs */
|
|
int gindex;
|
|
|
|
enum ovni_cpu_state state;
|
|
|
|
/* The loom of the CPU */
|
|
struct ovni_loom *loom;
|
|
|
|
/* CPU channels */
|
|
struct ovni_chan chan[CHAN_MAX];
|
|
|
|
/* The threads assigned to this CPU */
|
|
size_t nthreads;
|
|
struct ovni_ethread *thread;
|
|
|
|
/* Running threads */
|
|
size_t nrunning_threads;
|
|
struct ovni_ethread *th_running;
|
|
|
|
/* Active threads (not paused or dead) */
|
|
size_t nactive_threads;
|
|
struct ovni_ethread *th_active;
|
|
|
|
/* Cpu name as shown in paraver row */
|
|
char name[MAX_CPU_NAME];
|
|
|
|
/* Is this a virtual CPU? */
|
|
int virtual;
|
|
};
|
|
|
|
/* ----------------------- trace ------------------------ */
|
|
|
|
/* State of each loom on post-process */
|
|
struct ovni_loom {
|
|
size_t nprocs;
|
|
char hostname[OVNI_MAX_HOSTNAME];
|
|
char dname[PATH_MAX]; /* Loom directory name */
|
|
char path[PATH_MAX]; /* Relative to cwd */
|
|
|
|
size_t max_ncpus;
|
|
size_t max_phyid;
|
|
size_t ncpus;
|
|
size_t offset_ncpus;
|
|
struct ovni_cpu *cpu;
|
|
int rank_enabled;
|
|
|
|
int64_t clock_offset;
|
|
|
|
/* Virtual CPU */
|
|
struct ovni_cpu vcpu;
|
|
|
|
struct ovni_eproc *proc;
|
|
};
|
|
|
|
#define MAX_VIRTUAL_EVENTS 16
|
|
|
|
struct ovni_trace {
|
|
size_t nlooms;
|
|
struct ovni_loom *loom;
|
|
|
|
size_t nstreams;
|
|
struct ovni_stream *stream;
|
|
};
|
|
|
|
struct ovni_stream {
|
|
uint8_t *buf;
|
|
size_t size;
|
|
size_t offset;
|
|
|
|
int tid;
|
|
struct ovni_loom *loom;
|
|
struct ovni_eproc *proc;
|
|
struct ovni_ethread *thread;
|
|
int loaded;
|
|
int active;
|
|
|
|
double progress;
|
|
|
|
struct ovni_ev *cur_ev;
|
|
int64_t lastclock;
|
|
int64_t clock_offset;
|
|
|
|
heap_node_t hh;
|
|
};
|
|
|
|
struct ovni_emu {
|
|
struct ovni_trace trace;
|
|
|
|
struct ovni_stream *cur_stream;
|
|
struct ovni_ev *cur_ev;
|
|
|
|
struct ovni_loom *cur_loom;
|
|
struct ovni_eproc *cur_proc;
|
|
struct ovni_ethread *cur_thread;
|
|
|
|
/* Indexed by gindex */
|
|
struct ovni_ethread **global_thread;
|
|
struct ovni_cpu **global_cpu;
|
|
|
|
/* Global processed size and offset of all streams */
|
|
size_t global_size;
|
|
size_t global_offset;
|
|
double start_emulation_time;
|
|
|
|
int64_t firstclock;
|
|
int64_t lastclock;
|
|
int64_t delta_time;
|
|
|
|
/* Counters for statistics */
|
|
int64_t nev_processed;
|
|
|
|
/* Be strict */
|
|
int enable_linter;
|
|
|
|
FILE *prv_thread;
|
|
FILE *prv_cpu;
|
|
|
|
struct pcf_file pcf[CHAN_MAXTYPE];
|
|
|
|
char *clock_offset_file;
|
|
char *tracedir;
|
|
|
|
/* Total counters */
|
|
size_t total_nthreads;
|
|
size_t total_nprocs;
|
|
size_t total_ncpus;
|
|
|
|
uint32_t nosv_type_counter;
|
|
|
|
/* Keep a list of dirty channels for the CPUs and threads */
|
|
struct ovni_chan *cpu_chan;
|
|
struct ovni_chan *th_chan;
|
|
|
|
heap_head_t sorted_stream;
|
|
};
|
|
|
|
/* Emulator function declaration */
|
|
|
|
void edie(struct ovni_emu *emu, const char* fmt, ...);
|
|
void eerr(struct ovni_emu *emu, const char* fmt, ...);
|
|
|
|
void hook_init_ovni(struct ovni_emu *emu);
|
|
void hook_pre_ovni(struct ovni_emu *emu);
|
|
|
|
void hook_init_nosv(struct ovni_emu *emu);
|
|
void hook_pre_nosv(struct ovni_emu *emu);
|
|
void hook_end_nosv(struct ovni_emu *emu);
|
|
|
|
void hook_init_tampi(struct ovni_emu *emu);
|
|
void hook_pre_tampi(struct ovni_emu *emu);
|
|
|
|
void hook_init_openmp(struct ovni_emu *emu);
|
|
void hook_pre_openmp(struct ovni_emu *emu);
|
|
|
|
void hook_init_nodes(struct ovni_emu *emu);
|
|
void hook_pre_nodes(struct ovni_emu *emu);
|
|
|
|
void hook_init_kernel(struct ovni_emu *emu);
|
|
void hook_pre_kernel(struct ovni_emu *emu);
|
|
|
|
void hook_init_nanos6(struct ovni_emu *emu);
|
|
void hook_pre_nanos6(struct ovni_emu *emu);
|
|
void hook_end_nanos6(struct ovni_emu *emu);
|
|
|
|
struct ovni_cpu *emu_get_cpu(struct ovni_loom *loom, int cpuid);
|
|
|
|
struct ovni_ethread *emu_get_thread(struct ovni_eproc *proc, int tid);
|
|
|
|
void emu_cpu_update_chan(struct ovni_cpu *cpu, struct ovni_chan *cpu_chan);
|
|
|
|
#endif /* OVNI_EMU_H */
|