2023-01-25 12:01:01 +01:00
|
|
|
/* Copyright (c) 2021-2023 Barcelona Supercomputing Center (BSC)
|
|
|
|
* SPDX-License-Identifier: GPL-3.0-or-later */
|
|
|
|
|
|
|
|
#include "cpu.h"
|
|
|
|
|
|
|
|
#include "chan.h"
|
|
|
|
#include "value.h"
|
|
|
|
#include "utlist.h"
|
2023-02-02 16:31:43 +01:00
|
|
|
#include "pv/pvt.h"
|
2023-01-25 12:01:01 +01:00
|
|
|
|
2023-01-27 18:51:18 +01:00
|
|
|
static const char chan_fmt[] = "cpu%ld.%s";
|
|
|
|
static const char *chan_name[] = {
|
|
|
|
[CPU_CHAN_NRUN] = "nrunning",
|
|
|
|
[CPU_CHAN_PID] = "pid_running",
|
|
|
|
[CPU_CHAN_TID] = "tid_running",
|
|
|
|
[CPU_CHAN_APPID] = "appid_running",
|
2023-01-31 18:23:41 +01:00
|
|
|
[CPU_CHAN_THRUN] = "th_running",
|
|
|
|
[CPU_CHAN_THACT] = "th_active",
|
2023-01-27 18:51:18 +01:00
|
|
|
};
|
|
|
|
|
2023-01-30 22:43:57 +01:00
|
|
|
static int chan_type[] = {
|
|
|
|
[CPU_CHAN_PID] = 1,
|
|
|
|
[CPU_CHAN_TID] = 2,
|
|
|
|
[CPU_CHAN_NRUN] = 3,
|
|
|
|
[CPU_CHAN_APPID] = 5,
|
2023-01-31 18:23:41 +01:00
|
|
|
[CPU_CHAN_THRUN] = -1,
|
|
|
|
[CPU_CHAN_THACT] = -1,
|
2023-01-30 22:43:57 +01:00
|
|
|
};
|
|
|
|
|
2023-01-25 12:01:01 +01:00
|
|
|
void
|
2023-02-07 13:34:18 +01:00
|
|
|
cpu_init_begin(struct cpu *cpu, int phyid, int is_virtual)
|
2023-01-25 12:01:01 +01:00
|
|
|
{
|
|
|
|
memset(cpu, 0, sizeof(struct cpu));
|
|
|
|
|
|
|
|
cpu->phyid = phyid;
|
2023-02-07 13:34:18 +01:00
|
|
|
cpu->is_virtual = is_virtual;
|
2023-01-27 18:51:18 +01:00
|
|
|
|
2023-02-01 11:38:39 +01:00
|
|
|
dbg("cpu init %d", phyid);
|
2023-01-25 18:11:13 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
int
|
|
|
|
cpu_get_phyid(struct cpu *cpu)
|
|
|
|
{
|
|
|
|
return cpu->phyid;
|
2023-01-25 12:01:01 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
cpu_set_gindex(struct cpu *cpu, int64_t gindex)
|
|
|
|
{
|
|
|
|
cpu->gindex = gindex;
|
|
|
|
}
|
|
|
|
|
2023-02-17 10:08:40 +01:00
|
|
|
void
|
|
|
|
cpu_set_loom(struct cpu *cpu, struct loom *loom)
|
|
|
|
{
|
|
|
|
cpu->loom = loom;
|
|
|
|
}
|
|
|
|
|
2023-01-25 12:01:01 +01:00
|
|
|
void
|
2023-01-25 18:11:13 +01:00
|
|
|
cpu_set_name(struct cpu *cpu, const char *name)
|
2023-01-25 12:01:01 +01:00
|
|
|
{
|
2023-01-25 18:11:13 +01:00
|
|
|
if (snprintf(cpu->name, PATH_MAX, "%s", name) >= PATH_MAX)
|
|
|
|
die("cpu name too long");
|
2023-01-25 12:01:01 +01:00
|
|
|
}
|
|
|
|
|
2023-01-27 18:51:18 +01:00
|
|
|
int
|
|
|
|
cpu_init_end(struct cpu *cpu)
|
|
|
|
{
|
|
|
|
if (strlen(cpu->name) == 0) {
|
|
|
|
err("cpu name not set");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (cpu->gindex < 0) {
|
|
|
|
err("cpu gindex not set");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (int i = 0; i < CPU_CHAN_MAX; i++) {
|
2023-01-31 18:23:41 +01:00
|
|
|
if (chan_name[i] == NULL)
|
|
|
|
die("chan_name is null");
|
|
|
|
|
2023-01-27 18:51:18 +01:00
|
|
|
chan_init(&cpu->chan[i], CHAN_SINGLE,
|
|
|
|
chan_fmt, cpu->gindex, chan_name[i]);
|
|
|
|
}
|
|
|
|
|
|
|
|
chan_prop_set(&cpu->chan[CPU_CHAN_NRUN], CHAN_DUPLICATES, 1);
|
2023-01-31 18:23:41 +01:00
|
|
|
chan_prop_set(&cpu->chan[CPU_CHAN_TID], CHAN_DUPLICATES, 1);
|
|
|
|
chan_prop_set(&cpu->chan[CPU_CHAN_PID], CHAN_DUPLICATES, 1);
|
|
|
|
chan_prop_set(&cpu->chan[CPU_CHAN_THRUN], CHAN_DUPLICATES, 1);
|
|
|
|
chan_prop_set(&cpu->chan[CPU_CHAN_THACT], CHAN_DUPLICATES, 1);
|
2023-01-27 18:51:18 +01:00
|
|
|
|
|
|
|
cpu->is_init = 1;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
2023-01-30 22:43:57 +01:00
|
|
|
cpu_connect(struct cpu *cpu, struct bay *bay, struct recorder *rec)
|
2023-01-27 18:51:18 +01:00
|
|
|
{
|
|
|
|
if (!cpu->is_init) {
|
|
|
|
err("cpu not initialized");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2023-01-30 22:43:57 +01:00
|
|
|
/* Get cpu prv */
|
|
|
|
struct pvt *pvt = recorder_find_pvt(rec, "cpu");
|
|
|
|
if (pvt == NULL) {
|
|
|
|
err("cannot find cpu pvt");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
struct prv *prv = pvt_get_prv(pvt);
|
|
|
|
|
2023-01-27 18:51:18 +01:00
|
|
|
for (int i = 0; i < CPU_CHAN_MAX; i++) {
|
2023-01-30 22:43:57 +01:00
|
|
|
struct chan *c = &cpu->chan[i];
|
|
|
|
if (bay_register(bay, c) != 0) {
|
2023-01-27 18:51:18 +01:00
|
|
|
err("bay_register failed");
|
|
|
|
return -1;
|
|
|
|
}
|
2023-01-30 22:43:57 +01:00
|
|
|
|
|
|
|
long type = chan_type[i];
|
2023-01-31 18:23:41 +01:00
|
|
|
if (type < 0)
|
|
|
|
continue;
|
|
|
|
|
2023-01-30 22:43:57 +01:00
|
|
|
long row = cpu->gindex;
|
2023-01-31 18:23:41 +01:00
|
|
|
if (prv_register(prv, row, type, bay, c, PRV_DUP)) {
|
2023-01-30 22:43:57 +01:00
|
|
|
err("prv_register failed");
|
|
|
|
return -1;
|
|
|
|
}
|
2023-01-27 18:51:18 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2023-01-25 12:01:01 +01:00
|
|
|
static struct thread *
|
|
|
|
find_thread(struct cpu *cpu, struct thread *thread)
|
|
|
|
{
|
|
|
|
struct thread *p = NULL;
|
|
|
|
|
2023-01-27 18:51:18 +01:00
|
|
|
/* TODO use hash table */
|
|
|
|
DL_FOREACH2(cpu->threads, p, cpu_next)
|
2023-01-25 12:01:01 +01:00
|
|
|
{
|
|
|
|
if (p == thread)
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2023-01-27 18:51:18 +01:00
|
|
|
int
|
|
|
|
cpu_update(struct cpu *cpu)
|
2023-01-25 12:01:01 +01:00
|
|
|
{
|
|
|
|
struct thread *th = NULL;
|
|
|
|
struct thread *th_running = NULL;
|
|
|
|
struct thread *th_active = NULL;
|
|
|
|
int active = 0, running = 0;
|
|
|
|
|
2023-01-27 18:51:18 +01:00
|
|
|
DL_FOREACH2(cpu->threads, th, cpu_next)
|
2023-01-25 12:01:01 +01:00
|
|
|
{
|
|
|
|
if (th->state == TH_ST_RUNNING) {
|
|
|
|
th_running = th;
|
|
|
|
running++;
|
|
|
|
th_active = th;
|
|
|
|
active++;
|
|
|
|
} else if (th->state == TH_ST_COOLING || th->state == TH_ST_WARMING) {
|
|
|
|
th_active = th;
|
|
|
|
active++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
cpu->nth_running = running;
|
|
|
|
cpu->nth_active = active;
|
2023-01-27 18:51:18 +01:00
|
|
|
|
2023-02-07 13:34:18 +01:00
|
|
|
/* Only virtual cpus can be oversubscribed */
|
|
|
|
if (cpu->nth_running > 1 && !cpu->is_virtual) {
|
2023-02-07 16:17:25 +01:00
|
|
|
err("physical cpu %s has %d threads running at the same time",
|
2023-02-07 13:34:18 +01:00
|
|
|
cpu->name, cpu->nth_running);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2023-01-30 22:43:57 +01:00
|
|
|
struct value tid_running;
|
|
|
|
struct value pid_running;
|
2023-01-31 18:23:41 +01:00
|
|
|
struct value gid_running;
|
2023-01-30 22:43:57 +01:00
|
|
|
if (running == 1) {
|
2023-01-27 18:51:18 +01:00
|
|
|
cpu->th_running = th_running;
|
2023-01-30 22:43:57 +01:00
|
|
|
tid_running = value_int64(th_running->tid);
|
|
|
|
pid_running = value_int64(th_running->proc->pid);
|
2023-01-31 18:23:41 +01:00
|
|
|
gid_running = value_int64(th_running->gindex);
|
2023-01-30 22:43:57 +01:00
|
|
|
} else {
|
2023-01-27 18:51:18 +01:00
|
|
|
cpu->th_running = NULL;
|
2023-01-30 22:43:57 +01:00
|
|
|
tid_running = value_null();
|
|
|
|
pid_running = value_null();
|
2023-01-31 18:23:41 +01:00
|
|
|
gid_running = value_null();
|
2023-01-30 22:43:57 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
if (chan_set(&cpu->chan[CPU_CHAN_TID], tid_running) != 0) {
|
|
|
|
err("chan_set tid failed");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
if (chan_set(&cpu->chan[CPU_CHAN_PID], pid_running) != 0) {
|
|
|
|
err("chan_set pid failed");
|
|
|
|
return -1;
|
|
|
|
}
|
2023-01-31 18:23:41 +01:00
|
|
|
if (chan_set(&cpu->chan[CPU_CHAN_THRUN], gid_running) != 0) {
|
|
|
|
err("chan_set gid_running failed");
|
|
|
|
return -1;
|
|
|
|
}
|
2023-01-27 18:51:18 +01:00
|
|
|
|
2023-01-31 18:23:41 +01:00
|
|
|
struct value gid_active;
|
|
|
|
if (active == 1) {
|
2023-01-27 18:51:18 +01:00
|
|
|
cpu->th_active = th_active;
|
2023-01-31 18:23:41 +01:00
|
|
|
gid_active = value_int64(th_active->gindex);
|
|
|
|
} else {
|
2023-01-27 18:51:18 +01:00
|
|
|
cpu->th_active = NULL;
|
2023-01-31 18:23:41 +01:00
|
|
|
gid_active = value_null();
|
|
|
|
}
|
2023-01-25 12:01:01 +01:00
|
|
|
|
|
|
|
/* Update nth_running number in the channel */
|
2023-01-30 22:43:57 +01:00
|
|
|
if (chan_set(&cpu->chan[CPU_CHAN_NRUN], value_int64(running)) != 0) {
|
2023-01-27 18:51:18 +01:00
|
|
|
err("chan_set nth_running failed");
|
2023-01-25 12:01:01 +01:00
|
|
|
return -1;
|
|
|
|
}
|
2023-01-31 18:23:41 +01:00
|
|
|
if (chan_set(&cpu->chan[CPU_CHAN_THACT], gid_active) != 0) {
|
|
|
|
err("chan_set gid_active failed");
|
|
|
|
return -1;
|
|
|
|
}
|
2023-01-25 12:01:01 +01:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Add the given thread to the list of threads assigned to the CPU */
|
|
|
|
int
|
|
|
|
cpu_add_thread(struct cpu *cpu, struct thread *thread)
|
|
|
|
{
|
|
|
|
if (find_thread(cpu, thread) != NULL) {
|
2023-01-27 18:51:18 +01:00
|
|
|
err("thread %d already assigned to %s",
|
2023-01-25 12:01:01 +01:00
|
|
|
thread->tid, cpu->name);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2023-01-27 18:51:18 +01:00
|
|
|
DL_APPEND2(cpu->threads, thread, cpu_prev, cpu_next);
|
2023-01-25 12:01:01 +01:00
|
|
|
cpu->nthreads++;
|
|
|
|
|
2023-01-27 18:51:18 +01:00
|
|
|
if (cpu_update(cpu) != 0) {
|
|
|
|
err("cpu_update failed");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
|
|
|
cpu_remove_thread(struct cpu *cpu, struct thread *thread)
|
|
|
|
{
|
|
|
|
struct thread *t = find_thread(cpu, thread);
|
|
|
|
|
|
|
|
/* Not found, abort */
|
|
|
|
if (t == NULL) {
|
|
|
|
err("cannot remove missing thread %d from cpu %s\n",
|
|
|
|
thread->tid, cpu->name);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
DL_DELETE2(cpu->threads, thread, cpu_prev, cpu_next);
|
|
|
|
cpu->nthreads--;
|
|
|
|
|
|
|
|
if (cpu_update(cpu) != 0) {
|
|
|
|
err("cpu_update failed");
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
int
|
|
|
|
cpu_migrate_thread(struct cpu *cpu, struct thread *thread, struct cpu *newcpu)
|
|
|
|
{
|
|
|
|
if (cpu_remove_thread(cpu, thread) != 0) {
|
|
|
|
err("cannot remove thread %d from %s",
|
|
|
|
thread->tid, cpu->name);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (cpu_add_thread(newcpu, thread) != 0) {
|
|
|
|
err("cannot add thread %d to %s",
|
|
|
|
thread->tid, cpu->name);
|
|
|
|
return -1;
|
|
|
|
}
|
|
|
|
|
2023-01-25 12:01:01 +01:00
|
|
|
return 0;
|
|
|
|
}
|
2023-02-13 18:36:54 +01:00
|
|
|
|
|
|
|
struct chan *
|
|
|
|
cpu_get_th_chan(struct cpu *cpu, enum track_th trackmode)
|
|
|
|
{
|
|
|
|
if (trackmode != TRACK_TH_RUN)
|
|
|
|
die("cpu tracking must be running");
|
|
|
|
|
|
|
|
return &cpu->chan[CPU_CHAN_THRUN];
|
|
|
|
}
|