2019-10-21 14:50:16 +02:00
{
2022-07-27 13:01:15 +02:00
"$schema" : "https://json-schema.org/draft/2020-12/schema" ,
2022-10-06 11:17:48 +02:00
"$id" : "job-meta.schema.json" ,
2019-10-21 14:50:16 +02:00
"title" : "Job meta data" ,
"description" : "Meta data information of an HPC job" ,
"type" : "object" ,
"properties" : {
2021-12-17 06:54:16 +01:00
"jobId" : {
2019-10-21 14:50:16 +02:00
"description" : "The unique identifier of a job" ,
2021-11-26 09:15:50 +01:00
"type" : "integer"
2019-10-21 14:50:16 +02:00
} ,
2021-12-02 10:45:01 +01:00
"user" : {
2019-10-21 14:50:16 +02:00
"description" : "The unique identifier of a user" ,
"type" : "string"
} ,
2021-12-02 10:45:01 +01:00
"project" : {
2019-10-21 14:50:16 +02:00
"description" : "The unique identifier of a project" ,
"type" : "string"
} ,
2021-12-02 10:45:01 +01:00
"cluster" : {
2019-10-21 14:50:16 +02:00
"description" : "The unique identifier of a cluster" ,
"type" : "string"
} ,
2022-03-10 16:03:26 +01:00
"subCluster" : {
"description" : "The unique identifier of a sub cluster" ,
"type" : "string"
} ,
2021-11-26 09:15:50 +01:00
"partition" : {
2022-03-10 11:47:10 +01:00
"description" : "The Slurm partition to which the job was submitted" ,
2022-03-10 16:03:26 +01:00
"type" : "string"
2021-11-26 09:15:50 +01:00
} ,
2021-12-17 06:54:16 +01:00
"arrayJobId" : {
2021-11-26 09:15:50 +01:00
"description" : "The unique identifier of an array job" ,
"type" : "integer"
} ,
2021-12-17 06:54:16 +01:00
"numNodes" : {
2019-10-21 14:50:16 +02:00
"description" : "Number of nodes used" ,
"type" : "integer" ,
"exclusiveMinimum" : 0
} ,
2021-12-17 06:54:16 +01:00
"numHwthreads" : {
2021-11-26 09:15:50 +01:00
"description" : "Number of HWThreads used" ,
"type" : "integer" ,
"exclusiveMinimum" : 0
} ,
2021-12-17 06:54:16 +01:00
"numAcc" : {
2021-11-29 10:26:00 +01:00
"description" : "Number of accelerators used" ,
2021-11-26 09:15:50 +01:00
"type" : "integer" ,
"exclusiveMinimum" : 0
} ,
2019-10-21 14:50:16 +02:00
"exclusive" : {
2022-07-17 09:40:22 +02:00
"description" : "Specifies how nodes are shared. 0 - Shared among multiple jobs of multiple users, 1 - Job exclusive, 2 - Shared among multiple jobs of same user" ,
"type" : "integer" ,
2022-09-14 06:35:18 +02:00
"minimum" : 0 ,
2022-07-17 09:40:22 +02:00
"maximum" : 2
2019-10-21 14:50:16 +02:00
} ,
2021-12-17 06:54:16 +01:00
"monitoringStatus" : {
2021-12-02 10:45:01 +01:00
"description" : "State of monitoring system during job run" ,
2021-12-16 08:10:36 +01:00
"type" : "integer"
2021-12-02 10:45:01 +01:00
} ,
2021-11-26 09:15:50 +01:00
"smt" : {
2021-12-02 10:45:01 +01:00
"description" : "SMT threads used by job" ,
"type" : "integer"
2021-11-26 09:15:50 +01:00
} ,
2019-10-21 14:50:16 +02:00
"walltime" : {
"description" : "Requested walltime of job in seconds" ,
"type" : "integer" ,
"exclusiveMinimum" : 0
} ,
2021-12-17 06:54:16 +01:00
"jobState" : {
2019-10-21 14:50:16 +02:00
"description" : "Final state of job" ,
"type" : "string" ,
"enum" : [
"completed" ,
"failed" ,
2022-03-10 11:47:10 +01:00
"cancelled" ,
2021-11-26 09:15:50 +01:00
"stopped" ,
2022-03-10 11:47:10 +01:00
"out_of_memory" ,
2019-10-21 14:50:16 +02:00
"timeout"
]
} ,
2021-12-17 06:54:16 +01:00
"startTime" : {
2019-10-21 14:50:16 +02:00
"description" : "Start epoch time stamp in seconds" ,
"type" : "integer" ,
"exclusiveMinimum" : 0
} ,
"duration" : {
"description" : "Duration of job in seconds" ,
"type" : "integer" ,
"exclusiveMinimum" : 0
} ,
2021-11-26 09:15:50 +01:00
"resources" : {
"description" : "Resources used by job" ,
2019-10-21 14:50:16 +02:00
"type" : "array" ,
"items" : {
2021-11-26 09:15:50 +01:00
"type" : "object" ,
"properties" : {
"hostname" : {
"type" : "string"
} ,
2021-11-29 10:26:00 +01:00
"hwthreads" : {
2021-11-26 09:15:50 +01:00
"type" : "array" ,
"description" : "List of OS processor ids" ,
"items" : {
"type" : "integer"
}
} ,
2021-11-29 10:26:00 +01:00
"accelerators" : {
2021-11-26 09:15:50 +01:00
"type" : "array" ,
2022-05-03 15:58:30 +02:00
"description" : "List of accelerator device ids" ,
2021-11-26 09:15:50 +01:00
"items" : {
2022-05-03 15:58:30 +02:00
"type" : "string"
2021-11-26 09:15:50 +01:00
}
} ,
2021-12-02 10:45:01 +01:00
"configuration" : {
"type" : "string" ,
"description" : "The configuration options of the node"
2022-07-27 13:01:15 +02:00
}
2021-11-26 09:15:50 +01:00
} ,
2022-07-27 13:01:15 +02:00
"required" : [
"hostname"
] ,
2021-12-02 10:45:01 +01:00
"minItems" : 1
}
} ,
2021-12-17 06:54:16 +01:00
"metaData" : {
2021-12-02 10:45:01 +01:00
"description" : "Additional information about the job" ,
"type" : "object" ,
"properties" : {
2021-12-17 06:54:16 +01:00
"jobScript" : {
2021-12-02 10:45:01 +01:00
"type" : "string" ,
"description" : "The batch script of the job"
} ,
2022-03-16 07:46:23 +01:00
"jobName" : {
2021-12-02 10:45:01 +01:00
"type" : "string" ,
2022-03-16 07:46:23 +01:00
"description" : "Slurm Job name"
} ,
"slurmInfo" : {
"type" : "string" ,
"description" : "Additional Slurm information as shown by scontrol show job"
2021-12-02 10:45:01 +01:00
}
}
2019-10-21 14:50:16 +02:00
} ,
"tags" : {
"description" : "List of tags" ,
"type" : "array" ,
"items" : {
"type" : "object" ,
"properties" : {
"name" : {
"type" : "string"
} ,
"type" : {
"type" : "string"
}
} ,
"required" : [
"name" ,
"type"
]
} ,
"uniqueItems" : true
} ,
"statistics" : {
"description" : "Job statistic data" ,
"type" : "object" ,
"properties" : {
"mem_used" : {
"description" : "Memory capacity used (required)" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
2021-12-02 10:45:01 +01:00
"cpu_load" : {
"description" : "CPU requested core utilization (load 1m) (required)" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2021-12-02 10:45:01 +01:00
} ,
2019-10-21 14:50:16 +02:00
"flops_any" : {
"description" : "Total flop rate with DP flops scaled up (required)" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
"mem_bw" : {
"description" : "Main memory bandwidth (required)" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
"net_bw" : {
"description" : "Total fast interconnect network bandwidth" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
"file_bw" : {
"description" : "Total file IO bandwidth" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
"ipc" : {
"description" : "Instructions executed per cycle" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
2023-06-27 15:08:03 +02:00
"cpu_user" : {
"description" : "CPU user active core utilization (required)" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
"flops_dp" : {
"description" : "Double precision flop rate" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
"flops_sp" : {
"description" : "Single precision flops rate" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
"rapl_power" : {
"description" : "CPU power consumption" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
2022-09-21 15:24:48 +02:00
"acc_used" : {
2019-10-21 14:50:16 +02:00
"description" : "GPU utilization" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
2022-09-21 15:24:48 +02:00
"acc_mem_used" : {
2019-10-21 14:50:16 +02:00
"description" : "GPU memory capacity used" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
2022-09-21 15:24:48 +02:00
"acc_power" : {
2019-10-21 14:50:16 +02:00
"description" : "GPU power consumption" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
"clock" : {
"description" : "Average core frequency" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
"eth_read_bw" : {
"description" : "Ethernet read bandwidth" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
"eth_write_bw" : {
"description" : "Ethernet write bandwidth" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
2021-12-02 10:45:01 +01:00
"ic_rcv_packets" : {
"description" : "Network interconnect read packets" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
2021-12-02 10:45:01 +01:00
"ic_send_packets" : {
"description" : "Network interconnect send packets" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
2021-12-02 10:45:01 +01:00
"ic_read_bw" : {
"description" : "Network interconnect read bandwidth" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2019-10-21 14:50:16 +02:00
} ,
2021-12-02 10:45:01 +01:00
"ic_write_bw" : {
"description" : "Network interconnect write bandwidth" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"filesystems" : {
"description" : "Array of filesystems" ,
"type" : "array" ,
"items" : {
"type" : "object" ,
"properties" : {
"name" : {
"type" : "string"
} ,
"type" : {
"type" : "string" ,
"enum" : [
"nfs" ,
"lustre" ,
"gpfs" ,
"nvme" ,
"ssd" ,
"hdd" ,
"beegfs"
]
} ,
"read_bw" : {
"description" : "File system read bandwidth" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"write_bw" : {
"description" : "File system write bandwidth" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"read_req" : {
"description" : "File system read requests" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"write_req" : {
"description" : "File system write requests" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"inodes" : {
"description" : "File system inodes" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"accesses" : {
"description" : "File system open and close" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"fsync" : {
"description" : "File system fsync" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"create" : {
"description" : "File system create" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"open" : {
"description" : "File system open" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"close" : {
"description" : "File system close" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
} ,
"seek" : {
"description" : "File system seek" ,
2022-10-06 11:17:48 +02:00
"$ref" : "job-metric-statistics.schema.json"
2022-08-25 17:33:18 +02:00
}
} ,
"required" : [
"name" ,
"type" ,
"read_bw" ,
2022-09-14 06:35:18 +02:00
"write_bw"
2022-08-25 17:33:18 +02:00
]
} ,
"minItems" : 1
2019-10-21 14:50:16 +02:00
}
} ,
"required" : [
2023-06-27 15:08:03 +02:00
"cpu_user" ,
"cpu_load" ,
2019-10-21 14:50:16 +02:00
"mem_used" ,
"flops_any" ,
2022-08-25 17:33:18 +02:00
"mem_bw"
2019-10-21 14:50:16 +02:00
]
}
} ,
"required" : [
2021-12-17 06:54:16 +01:00
"jobId" ,
"user" ,
"project" ,
"cluster" ,
2023-06-27 15:08:03 +02:00
"subCluster" ,
2021-12-17 06:54:16 +01:00
"numNodes" ,
2022-01-14 20:33:18 +01:00
"exclusive" ,
2021-12-17 06:54:16 +01:00
"startTime" ,
2022-01-14 20:33:18 +01:00
"jobState" ,
2019-10-21 14:50:16 +02:00
"duration" ,
2021-11-26 09:15:50 +01:00
"resources" ,
2019-10-21 14:50:16 +02:00
"statistics"
]
}