diff --git a/_data/sidebars/merlin6_sidebar.yml b/_data/sidebars/merlin6_sidebar.yml index 0b72f98..ac975d0 100644 --- a/_data/sidebars/merlin6_sidebar.yml +++ b/_data/sidebars/merlin6_sidebar.yml @@ -43,6 +43,8 @@ entries: url: /merlin6/slurm-examples.html - title: Slurm Configuration url: /merlin6/slurm-configuration.html + - title: Monitoring + url: /merlin6/monitoring.html - title: Jupyterhub folderitems: - title: Jupyterhub service diff --git a/docker-compose.yml b/docker-compose.yml index f372ae6..f5bf6f9 100644 --- a/docker-compose.yml +++ b/docker-compose.yml @@ -6,6 +6,6 @@ services: dockerfile: Dockerfile image: result/latest ports: - - "4000:4000" + - "4001:4001" volumes: - - ".:/src" \ No newline at end of file + - ".:/src" diff --git a/pages/merlin6/03 merlin6-slurm/monitoring.md b/pages/merlin6/03 merlin6-slurm/monitoring.md new file mode 100644 index 0000000..f7ff08f --- /dev/null +++ b/pages/merlin6/03 merlin6-slurm/monitoring.md @@ -0,0 +1,35 @@ +--- +title: Monitoring +#tags: +#keywords: +last_updated: 20 June 2019 +#summary: "" +sidebar: merlin6_sidebar +permalink: /merlin6/monitoring.html +--- + +## Monitoring + +The following pages contain basic monitoring for Slurm and computing nodes. +Currently, monitoring is based on Grafana + InfluxDB. In the future it will +be moved to a different service based on Elasticsearch + Logstash + Kibana.
+ +In the meantime, the following monitoring pages are available on a best-effort +basis: + +### Merlin6 Monitoring Pages + +* Slurm monitoring: + * [Merlin6 Slurm Live Status](https://hpc-monitor01.psi.ch/d/vpwNKUhZz/merlin6-slurm-live-status?refresh=10s&orgId=1) + * [Merlin6 Slurm Overview](https://hpc-monitor01.psi.ch/d/QzBI6QoZz/merlin5-slurm-overview?refresh=10s&orgId=1) <!-- TODO(review): this URL is identical to the Merlin5 Slurm Overview link below; confirm the Merlin6 dashboard URL --> +* Node monitoring: + * [Merlin6 CPU Nodes Overview](https://hpc-monitor01.psi.ch/d/JmvLR8gZz/merlin6-computing-cpu-nodes?refresh=10s&orgId=1) + * [Merlin6 GPU Nodes Overview](https://hpc-monitor01.psi.ch/d/98l409-mk/merlin6-computing-gpu-nodes?refresh=5s&orgId=1) + +### Merlin5 Monitoring Pages + +* Slurm monitoring: + * [Merlin5 Slurm Live Status](https://hpc-monitor01.psi.ch/d/UbKbewTWz/merlin5-slurm-live-status?refresh=10s&orgId=1) + * [Merlin5 Slurm Overview](https://hpc-monitor01.psi.ch/d/QzBI6QoZz/merlin5-slurm-overview?refresh=10s&orgId=1) +* Node monitoring: + * [Merlin5 CPU Nodes Overview](https://hpc-monitor01.psi.ch/d/a-TsfGpZk/merlin5-computing-cpu-nodes?refresh=10s&orgId=1)