diff --git a/data/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-1.json b/data/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-1.json new file mode 100644 index 0000000000000000000000000000000000000000..c0a19fab3bf23209f5c4dcd7bd1a36ae9d3cc6fa --- /dev/null +++ b/data/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-1.json @@ -0,0 +1,289 @@ +{ + "architecture": { + "cpu_core_numbering": "round-robin", + "nb_cores": 20, + "nb_procs": 2, + "nb_threads": 40, + "platform_type": "x86_64" + }, + "bios": { + "release_date": "01/07/2025", + "vendor": "Dell Inc.", + "version": "2.23.0" + }, + "bmc_version": "3.15.17.15", + "chassis": { + "manufactured_at": "2018-03-13", + "manufacturer": "Dell Inc.", + "name": "PowerEdge R740", + "serial": "GFHZMN2", + "warranty_end": "2023-03-13" + }, + "exotic": false, + "gpu_devices": { + "nvidia0": { + "compute_capability": "6.1", + "cores": 3840, + "cpu_affinity": 0, + "device": "/dev/nvidia0", + "memory": 12884901888, + "microarchitecture": "Pascal", + "model": "TITAN Xp", + "performance": { + "fp-16": 177600000000, + "fp-32": 12149700000000, + "fp-64": 355200000000 + }, + "power_default_limit": "250.00 W", + "vbios_version": "86.02.3D.00.01", + "vendor": "Nvidia" + }, + "nvidia1": { + "compute_capability": "6.1", + "cores": 3840, + "cpu_affinity": 1, + "device": "/dev/nvidia1", + "memory": 12884901888, + "microarchitecture": "Pascal", + "model": "TITAN Xp", + "performance": { + "fp-16": 177600000000, + "fp-32": 12149700000000, + "fp-64": 355200000000 + }, + "power_default_limit": "250.00 W", + "vbios_version": "86.02.3D.00.01", + "vendor": "Nvidia" + } + }, + "main_memory": { + "ram_size": 103079215104 + }, + "management_tools": { + "bmc_vendor_tool": "racadm", + "ipmitool": { + "retries": 5 + } + }, + "memory_devices": [ + { + "device": "dimm_a1", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_a2", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_a3", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_a4", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_a5", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_a6", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b1", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b2", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b3", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b4", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b5", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b6", + "size": 8589934592, + "technology": "dram" + } + ], + "network_adapters": [ + { + "device": "eth0", + "driver": "bnxt_en", + "enabled": true, + "firmware_version": "214.0.166.0/pkg 21.40.16.60", + "interface": "Ethernet", + "ip": "172.16.27.5", + "ip6": "2001:660:4406:100:c::5", + "kavlan": false, + "mac": "00:0a:f7:bf:4d:bc", + "management": false, + "model": "BCM57412 NetXtreme-E 10Gb RDMA Ethernet Controller", + "mountable": true, + "mounted": true, + "name": "enp1s0f0np0", + "network_address": "vercors3-1.grenoble.grid5000.fr", + "rate": 10000000000, + "sriov": false, + "sriov_totalvfs": 0, + "switch": "imag-1b-F2-prod-01", + "switch_port": "1/1/7", + "vendor": "Broadcom Inc. and subsidiaries" + }, + { + "device": "eth1", + "driver": "bnxt_en", + "enabled": false, + "firmware_version": "214.0.166.0/pkg 21.40.16.60", + "interface": "Ethernet", + "kavlan": false, + "mac": "00:0a:f7:bf:4d:bd", + "management": false, + "model": "BCM57412 NetXtreme-E 10Gb RDMA Ethernet Controller", + "mountable": false, + "mounted": false, + "name": "eno2np1", + "sriov": false, + "sriov_totalvfs": 0, + "vendor": "Broadcom Inc. and subsidiaries" + }, + { + "device": "eth2", + "driver": "tg3", + "enabled": false, + "firmware_version": "FFV20.6.52 bc 5720-v1.39", + "interface": "Ethernet", + "kavlan": false, + "mac": "00:0a:f7:bf:4d:ba", + "management": false, + "model": "NetXtreme BCM5720 2-port Gigabit Ethernet PCIe", + "mountable": false, + "mounted": false, + "name": "eno3", + "sriov": false, + "sriov_totalvfs": 0, + "vendor": "Broadcom Inc. and subsidiaries" + }, + { + "device": "eth3", + "driver": "tg3", + "enabled": false, + "firmware_version": "FFV20.6.52 bc 5720-v1.39", + "interface": "Ethernet", + "kavlan": false, + "mac": "00:0a:f7:bf:4d:bb", + "management": false, + "model": "NetXtreme BCM5720 2-port Gigabit Ethernet PCIe", + "mountable": false, + "mounted": false, + "name": "eno4", + "sriov": false, + "sriov_totalvfs": 0, + "vendor": "Broadcom Inc. and subsidiaries" + }, + { + "device": "bmc", + "enabled": true, + "interface": "Ethernet", + "ip": "172.17.27.5", + "kavlan": false, + "mac": "58:8a:5a:ee:70:2c", + "management": true, + "mountable": false, + "mounted": false, + "network_address": "vercors3-1-bmc.grenoble.grid5000.fr" + } + ], + "nodeset": "vercors3", + "operating_system": { + "cstate_driver": "intel_idle", + "cstate_governor": "menu", + "ht_enabled": true, + "pstate_driver": "intel_pstate", + "pstate_governor": "performance", + "turboboost_enabled": true + }, + "performance": { + "core_flops": 35200000000, + "node_flops": 704000000000 + }, + "processor": { + "cache_l1": null, + "cache_l1d": 32768, + "cache_l1i": 32768, + "cache_l2": 1048576, + "cache_l3": 14417920, + "clock_speed": 2200000000, + "ht_capable": true, + "instruction_set": "x86-64", + "microarchitecture": "Skylake-SP", + "microcode": "0x2007006", + "model": "Intel Xeon", + "other_description": "Intel(R) Xeon(R) Silver 4114 CPU @ 2.20GHz", + "vendor": "Intel", + "version": "Silver 4114" + }, + "redfish": true, + "software": { + "forced-deployment-timestamp": 202007300948, + "postinstall-version": "1.2025040409", + "standard-environment": "debian11-x64-std" + }, + "storage_devices": [ + { + "by_id": "/dev/disk/by-id/wwn-0x6d09466045928a00226a1f510f4dd264", + "by_path": "/dev/disk/by-path/pci-0000:18:00.0-scsi-0:2:0:0", + "firmware_version": 4.27, + "id": "disk0", + "interface": "SAS", + "model": "PERC H730P Adp", + "size": 999653638144, + "storage": "HDD", + "vendor": "Dell" + }, + { + "by_id": "/dev/disk/by-id/wwn-0x6d09466045928a00226a1f5c0ff46d69", + "by_path": "/dev/disk/by-path/pci-0000:18:00.0-scsi-0:2:1:0", + "firmware_version": 4.27, + "id": "disk1", + "interface": "SAS", + "model": "PERC H730P Adp", + "size": 4000225165312, + "storage": "HDD", + "vendor": "Dell" + } + ], + "supported_job_types": { + "besteffort": true, + "deploy": true, + "max_walltime": 0, + "queues": [ + "admin", + "testing" + ], + "virtual": false + }, + "type": "node", + "uid": "vercors3-1" +} \ No newline at end of file diff --git a/data/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-2.json b/data/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-2.json new file mode 100644 index 0000000000000000000000000000000000000000..5d5cd31456f9fae568b2a18de2bcaee8a2387b7a --- /dev/null +++ b/data/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-2.json @@ -0,0 +1,289 @@ +{ + "architecture": { + "cpu_core_numbering": "round-robin", + "nb_cores": 20, + "nb_procs": 2, + "nb_threads": 40, + "platform_type": "x86_64" + }, + "bios": { + "release_date": "01/07/2025", + "vendor": "Dell Inc.", + "version": "2.23.0" + }, + "bmc_version": "3.15.17.15", + "chassis": { + "manufactured_at": "2018-03-13", + "manufacturer": "Dell Inc.", + "name": "PowerEdge R740", + "serial": "GFJ4NN2", + "warranty_end": "2023-03-13" + }, + "exotic": false, + "gpu_devices": { + "nvidia0": { + "compute_capability": "6.1", + "cores": 3840, + "cpu_affinity": 0, + "device": "/dev/nvidia0", + "memory": 12884901888, + "microarchitecture": "Pascal", + "model": "TITAN Xp", + "performance": { + "fp-16": 177600000000, + "fp-32": 12149700000000, + "fp-64": 355200000000 + }, + "power_default_limit": "250.00 W", + "vbios_version": "86.02.3D.00.01", + "vendor": "Nvidia" + }, + "nvidia1": { + "compute_capability": "6.1", + "cores": 3840, + "cpu_affinity": 1, + "device": "/dev/nvidia1", + "memory": 12884901888, + "microarchitecture": "Pascal", + "model": "TITAN Xp", + "performance": { + "fp-16": 177600000000, + "fp-32": 12149700000000, + "fp-64": 355200000000 + }, + "power_default_limit": "250.00 W", + "vbios_version": "86.02.3D.00.01", + "vendor": "Nvidia" + } + }, + "main_memory": { + "ram_size": 103079215104 + }, + "management_tools": { + "bmc_vendor_tool": "racadm", + "ipmitool": { + "retries": 5 + } + }, + "memory_devices": [ + { + "device": "dimm_a1", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_a2", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_a3", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_a4", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_a5", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_a6", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b1", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b2", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b3", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b4", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b5", + "size": 8589934592, + "technology": "dram" + }, + { + "device": "dimm_b6", + "size": 8589934592, + "technology": "dram" + } + ], + "network_adapters": [ + { + "device": "eth0", + "driver": "bnxt_en", + "enabled": true, + "firmware_version": "214.0.166.0/pkg 21.40.16.60", + "interface": "Ethernet", + "ip": "172.16.27.6", + "ip6": "2001:660:4406:100:c::6", + "kavlan": false, + "mac": "00:0a:f7:bf:1e:46", + "management": false, + "model": "BCM57412 NetXtreme-E 10Gb RDMA Ethernet Controller", + "mountable": true, + "mounted": true, + "name": "enp1s0f0np0", + "network_address": "vercors3-2.grenoble.grid5000.fr", + "rate": 10000000000, + "sriov": false, + "sriov_totalvfs": 0, + "switch": "imag-1b-F2-prod-01", + "switch_port": "1/1/8", + "vendor": "Broadcom Inc. and subsidiaries" + }, + { + "device": "eth1", + "driver": "bnxt_en", + "enabled": false, + "firmware_version": "214.0.166.0/pkg 21.40.16.60", + "interface": "Ethernet", + "kavlan": false, + "mac": "00:0a:f7:bf:1e:47", + "management": false, + "model": "BCM57412 NetXtreme-E 10Gb RDMA Ethernet Controller", + "mountable": false, + "mounted": false, + "name": "eno2np1", + "sriov": false, + "sriov_totalvfs": 0, + "vendor": "Broadcom Inc. and subsidiaries" + }, + { + "device": "eth2", + "driver": "tg3", + "enabled": false, + "firmware_version": "FFV20.6.52 bc 5720-v1.39", + "interface": "Ethernet", + "kavlan": false, + "mac": "00:0a:f7:bf:1e:44", + "management": false, + "model": "NetXtreme BCM5720 2-port Gigabit Ethernet PCIe", + "mountable": false, + "mounted": false, + "name": "eno3", + "sriov": false, + "sriov_totalvfs": 0, + "vendor": "Broadcom Inc. and subsidiaries" + }, + { + "device": "eth3", + "driver": "tg3", + "enabled": false, + "firmware_version": "FFV20.6.52 bc 5720-v1.39", + "interface": "Ethernet", + "kavlan": false, + "mac": "00:0a:f7:bf:1e:45", + "management": false, + "model": "NetXtreme BCM5720 2-port Gigabit Ethernet PCIe", + "mountable": false, + "mounted": false, + "name": "eno4", + "sriov": false, + "sriov_totalvfs": 0, + "vendor": "Broadcom Inc. and subsidiaries" + }, + { + "device": "bmc", + "enabled": true, + "interface": "Ethernet", + "ip": "172.17.27.6", + "kavlan": false, + "mac": "58:8a:5a:ee:6e:ca", + "management": true, + "mountable": false, + "mounted": false, + "network_address": "vercors3-2-bmc.grenoble.grid5000.fr" + } + ], + "nodeset": "vercors3", + "operating_system": { + "cstate_driver": "intel_idle", + "cstate_governor": "menu", + "ht_enabled": true, + "pstate_driver": "intel_pstate", + "pstate_governor": "performance", + "turboboost_enabled": true + }, + "performance": { + "core_flops": 35200000000, + "node_flops": 704000000000 + }, + "processor": { + "cache_l1": null, + "cache_l1d": 32768, + "cache_l1i": 32768, + "cache_l2": 1048576, + "cache_l3": 14417920, + "clock_speed": 2200000000, + "ht_capable": true, + "instruction_set": "x86-64", + "microarchitecture": "Skylake-SP", + "microcode": "0x2007006", + "model": "Intel Xeon", + "other_description": "Intel(R) Xeon(R) Silver 4114 CPU @ 2.20GHz", + "vendor": "Intel", + "version": "Silver 4114" + }, + "redfish": true, + "software": { + "forced-deployment-timestamp": 202007300948, + "postinstall-version": "1.2025040409", + "standard-environment": "debian11-x64-std" + }, + "storage_devices": [ + { + "by_id": "/dev/disk/by-id/wwn-0x6d0946604592b100226a26d009660c51", + "by_path": "/dev/disk/by-path/pci-0000:18:00.0-scsi-0:2:0:0", + "firmware_version": 4.27, + "id": "disk0", + "interface": "SAS", + "model": "PERC H730P Adp", + "size": 999653638144, + "storage": "HDD", + "vendor": "Dell" + }, + { + "by_id": "/dev/disk/by-id/wwn-0x6d0946604592b100226a27390f9fb4b1", + "by_path": "/dev/disk/by-path/pci-0000:18:00.0-scsi-0:2:1:0", + "firmware_version": 4.27, + "id": "disk1", + "interface": "SAS", + "model": "PERC H730P Adp", + "size": 4000225165312, + "storage": "HDD", + "vendor": "Dell" + } + ], + "supported_job_types": { + "besteffort": true, + "deploy": true, + "max_walltime": 0, + "queues": [ + "admin", + "testing" + ], + "virtual": false + }, + "type": "node", + "uid": "vercors3-2" +} \ No newline at end of file diff --git a/data/grid5000/sites/grenoble/clusters/vercors3/vercors3.json b/data/grid5000/sites/grenoble/clusters/vercors3/vercors3.json new file mode 100644 index 0000000000000000000000000000000000000000..d06e2878a659b682f907c314685af50e7a341b7f --- /dev/null +++ b/data/grid5000/sites/grenoble/clusters/vercors3/vercors3.json @@ -0,0 +1,93 @@ +{ + "boot_type": "bios", + "created_at": "Wed, 02 Apr 2025 00:00:00 GMT", + "exotic": false, + "kavlan": false, + "manufactured_at": "2018-03-13", + "metrics": [ + { + "description": "Default subset of metrics from Prometheus Node Exporter", + "name": "prom_default_metrics", + "optional_period": 15000, + "period": 0, + "source": { + "id": [ + "node_boot_time_seconds", + "node_cpu_scaling_frequency_hertz", + "node_cpu_seconds_total", + "node_filesystem_free_bytes", + "node_filesystem_size_bytes", + "node_load1", + "node_load15", + "node_load5", + "node_memory_Buffers_bytes", + "node_memory_Cached_bytes", + "node_memory_MemAvailable_bytes", + "node_memory_MemFree_bytes", + "node_memory_MemTotal_bytes", + "node_memory_Shmem_bytes", + "node_memory_SwapFree_bytes", + "node_memory_SwapTotal_bytes", + "node_network_receive_bytes_total", + "node_network_receive_packets_total", + "node_network_transmit_bytes_total", + "node_network_transmit_packets_total", + "node_procs_blocked", + "node_procs_running", + "kwollect_custom" + ], + "port": 9100, + "protocol": "prometheus" + } + }, + { + "description": "All metrics from Prometheus Node Exporter", + "name": "prom_all_metrics", + "optional_period": 15000, + "period": 0, + "source": { + "port": 9100, + "protocol": "prometheus" + } + }, + { + "description": "Default subset of metrics from Prometheus Nvidia DCGM Exporter", + "name": "prom_nvgpu_default_metrics", + "optional_period": 15000, + "period": 0, + "source": { + "id": [ + "DCGM_FI_DEV_SM_CLOCK", + "DCGM_FI_DEV_MEM_CLOCK", + "DCGM_FI_DEV_GPU_TEMP", + "DCGM_FI_DEV_POWER_USAGE", + "DCGM_FI_DEV_MEM_COPY_UTIL" + ], + "port": 9400, + "protocol": "prometheus" + } + }, + { + "description": "All metrics from Prometheus Nvidia DCGM Exporter", + "name": "prom_nvgpu_all_metrics", + "optional_period": 15000, + "period": 0, + "source": { + "port": 9400, + "protocol": "prometheus" + } + } + ], + "model": "Dell PowerEdge R740", + "nodes_count": 2, + "nodes_description": "2 CPUs Intel Xeon Silver 4114, 10 cores/CPU, 2 GPUs TITAN Xp, 96GB RAM, 931GB HDD, 3725GB HDD, 1 x 10Gb Ethernet", + "priority": 201903, + "queues": [ + "admin", + "testing" + ], + "redfish": true, + "type": "cluster", + "uid": "vercors3", + "warranty_end": "2023-03-13" +} \ No newline at end of file diff --git a/data/grid5000/sites/grenoble/network_equipments/imag-1b-F2-admin-01.json b/data/grid5000/sites/grenoble/network_equipments/imag-1b-F2-admin-01.json index 24f334f25e96ca9517faabc0c09a7f92eefcf078..052afddf929173f32db64c04b220584a67b41ba3 100644 --- a/data/grid5000/sites/grenoble/network_equipments/imag-1b-F2-admin-01.json +++ b/data/grid5000/sites/grenoble/network_equipments/imag-1b-F2-admin-01.json @@ -29,8 +29,14 @@ { }, { + "kind": "other", + "snmp_name": "1/1/9", + "uid": "vercors3-2-bmc" }, { + "kind": "other", + "snmp_name": "1/1/10", + "uid": "vercors3-1-bmc" }, { }, diff --git a/data/grid5000/sites/grenoble/network_equipments/imag-1b-F2-prod-01.json b/data/grid5000/sites/grenoble/network_equipments/imag-1b-F2-prod-01.json index 2b7cd93e7a17c0ee79f7e324460133d85a64bbf9..2ab54309353195aaf246114ad47c3528eb001141 100644 --- a/data/grid5000/sites/grenoble/network_equipments/imag-1b-F2-prod-01.json +++ b/data/grid5000/sites/grenoble/network_equipments/imag-1b-F2-prod-01.json @@ -36,8 +36,18 @@ "uid": "vercors2-2" }, { + "kind": "node", + "port": "eth0", + "rate": 10000000000, + "snmp_name": "1/1/7", + "uid": "vercors3-1" }, { + "kind": "node", + "port": "eth0", + "rate": 10000000000, + "snmp_name": "1/1/8", + "uid": "vercors3-2" }, { }, diff --git a/input/grid5000/dell-product-data.yaml b/input/grid5000/dell-product-data.yaml index da54453f07db36ca83e6b74c3c0a19cd83474148..2caaffbfef92e95bac32994b50144fe76a65be95 100644 --- a/input/grid5000/dell-product-data.yaml +++ b/input/grid5000/dell-product-data.yaml @@ -206,6 +206,16 @@ sites: chassis: manufactured_at: 2016-10-24 warranty_end: 2021-10-23 + vercors3: + nodes: + vercors3-1: + chassis: + manufactured_at: 2018-03-13 + warranty_end: 2023-03-13 + vercors3-2: + chassis: + manufactured_at: 2018-03-13 + warranty_end: 2023-03-13 yeti: nodes: yeti-1: diff --git a/input/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-1.yaml b/input/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-1.yaml new file mode 100644 index 0000000000000000000000000000000000000000..6541604e9a8b207bb969bcd7659217ec9b06283d --- /dev/null +++ b/input/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-1.yaml @@ -0,0 +1,161 @@ +# Generated by g5k-checks (g5k-checks -m api) +--- +vercors3-1: + architecture: + cpu_core_numbering: round-robin + nb_cores: 20 + nb_procs: 2 + nb_threads: 40 + platform_type: x86_64 + bios: + release_date: 01/07/2025 + vendor: Dell Inc. + version: 2.23.0 + bmc_version: 3.15.17.15 + chassis: + manufacturer: Dell Inc. + name: PowerEdge R740 + serial: GFHZMN2 + gpu_devices: + nvidia0: + cpu_affinity: 0 + device: "/dev/nvidia0" + memory: 12884901888 + model: TITAN Xp + power_default_limit: 250.00 W + vbios_version: 86.02.3D.00.01 + vendor: Nvidia + nvidia1: + cpu_affinity: 1 + device: "/dev/nvidia1" + memory: 12884901888 + model: TITAN Xp + power_default_limit: 250.00 W + vbios_version: 86.02.3D.00.01 + vendor: Nvidia + main_memory: + ram_size: 103079215104 + memory_devices: + dimm_a1: + size: 8589934592 + technology: dram + dimm_a2: + size: 8589934592 + technology: dram + dimm_a3: + size: 8589934592 + technology: dram + dimm_a4: + size: 8589934592 + technology: dram + dimm_a5: + size: 8589934592 + technology: dram + dimm_a6: + size: 8589934592 + technology: dram + dimm_b1: + size: 8589934592 + technology: dram + dimm_b2: + size: 8589934592 + technology: dram + dimm_b3: + size: 8589934592 + technology: dram + dimm_b4: + size: 8589934592 + technology: dram + dimm_b5: + size: 8589934592 + technology: dram + dimm_b6: + size: 8589934592 + technology: dram + network_adapters: + bmc: + ip: 172.17.27.5 + mac: 58:8a:5a:ee:70:2c + management: true + eth0: + driver: bnxt_en + firmware_version: 214.0.166.0/pkg 21.40.16.60 + interface: Ethernet + ip: 172.16.27.5 + mac: 00:0a:f7:bf:4d:bc + management: false + model: BCM57412 NetXtreme-E 10Gb RDMA Ethernet Controller + name: enp1s0f0np0 + rate: 10000000000 + sriov: false + sriov_totalvfs: 0 + vendor: Broadcom Inc. and subsidiaries + eth1: + driver: bnxt_en + firmware_version: 214.0.166.0/pkg 21.40.16.60 + interface: Ethernet + mac: 00:0a:f7:bf:4d:bd + management: false + model: BCM57412 NetXtreme-E 10Gb RDMA Ethernet Controller + name: eno2np1 + sriov: false + sriov_totalvfs: 0 + vendor: Broadcom Inc. and subsidiaries + eth2: + driver: tg3 + firmware_version: FFV20.6.52 bc 5720-v1.39 + interface: Ethernet + mac: 00:0a:f7:bf:4d:ba + management: false + model: NetXtreme BCM5720 2-port Gigabit Ethernet PCIe + name: eno3 + sriov: false + sriov_totalvfs: 0 + vendor: Broadcom Inc. and subsidiaries + eth3: + driver: tg3 + firmware_version: FFV20.6.52 bc 5720-v1.39 + interface: Ethernet + mac: 00:0a:f7:bf:4d:bb + management: false + model: NetXtreme BCM5720 2-port Gigabit Ethernet PCIe + name: eno4 + sriov: false + sriov_totalvfs: 0 + vendor: Broadcom Inc. and subsidiaries + operating_system: + cstate_driver: intel_idle + cstate_governor: menu + ht_enabled: true + pstate_driver: intel_pstate + pstate_governor: performance + turboboost_enabled: true + processor: + cache_l1d: 32768 + cache_l1i: 32768 + cache_l2: 1048576 + cache_l3: 14417920 + ht_capable: true + instruction_set: x86-64 + microcode: '0x2007006' + model: Intel Xeon + other_description: Intel(R) Xeon(R) Silver 4114 CPU @ 2.20GHz + vendor: Intel + version: Silver 4114 + storage_devices: + pci-0000:18:00.0-scsi-0:2:0:0: + by_id: "/dev/disk/by-id/wwn-0x6d09466045928a00226a1f510f4dd264" + by_path: "/dev/disk/by-path/pci-0000:18:00.0-scsi-0:2:0:0" + firmware_version: 4.27 + model: PERC H730P Adp + size: 999653638144 + storage: HDD + pci-0000:18:00.0-scsi-0:2:1:0: + by_id: "/dev/disk/by-id/wwn-0x6d09466045928a00226a1f5c0ff46d69" + by_path: "/dev/disk/by-path/pci-0000:18:00.0-scsi-0:2:1:0" + firmware_version: 4.27 + model: PERC H730P Adp + size: 4000225165312 + storage: HDD + supported_job_types: + virtual: false diff --git a/input/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-2.yaml b/input/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-2.yaml new file mode 100644 index 0000000000000000000000000000000000000000..8bb7b11be635a849fef24a20d50bfa74cd108509 --- /dev/null +++ b/input/grid5000/sites/grenoble/clusters/vercors3/nodes/vercors3-2.yaml @@ -0,0 +1,161 @@ +# Generated by g5k-checks (g5k-checks -m api) +--- +vercors3-2: + architecture: + cpu_core_numbering: round-robin + nb_cores: 20 + nb_procs: 2 + nb_threads: 40 + platform_type: x86_64 + bios: + release_date: 01/07/2025 + vendor: Dell Inc. + version: 2.23.0 + bmc_version: 3.15.17.15 + chassis: + manufacturer: Dell Inc. + name: PowerEdge R740 + serial: GFJ4NN2 + gpu_devices: + nvidia0: + cpu_affinity: 0 + device: "/dev/nvidia0" + memory: 12884901888 + model: TITAN Xp + power_default_limit: 250.00 W + vbios_version: 86.02.3D.00.01 + vendor: Nvidia + nvidia1: + cpu_affinity: 1 + device: "/dev/nvidia1" + memory: 12884901888 + model: TITAN Xp + power_default_limit: 250.00 W + vbios_version: 86.02.3D.00.01 + vendor: Nvidia + main_memory: + ram_size: 103079215104 + memory_devices: + dimm_a1: + size: 8589934592 + technology: dram + dimm_a2: + size: 8589934592 + technology: dram + dimm_a3: + size: 8589934592 + technology: dram + dimm_a4: + size: 8589934592 + technology: dram + dimm_a5: + size: 8589934592 + technology: dram + dimm_a6: + size: 8589934592 + technology: dram + dimm_b1: + size: 8589934592 + technology: dram + dimm_b2: + size: 8589934592 + technology: dram + dimm_b3: + size: 8589934592 + technology: dram + dimm_b4: + size: 8589934592 + technology: dram + dimm_b5: + size: 8589934592 + technology: dram + dimm_b6: + size: 8589934592 + technology: dram + network_adapters: + bmc: + ip: 172.17.27.6 + mac: 58:8a:5a:ee:6e:ca + management: true + eth0: + driver: bnxt_en + firmware_version: 214.0.166.0/pkg 21.40.16.60 + interface: Ethernet + ip: 172.16.27.6 + mac: 00:0a:f7:bf:1e:46 + management: false + model: BCM57412 NetXtreme-E 10Gb RDMA Ethernet Controller + name: enp1s0f0np0 + rate: 10000000000 + sriov: false + sriov_totalvfs: 0 + vendor: Broadcom Inc. and subsidiaries + eth1: + driver: bnxt_en + firmware_version: 214.0.166.0/pkg 21.40.16.60 + interface: Ethernet + mac: 00:0a:f7:bf:1e:47 + management: false + model: BCM57412 NetXtreme-E 10Gb RDMA Ethernet Controller + name: eno2np1 + sriov: false + sriov_totalvfs: 0 + vendor: Broadcom Inc. and subsidiaries + eth2: + driver: tg3 + firmware_version: FFV20.6.52 bc 5720-v1.39 + interface: Ethernet + mac: 00:0a:f7:bf:1e:44 + management: false + model: NetXtreme BCM5720 2-port Gigabit Ethernet PCIe + name: eno3 + sriov: false + sriov_totalvfs: 0 + vendor: Broadcom Inc. and subsidiaries + eth3: + driver: tg3 + firmware_version: FFV20.6.52 bc 5720-v1.39 + interface: Ethernet + mac: 00:0a:f7:bf:1e:45 + management: false + model: NetXtreme BCM5720 2-port Gigabit Ethernet PCIe + name: eno4 + sriov: false + sriov_totalvfs: 0 + vendor: Broadcom Inc. and subsidiaries + operating_system: + cstate_driver: intel_idle + cstate_governor: menu + ht_enabled: true + pstate_driver: intel_pstate + pstate_governor: performance + turboboost_enabled: true + processor: + cache_l1d: 32768 + cache_l1i: 32768 + cache_l2: 1048576 + cache_l3: 14417920 + ht_capable: true + instruction_set: x86-64 + microcode: '0x2007006' + model: Intel Xeon + other_description: Intel(R) Xeon(R) Silver 4114 CPU @ 2.20GHz + vendor: Intel + version: Silver 4114 + storage_devices: + pci-0000:18:00.0-scsi-0:2:0:0: + by_id: "/dev/disk/by-id/wwn-0x6d0946604592b100226a26d009660c51" + by_path: "/dev/disk/by-path/pci-0000:18:00.0-scsi-0:2:0:0" + firmware_version: 4.27 + model: PERC H730P Adp + size: 999653638144 + storage: HDD + pci-0000:18:00.0-scsi-0:2:1:0: + by_id: "/dev/disk/by-id/wwn-0x6d0946604592b100226a27390f9fb4b1" + by_path: "/dev/disk/by-path/pci-0000:18:00.0-scsi-0:2:1:0" + firmware_version: 4.27 + model: PERC H730P Adp + size: 4000225165312 + storage: HDD + supported_job_types: + virtual: false diff --git a/input/grid5000/sites/grenoble/clusters/vercors3/vercors3.yaml b/input/grid5000/sites/grenoble/clusters/vercors3/vercors3.yaml new file mode 100644 index 0000000000000000000000000000000000000000..23c71b3774ec46b3173b9fcd4cdf6fdd7812d444 --- /dev/null +++ b/input/grid5000/sites/grenoble/clusters/vercors3/vercors3.yaml @@ -0,0 +1,52 @@ +--- +model: Dell PowerEdge R740 +created_at: 2025-04-02 +kavlan: false +boot_type: bios +exotic: false +queues: + - admin + - testing +nodes: + vercors3-[1-2]: + supported_job_types: + deploy: true + besteffort: true + max_walltime: 0 + processor: + microarchitecture: Skylake-SP + clock_speed: 2_200_000_000 + network_adapters: + bmc: + interface: Ethernet + enabled: true + mountable: false + mounted: false + eth0: + enabled: true + mountable: true + mounted: true + eth1: + enabled: false + mountable: false + mounted: false + eth2: + enabled: false + mountable: false + mounted: false + eth3: + enabled: false + mountable: false + mounted: false + storage_devices: + pci-0000:18:00.0-scsi-0:2:0:0: + id: disk0 + interface: SAS + pci-0000:18:00.0-scsi-0:2:1:0: + id: disk1 + interface: SAS + software: + standard-environment: debian11-x64-std + management_tools: + bmc_vendor_tool: racadm + nodeset: vercors3 diff --git a/input/grid5000/sites/grenoble/clusters/vercors3/vercors3_metrics.yaml b/input/grid5000/sites/grenoble/clusters/vercors3/vercors3_metrics.yaml new file mode 100644 index 0000000000000000000000000000000000000000..03c90530a6f9ec3c37a21be92fe25da2ac9cca9c --- /dev/null +++ b/input/grid5000/sites/grenoble/clusters/vercors3/vercors3_metrics.yaml @@ -0,0 +1,63 @@ +--- +metrics: + + - name: prom_default_metrics + description: Default subset of metrics from Prometheus Node Exporter + period: 0 + optional_period: 15000 + source: + protocol: prometheus + port: 9100 + id: + - node_boot_time_seconds + - node_cpu_scaling_frequency_hertz + - node_cpu_seconds_total + - node_filesystem_free_bytes + - node_filesystem_size_bytes + - node_load1 + - node_load15 + - node_load5 + - node_memory_Buffers_bytes + - node_memory_Cached_bytes + - node_memory_MemAvailable_bytes + - node_memory_MemFree_bytes + - node_memory_MemTotal_bytes + - node_memory_Shmem_bytes + - node_memory_SwapFree_bytes + - node_memory_SwapTotal_bytes + - node_network_receive_bytes_total + - node_network_receive_packets_total + - node_network_transmit_bytes_total + - node_network_transmit_packets_total + - node_procs_blocked + - node_procs_running + - kwollect_custom + + - name: prom_all_metrics + description: All metrics from Prometheus Node Exporter + period: 0 + optional_period: 15000 + source: + protocol: prometheus + port: 9100 + - name: prom_nvgpu_default_metrics + description: Default subset of metrics from Prometheus Nvidia DCGM Exporter + period: 0 + optional_period: 15000 + source: + protocol: prometheus + port: 9400 + id: + - DCGM_FI_DEV_SM_CLOCK + - DCGM_FI_DEV_MEM_CLOCK + - DCGM_FI_DEV_GPU_TEMP + - DCGM_FI_DEV_POWER_USAGE + - DCGM_FI_DEV_MEM_COPY_UTIL + + - name: prom_nvgpu_all_metrics + description: All metrics from Prometheus Nvidia DCGM Exporter + period: 0 + optional_period: 15000 + source: + protocol: prometheus + port: 9400 diff --git a/input/grid5000/sites/grenoble/networks/imag-1b-F2-admin-01.yaml b/input/grid5000/sites/grenoble/networks/imag-1b-F2-admin-01.yaml index da4a4bdaf4e175b7b5ff005c867e3001ed458ba4..78b6c3d7a0d452b7fb45dabbb65f956e6f98eafa 100644 --- a/input/grid5000/sites/grenoble/networks/imag-1b-F2-admin-01.yaml +++ b/input/grid5000/sites/grenoble/networks/imag-1b-F2-admin-01.yaml @@ -16,6 +16,12 @@ imag-1b-F2-admin-01: rate: 10_000_000_000 backplane_bps: 1_760_000_000_000 ports: + 9: + uid: vercors3-2-bmc + kind: other + 10: + uid: vercors3-1-bmc + kind: other #40: # uid: imag-1b-F1-prod-01-mgmt # kind: switch diff --git a/input/grid5000/sites/grenoble/networks/imag-1b-F2-prod-01.yaml b/input/grid5000/sites/grenoble/networks/imag-1b-F2-prod-01.yaml index 2828a4dec1874031cc86c31afb618d37f8bd11c2..6bd2c7848b3f2de67bf4b58f6fdb4afc93a9f877 100644 --- a/input/grid5000/sites/grenoble/networks/imag-1b-F2-prod-01.yaml +++ b/input/grid5000/sites/grenoble/networks/imag-1b-F2-prod-01.yaml @@ -23,6 +23,12 @@ imag-1b-F2-prod-01: 6: uid: vercors2-2 rate: 1_000_000_000 + 7: + uid: vercors3-1 + rate: 10_000_000_000 + 8: + uid: vercors3-2 + rate: 10_000_000_000 44: uid: imag-1b-F2-admin-01 kind: switch diff --git a/lib/refrepo/gpu_ref.rb b/lib/refrepo/gpu_ref.rb index 48874d4fc4bcd1b6b57153a4c5a5deb611e862a7..d9a84793bbb4108a78cd098cbf3197fffd9e0335 100644 --- a/lib/refrepo/gpu_ref.rb +++ b/lib/refrepo/gpu_ref.rb @@ -140,6 +140,18 @@ class GPURef 'fp-64' => 342900000000, }, }, + 'TITAN Xp' => { + 'cores' => 3840, + 'compute_capability' => '6.1', + 'short_name' => 'TITAN Xp', + 'alias' => 'titanxp', + 'microarchitecture' => 'Pascal', + 'performance' => { + 'fp-16' => 177600000000, + 'fp-32' => 12149700000000, + 'fp-64' => 355200000000, + }, + }, 'GeForce GTX TITAN X' => { 'cores' => 3072, 'compute_capability' => '5.2', diff --git a/lib/refrepo/net_names_mapping.yaml b/lib/refrepo/net_names_mapping.yaml index cf1c3c7dd9e2d3412a92b15f3dad9f40da431b64..24a6a349cd45f8b0ec854d80a92d268875d1e7ff 100644 --- a/lib/refrepo/net_names_mapping.yaml +++ b/lib/refrepo/net_names_mapping.yaml @@ -383,6 +383,11 @@ vercors2: eno2: eth1 eno3: eth2 eno4: eth3 +vercors3: + enp1s0f0np0: eth0 + eno2np1: eth1 + eno3: eth2 + eno4: eth3 vianden: enp1s0f0np0: eth0 eno12409np1: eth1