From d6dfb3ddbb9e0e644582b9a90ac73657acf52561 Mon Sep 17 00:00:00 2001 From: Noah Mandler <noah.mandler@inria.fr> Date: Wed, 5 Feb 2025 10:43:03 +0100 Subject: [PATCH 1/7] [rennes][abacus28] Reference Repository minimal configuration --- .../rennes/clusters/abacus28/abacus28.json | 20 +++ .../clusters/abacus28/nodes/abacus28-1.json | 128 ++++++++++++++++++ input/grid5000/ipv4.yaml | 1 + .../rennes/clusters/abacus28/abacus28.yaml | 41 ++++++ .../rennes/clusters/abacus28/nodes.yaml.erb | 78 +++++++++++ lib/refrepo/input_loader.rb | 2 +- 6 files changed, 269 insertions(+), 1 deletion(-) create mode 100644 data/grid5000/sites/rennes/clusters/abacus28/abacus28.json create mode 100644 data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json create mode 100644 input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml create mode 100644 input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb diff --git a/data/grid5000/sites/rennes/clusters/abacus28/abacus28.json b/data/grid5000/sites/rennes/clusters/abacus28/abacus28.json new file mode 100644 index 00000000000..1d5acad21ac --- /dev/null +++ b/data/grid5000/sites/rennes/clusters/abacus28/abacus28.json @@ -0,0 +1,20 @@ +{ + "boot_type": "uefi", + "created_at": "Wed, 05 Feb 2025 00:00:00 GMT", + "exotic": false, + "kavlan": false, + "manufactured_at": "2024-12-06", + "metrics": [ + + ], + "model": "Dell PowerEdge C4140", + "priority": 202412, + "queues": [ + "admin", + "testing" + ], + "redfish": true, + "type": "cluster", + "uid": "abacus28", + "warranty_end": "2027-12-06" +} \ No newline at end of file diff --git a/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json b/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json new file mode 100644 index 00000000000..88d00ed3037 --- /dev/null +++ b/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json @@ -0,0 +1,128 @@ +{ + "architecture": { + "cpu_core_numbering": "contiguous", + "nb_cores": 72, + "nb_procs": 1, + "nb_threads": 72, + "platform_type": "x86_64" + }, + "bios": { + "release_date": "01/01/2000", + "vendor": "Unknown", + "version": 1 + }, + "bmc_version": "v1", + "chassis": { + "manufactured_at": "2024-12-06", + "manufacturer": "Unknown", + "name": "Unknown", + "warranty_end": "2027-12-06" + }, + "exotic": false, + "main_memory": { + "ram_size": 8 + }, + "management_tools": { + "bmc_vendor_tool": "racadm", + "ipmitool": { + "retries": 5 + } + }, + "memory_devices": [ + { + "device": "dimm_proc 1 dimm 1", + "size": 8, + "technology": "dram" + } + ], + "network_adapters": [ + { + "device": "eth0", + "driver": "mlx_core", + "enabled": true, + "interface": "Ethernet", + "ip": "172.16.109.31", + "ip6": "2001:660:4406:700:e::1f", + "kavlan": false, + "mac": "78:ac:44:15:dc:cc", + "management": false, + "mountable": true, + "mounted": true, + "name": "enp1s0f0np0", + "network_address": "abacus28-1.rennes.grid5000.fr", + "rate": 10000000000, + "switch": null, + "switch_port": null + }, + { + "device": "bmc", + "enabled": true, + "interface": "Ethernet", + "ip": "172.17.109.31", + "kavlan": false, + "mac": "70:b5:e8:e3:e0:d8", + "management": true, + "mountable": false, + "mounted": false, + "network_address": "abacus28-1-bmc.rennes.grid5000.fr" + } + ], + "nodeset": "abacus28", + "operating_system": { + "cstate_driver": "unknown", + "cstate_governor": "unknown", + "ht_enabled": true, + "pstate_driver": "unknwon", + "pstate_governor": "unknown", + "turboboost_enabled": true + }, + "performance": { + "core_flops": 33600000000, + "node_flops": 2419200000000 + }, + "processor": { + "cache_l1": null, + "cache_l1d": 8, + "cache_l1i": 8, + "cache_l2": 8, + "cache_l3": 8, + "clock_speed": 2100000000, + "ht_capable": true, + "instruction_set": "x86-64", + "microarchitecture": "Cascade Lake-SP", + "microcode": "0xd000001", + "model": "Intel Xeon", + "other_description": "Intel(R) Xeon(R) Silver 4216 CPU @ 2.10GHz", + "vendor": "Intel", + "version": "Silver 4216" + }, + "redfish": true, + "software": { + "forced-deployment-timestamp": 202007300948, + "postinstall-version": "1.2025011610", + "standard-environment": "debian11-x64-std" + }, + "storage_devices": [ + { + "by_id": "", + "by_path": "/dev/disk/by-path/dummy", + "id": "disk0", + "interface": "SAS", + "model": "unknown", + "size": 8, + "storage": "SSD", + "vendor": "Unknown" + } + ], + "supported_job_types": { + "besteffort": true, + "deploy": true, + "max_walltime": 0, + "queues": [ + "admin", + "testing" + ] + }, + "type": "node", + "uid": "abacus28-1" +} \ No newline at end of file diff --git a/input/grid5000/ipv4.yaml b/input/grid5000/ipv4.yaml index 332a8e5bc8e..4da3e04760e 100644 --- a/input/grid5000/ipv4.yaml +++ b/input/grid5000/ipv4.yaml @@ -97,6 +97,7 @@ ipv4: rennes abacus25 eth0 0 0 13 24 rennes abacus26 eth0 0 0 13 28 rennes abacus27 eth0 0 0 13 29 + rennes abacus28 eth0 0 0 13 30 rennes roazhon1 eth1 0 0 14 0 rennes roazhon2 eth0 0 0 14 1 rennes roazhon3 eth0 0 0 14 2 diff --git a/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml b/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml new file mode 100644 index 00000000000..304433af955 --- /dev/null +++ b/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml @@ -0,0 +1,41 @@ +--- +model: Dell PowerEdge C4140 +created_at: 2025-02-05 +kavlan: false +boot_type: uefi +exotic: false +queues: + - admin + - testing +nodes: + abacus28-1: + chassis: + manufactured_at: 2024-12-06 + warranty_end: 2027-12-06 + supported_job_types: + deploy: true + besteffort: true + max_walltime: 0 + processor: + microarchitecture: Cascade Lake-SP + clock_speed: 2100000000 + network_adapters: + bmc: + interface: Ethernet + enabled: true + mountable: false + mounted: false + eth0: + enabled: true + mountable: true + mounted: true + storage_devices: + disk0: # This field will have to be renamed later. + id: disk0 + interface: SAS + by_path: "/dev/disk/by-path/dummy" # this path will have to change later. + software: + standard-environment: debian11-x64-std + management_tools: + bmc_vendor_tool: racadm + nodeset: abacus28 \ No newline at end of file diff --git a/input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb b/input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb new file mode 100644 index 00000000000..eb14a7c9bec --- /dev/null +++ b/input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb @@ -0,0 +1,78 @@ +<% + cluster_name = "abacus28" + nodes_number = 1 + # MAC addresses declaration + mac_eth0_list = %w( + 78:ac:44:15:dc:cc + ) + + mac_bmc_list = %w( + 70:b5:e8:e3:e0:d8 + ) +%> +--- +nodes: +<% (1..nodes_number).each { |i| %> + <%= cluster_name %>-<%= i %>: + architecture: + nb_procs: 1 + nb_cores: 72 + nb_threads: 72 + platform_type: x86_64 + cpu_core_numbering: contiguous + bios: + release_date: 01/01/2000 # Fake date, will be replaced by g5k-checks + vendor: Unknown # Fake vendor, will be replaced by g5k-checks + version: 1 # Fake version, will be replaced by g5k-checks + bmc_version: v1 # Fake version, will be replaced by g5k-checks + chassis: + manufacturer: Unknown # Fake manufacturer, will be replaced by g5k-checks + name: Unknown # Fake name, will be replaced by g5k-checks + main_memory: + ram_size: 8 # Fake size, will be replaced by g5k-checks + memory_devices: + dimm: + size: 8 # Fake size, will be replaced by g5k-checks + technology: dram # Common memory technology, will be replaced by g5k-checks + processor: + model: Intel Xeon + other_description: Intel(R) Xeon(R) Silver 4216 CPU @ 2.10GHz + vendor: Intel + version: Silver 4216 + cache_l1d: 8 # Fake cache, will be replaced by g5k-checks + cache_l1i: 8 # Fake cache, will be replaced by g5k-checks + cache_l2: 8 # Fake cache, will be replaced by g5k-checks + cache_l3: 8 # Fake cache, will be replaced by g5k-checks + instruction_set: x86-64 # Common instruction set, will be replaced by g5k-checks + microcode: "0xd000001" # Fake microcode, will be replaced by g5k-checks + ht_capable: true # Default ht capable value, will be replaced by g5k-checks + main_memory: + ram_size: 8 # Fake ram size, will be replaced by g5k-checks + memory_devices: + dimm_proc 1 dimm 1: # Fake dimm name, will be replaced by g5k-checks + size: 8 # Fake dimm size, will be replaced by g5k-checks + technology: dram # Default dimm technology, will be replaced by g5k-checks + operating_system: + cstate_driver: unknown # Fake driver, will be replaced by g5k-checks + cstate_governor: unknown # Fake governor, will be replaced by g5k-checks + ht_enabled: true # common value for hyper threading, will be replaced by g5k-checks + pstate_driver: unknwon # Fake driver, will be replaced by g5k-checks + pstate_governor: unknown # Fake driver, will be replaced by g5k-checks + turboboost_enabled: true # Default value for turboboost, will be replaced by g5k-checks + network_adapters: + bmc: + management: true + mac: <%= mac_bmc_list[i - 1] %> + eth0: + interface: Ethernet + management: false + driver: mlx_core + name: enp1s0f0np0 + rate: 10000000000 + mac: <%= mac_eth0_list[i - 1] %> + storage_devices: + disk0: + storage: SSD # Common value, will be replaced by g5k-checks + model: unknown # fake value, + size: 8 # Fake value, will be replaced by g5k-checks +<% } %> diff --git a/lib/refrepo/input_loader.rb b/lib/refrepo/input_loader.rb index b93350b45e1..11daefda2fb 100644 --- a/lib/refrepo/input_loader.rb +++ b/lib/refrepo/input_loader.rb @@ -742,7 +742,7 @@ def get_flops_per_cycle(microarch, cpu_name, cluster_uid) return 48 when "Cascade Lake-SP", "Skylake-SP" case cpu_name - when /Silver 4110/, /Silver 4114/, /Silver 4214/, /Gold 5218/, /Gold 5220/, /Gold 5115/, /Gold 5118/, /Gold 5120/, /Gold 5220R/ + when /Silver 4110/, /Silver 4114/, /Silver 4214/, /Silver 4216/, /Gold 5218/, /Gold 5220/, /Gold 5115/, /Gold 5118/, /Gold 5120/, /Gold 5220R/ return 16 when /Gold 6126/, /Gold 6130/, /Gold 6142/, /Gold 6154/, /Gold 6248/, /Gold 6254/, /Gold 6240L/ return 32 -- GitLab From 341d4324eec8b4080014e3ed51826a0c24fef605 Mon Sep 17 00:00:00 2001 From: Noah Mandler <noah.mandler@inria.fr> Date: Wed, 5 Feb 2025 10:43:03 +0100 Subject: [PATCH 2/7] [rennes][abacus28] Reference Repository minimal configuration -- GitLab From 601b814873a0e6dcd97ed8cf1fc2a93b1d0128b2 Mon Sep 17 00:00:00 2001 From: Noah Mandler <noah.mandler@inria.fr> Date: Thu, 6 Feb 2025 10:50:34 +0100 Subject: [PATCH 3/7] [rennes][abacus28] Add disk path --- .../sites/rennes/clusters/abacus28/nodes/abacus28-1.json | 4 ++-- input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml | 6 +++--- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json b/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json index 88d00ed3037..8f62a003731 100644 --- a/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json +++ b/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json @@ -105,9 +105,9 @@ "storage_devices": [ { "by_id": "", - "by_path": "/dev/disk/by-path/dummy", + "by_path": "/dev/disk/by-path/pci-0000:04:00.0-ata-1", "id": "disk0", - "interface": "SAS", + "interface": "SATA", "model": "unknown", "size": 8, "storage": "SSD", diff --git a/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml b/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml index 304433af955..eaa4a9917a3 100644 --- a/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml +++ b/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml @@ -32,10 +32,10 @@ nodes: storage_devices: disk0: # This field will have to be renamed later. id: disk0 - interface: SAS - by_path: "/dev/disk/by-path/dummy" # this path will have to change later. + interface: SATA + by_path: "/dev/disk/by-path/pci-0000:04:00.0-ata-1" software: standard-environment: debian11-x64-std management_tools: bmc_vendor_tool: racadm - nodeset: abacus28 \ No newline at end of file + nodeset: abacus28 -- GitLab From 1edc9a1f457b22bfeb53b34efc02695750485e71 Mon Sep 17 00:00:00 2001 From: Noah Mandler <noah.mandler@inria.fr> Date: Mon, 10 Feb 2025 13:20:19 +0100 Subject: [PATCH 4/7] [rennes][abacus28] Add predictable network interfaces mapping --- lib/refrepo/net_names_mapping.yaml | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/lib/refrepo/net_names_mapping.yaml b/lib/refrepo/net_names_mapping.yaml index 0910400d214..db8b2050879 100644 --- a/lib/refrepo/net_names_mapping.yaml +++ b/lib/refrepo/net_names_mapping.yaml @@ -80,6 +80,11 @@ abacus26: abacus27: enp1s0f0np0: eth0 ens22f1np1: eth1 +abacus28: + enp5s0f0: eth0 + enp1s0f0: eth1 + enp1s0f1: eth2 + enp5s0f1: eth3 chetemi: eno1: eth0 eno2: eth1 -- GitLab From 55d613d5c7ef2f58af565f687b79b65eb53a1e24 Mon Sep 17 00:00:00 2001 From: Noah Mandler <noah.mandler@inria.fr> Date: Thu, 13 Feb 2025 09:12:21 +0100 Subject: [PATCH 5/7] [rennes][abacus28] Change net name mapping --- .../sites/rennes/clusters/abacus28/nodes.yaml.erb | 2 +- lib/refrepo/net_names_mapping.yaml | 8 ++++---- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb b/input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb index eb14a7c9bec..fb7083205e0 100644 --- a/input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb +++ b/input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb @@ -67,7 +67,7 @@ nodes: interface: Ethernet management: false driver: mlx_core - name: enp1s0f0np0 + name: eno1 rate: 10000000000 mac: <%= mac_eth0_list[i - 1] %> storage_devices: diff --git a/lib/refrepo/net_names_mapping.yaml b/lib/refrepo/net_names_mapping.yaml index db8b2050879..cd6714357d9 100644 --- a/lib/refrepo/net_names_mapping.yaml +++ b/lib/refrepo/net_names_mapping.yaml @@ -81,10 +81,10 @@ abacus27: enp1s0f0np0: eth0 ens22f1np1: eth1 abacus28: - enp5s0f0: eth0 - enp1s0f0: eth1 - enp1s0f1: eth2 - enp5s0f1: eth3 + eno1: eth0 + eno2: eth3 + eno3: eth1 + eno4: eth2 chetemi: eno1: eth0 eno2: eth1 -- GitLab From 2bdfced6d63b7d21b57e3da73d4c32a5ebb6c78e Mon Sep 17 00:00:00 2001 From: Noah Mandler <noah.mandler@inria.fr> Date: Thu, 13 Feb 2025 09:39:36 +0100 Subject: [PATCH 6/7] [rennes][abacus28] Generate data with new interface name --- .../sites/rennes/clusters/abacus28/nodes/abacus28-1.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json b/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json index 8f62a003731..710bc341d03 100644 --- a/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json +++ b/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json @@ -48,7 +48,7 @@ "management": false, "mountable": true, "mounted": true, - "name": "enp1s0f0np0", + "name": "eno1", "network_address": "abacus28-1.rennes.grid5000.fr", "rate": 10000000000, "switch": null, -- GitLab From b6081c834990af81eec1ef4d18d45c7e9604ec67 Mon Sep 17 00:00:00 2001 From: Noah Mandler <noah.mandler@inria.fr> Date: Thu, 13 Feb 2025 10:30:34 +0100 Subject: [PATCH 7/7] [rennes][abacus28] Generate reference api --- .../rennes/clusters/abacus28/abacus28.json | 4 +- .../clusters/abacus28/nodes/abacus28-1.json | 246 +++++++++++++++--- input/grid5000/dell-product-data.yaml | 6 + input/grid5000/disks.yaml | 1 + .../rennes/clusters/abacus28/abacus28.yaml | 18 +- .../rennes/clusters/abacus28/nodes.yaml.erb | 78 ------ .../clusters/abacus28/nodes/abacus28-1.yaml | 170 ++++++++++++ 7 files changed, 407 insertions(+), 116 deletions(-) delete mode 100644 input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb create mode 100644 input/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.yaml diff --git a/data/grid5000/sites/rennes/clusters/abacus28/abacus28.json b/data/grid5000/sites/rennes/clusters/abacus28/abacus28.json index 1d5acad21ac..1757a3c94bf 100644 --- a/data/grid5000/sites/rennes/clusters/abacus28/abacus28.json +++ b/data/grid5000/sites/rennes/clusters/abacus28/abacus28.json @@ -3,12 +3,12 @@ "created_at": "Wed, 05 Feb 2025 00:00:00 GMT", "exotic": false, "kavlan": false, - "manufactured_at": "2024-12-06", + "manufactured_at": "2020-12-05", "metrics": [ ], "model": "Dell PowerEdge C4140", - "priority": 202412, + "priority": 202112, "queues": [ "admin", "testing" diff --git a/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json b/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json index 710bc341d03..c131500295b 100644 --- a/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json +++ b/data/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.json @@ -1,26 +1,97 @@ { "architecture": { - "cpu_core_numbering": "contiguous", - "nb_cores": 72, - "nb_procs": 1, - "nb_threads": 72, + "cpu_core_numbering": "round-robin", + "nb_cores": 32, + "nb_procs": 2, + "nb_threads": 64, "platform_type": "x86_64" }, "bios": { - "release_date": "01/01/2000", - "vendor": "Unknown", - "version": 1 + "release_date": "08/27/2020", + "vendor": "Dell Inc.", + "version": "2.8.2" }, - "bmc_version": "v1", + "bmc_version": "4.20.20.20", "chassis": { - "manufactured_at": "2024-12-06", - "manufacturer": "Unknown", - "name": "Unknown", + "manufactured_at": "2020-12-05", + "manufacturer": "Dell Inc.", + "name": "PowerEdge C4140", + "serial": "JYLR393", "warranty_end": "2027-12-06" }, "exotic": false, + "gpu_devices": { + "nvidia0": { + "compute_capability": "7.0", + "cores": 5120, + "cpu_affinity": 0, + "device": "/dev/nvidia0", + "memory": 34359738368, + "microarchitecture": "Volta", + "model": "Tesla V100-SXM2-32GB", + "performance": { + "fp-16": 28260000000000, + "fp-32": 14130000000000, + "fp-64": 7066000000000 + }, + "power_default_limit": "300.00 W", + "vbios_version": "88.00.80.00.01", + "vendor": "Nvidia" + }, + "nvidia1": { + "compute_capability": "7.0", + "cores": 5120, + "cpu_affinity": 0, + "device": "/dev/nvidia1", + "memory": 34359738368, + "microarchitecture": "Volta", + "model": "Tesla V100-SXM2-32GB", + "performance": { + "fp-16": 28260000000000, + "fp-32": 14130000000000, + "fp-64": 7066000000000 + }, + "power_default_limit": "300.00 W", + "vbios_version": "88.00.80.00.01", + "vendor": "Nvidia" + }, + "nvidia2": { + "compute_capability": "7.0", + "cores": 5120, + "cpu_affinity": 1, + "device": "/dev/nvidia2", + "memory": 34359738368, + "microarchitecture": "Volta", + "model": "Tesla V100-SXM2-32GB", + "performance": { + "fp-16": 28260000000000, + "fp-32": 14130000000000, + "fp-64": 7066000000000 + }, + "power_default_limit": "300.00 W", + "vbios_version": "88.00.80.00.01", + "vendor": "Nvidia" + }, + "nvidia3": { + "compute_capability": "7.0", + "cores": 5120, + "cpu_affinity": 1, + "device": "/dev/nvidia3", + "memory": 34359738368, + "microarchitecture": "Volta", + "model": "Tesla V100-SXM2-32GB", + "performance": { + "fp-16": 28260000000000, + "fp-32": 14130000000000, + "fp-64": 7066000000000 + }, + "power_default_limit": "300.00 W", + "vbios_version": "88.00.80.00.01", + "vendor": "Nvidia" + } + }, "main_memory": { - "ram_size": 8 + "ram_size": 412316860416 }, "management_tools": { "bmc_vendor_tool": "racadm", @@ -30,29 +101,140 @@ }, "memory_devices": [ { - "device": "dimm_proc 1 dimm 1", - "size": 8, + "device": "dimm_a1", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_a2", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_a3", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_a4", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_a5", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_a6", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_b1", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_b2", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_b3", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_b4", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_b5", + "size": 34359738368, + "technology": "dram" + }, + { + "device": "dimm_b6", + "size": 34359738368, "technology": "dram" } ], "network_adapters": [ { "device": "eth0", - "driver": "mlx_core", + "driver": "i40e", "enabled": true, + "firmware_version": "7.10 0x800075da 19.5.12", "interface": "Ethernet", "ip": "172.16.109.31", "ip6": "2001:660:4406:700:e::1f", "kavlan": false, "mac": "78:ac:44:15:dc:cc", "management": false, + "model": "Ethernet Controller X710 for 10GbE SFP+", "mountable": true, "mounted": true, "name": "eno1", "network_address": "abacus28-1.rennes.grid5000.fr", "rate": 10000000000, + "sriov": false, + "sriov_totalvfs": 0, "switch": null, - "switch_port": null + "switch_port": null, + "vendor": "Intel" + }, + { + "device": "eth1", + "driver": "igb", + "enabled": false, + "firmware_version": "1.67, 0x80000fa8, 19.5.12", + "interface": "Ethernet", + "kavlan": false, + "mac": "78:ac:44:15:dc:ec", + "management": false, + "model": "I350 Gigabit Network Connection", + "mountable": false, + "mounted": false, + "name": "eno3", + "sriov": false, + "sriov_totalvfs": 0, + "vendor": "Intel" + }, + { + "device": "eth2", + "driver": "igb", + "enabled": false, + "firmware_version": "1.67, 0x80000fa8, 19.5.12", + "interface": "Ethernet", + "kavlan": false, + "mac": "78:ac:44:15:dc:ed", + "management": false, + "model": "I350 Gigabit Network Connection", + "mountable": false, + "mounted": false, + "name": "eno4", + "sriov": false, + "sriov_totalvfs": 0, + "vendor": "Intel" + }, + { + "device": "eth3", + "driver": "i40e", + "enabled": false, + "firmware_version": "7.10 0x800075da 19.5.12", + "interface": "Ethernet", + "kavlan": false, + "mac": "78:ac:44:15:dc:ce", + "management": false, + "model": "Ethernet Controller X710 for 10GbE SFP+", + "mountable": false, + "mounted": false, + "name": "eno2", + "sriov": false, + "sriov_totalvfs": 0, + "vendor": "Intel" }, { "device": "bmc", @@ -69,28 +251,28 @@ ], "nodeset": "abacus28", "operating_system": { - "cstate_driver": "unknown", - "cstate_governor": "unknown", + "cstate_driver": "intel_idle", + "cstate_governor": "menu", "ht_enabled": true, - "pstate_driver": "unknwon", - "pstate_governor": "unknown", + "pstate_driver": "intel_cpufreq", + "pstate_governor": "performance", "turboboost_enabled": true }, "performance": { "core_flops": 33600000000, - "node_flops": 2419200000000 + "node_flops": 1075200000000 }, "processor": { "cache_l1": null, - "cache_l1d": 8, - "cache_l1i": 8, - "cache_l2": 8, - "cache_l3": 8, + "cache_l1d": 32768, + "cache_l1i": 32768, + "cache_l2": 1048576, + "cache_l3": 23068672, "clock_speed": 2100000000, "ht_capable": true, "instruction_set": "x86-64", "microarchitecture": "Cascade Lake-SP", - "microcode": "0xd000001", + "microcode": "0x5003707", "model": "Intel Xeon", "other_description": "Intel(R) Xeon(R) Silver 4216 CPU @ 2.10GHz", "vendor": "Intel", @@ -104,14 +286,15 @@ }, "storage_devices": [ { - "by_id": "", + "by_id": "/dev/disk/by-id/wwn-0x500a075129665976", "by_path": "/dev/disk/by-path/pci-0000:04:00.0-ata-1", + "firmware_version": "D3DJ004", "id": "disk0", "interface": "SATA", - "model": "unknown", - "size": 8, + "model": "MTFDDAV480TDS", + "size": 480103981056, "storage": "SSD", - "vendor": "Unknown" + "vendor": "Micron" } ], "supported_job_types": { @@ -121,7 +304,8 @@ "queues": [ "admin", "testing" - ] + ], + "virtual": "ivt" }, "type": "node", "uid": "abacus28-1" diff --git a/input/grid5000/dell-product-data.yaml b/input/grid5000/dell-product-data.yaml index ac0842f50d2..9c8e034e97a 100644 --- a/input/grid5000/dell-product-data.yaml +++ b/input/grid5000/dell-product-data.yaml @@ -1816,6 +1816,12 @@ sites: chassis: manufactured_at: 2021-08-02 warranty_end: 2028-08-04 + abacus28: + nodes: + abacus28-1: + chassis: + manufactured_at: 2020-12-05 + warranty_end: 2027-12-06 abacus3: nodes: abacus3-1: diff --git a/input/grid5000/disks.yaml b/input/grid5000/disks.yaml index a516e21bb9e..041dfdf90b1 100644 --- a/input/grid5000/disks.yaml +++ b/input/grid5000/disks.yaml @@ -107,6 +107,7 @@ disk_vendor_model_mapping: - MTFDDAK960TDT - MTFDDAV240TCB - MTFDDAV240TDU + - MTFDDAV480TDS Samsung: - MZ7KM240HMHQ0D3 - MZ7KH1T9HAJR0D3 diff --git a/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml b/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml index eaa4a9917a3..06be0177595 100644 --- a/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml +++ b/input/grid5000/sites/rennes/clusters/abacus28/abacus28.yaml @@ -9,9 +9,6 @@ queues: - testing nodes: abacus28-1: - chassis: - manufactured_at: 2024-12-06 - warranty_end: 2027-12-06 supported_job_types: deploy: true besteffort: true @@ -29,11 +26,22 @@ nodes: enabled: true mountable: true mounted: true + eth1: + enabled: false + mountable: false + mounted: false + eth2: + enabled: false + mountable: false + mounted: false + eth3: + enabled: false + mountable: false + mounted: false storage_devices: - disk0: # This field will have to be renamed later. + pci-0000:04:00.0-ata-1: id: disk0 interface: SATA - by_path: "/dev/disk/by-path/pci-0000:04:00.0-ata-1" software: standard-environment: debian11-x64-std management_tools: diff --git a/input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb b/input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb deleted file mode 100644 index fb7083205e0..00000000000 --- a/input/grid5000/sites/rennes/clusters/abacus28/nodes.yaml.erb +++ /dev/null @@ -1,78 +0,0 @@ -<% - cluster_name = "abacus28" - nodes_number = 1 - # MAC addresses declaration - mac_eth0_list = %w( - 78:ac:44:15:dc:cc - ) - - mac_bmc_list = %w( - 70:b5:e8:e3:e0:d8 - ) -%> ---- -nodes: -<% (1..nodes_number).each { |i| %> - <%= cluster_name %>-<%= i %>: - architecture: - nb_procs: 1 - nb_cores: 72 - nb_threads: 72 - platform_type: x86_64 - cpu_core_numbering: contiguous - bios: - release_date: 01/01/2000 # Fake date, will be replaced by g5k-checks - vendor: Unknown # Fake vendor, will be replaced by g5k-checks - version: 1 # Fake version, will be replaced by g5k-checks - bmc_version: v1 # Fake version, will be replaced by g5k-checks - chassis: - manufacturer: Unknown # Fake manufacturer, will be replaced by g5k-checks - name: Unknown # Fake name, will be replaced by g5k-checks - main_memory: - ram_size: 8 # Fake size, will be replaced by g5k-checks - memory_devices: - dimm: - size: 8 # Fake size, will be replaced by g5k-checks - technology: dram # Common memory technology, will be replaced by g5k-checks - processor: - model: Intel Xeon - other_description: Intel(R) Xeon(R) Silver 4216 CPU @ 2.10GHz - vendor: Intel - version: Silver 4216 - cache_l1d: 8 # Fake cache, will be replaced by g5k-checks - cache_l1i: 8 # Fake cache, will be replaced by g5k-checks - cache_l2: 8 # Fake cache, will be replaced by g5k-checks - cache_l3: 8 # Fake cache, will be replaced by g5k-checks - instruction_set: x86-64 # Common instruction set, will be replaced by g5k-checks - microcode: "0xd000001" # Fake microcode, will be replaced by g5k-checks - ht_capable: true # Default ht capable value, will be replaced by g5k-checks - main_memory: - ram_size: 8 # Fake ram size, will be replaced by g5k-checks - memory_devices: - dimm_proc 1 dimm 1: # Fake dimm name, will be replaced by g5k-checks - size: 8 # Fake dimm size, will be replaced by g5k-checks - technology: dram # Default dimm technology, will be replaced by g5k-checks - operating_system: - cstate_driver: unknown # Fake driver, will be replaced by g5k-checks - cstate_governor: unknown # Fake governor, will be replaced by g5k-checks - ht_enabled: true # common value for hyper threading, will be replaced by g5k-checks - pstate_driver: unknwon # Fake driver, will be replaced by g5k-checks - pstate_governor: unknown # Fake driver, will be replaced by g5k-checks - turboboost_enabled: true # Default value for turboboost, will be replaced by g5k-checks - network_adapters: - bmc: - management: true - mac: <%= mac_bmc_list[i - 1] %> - eth0: - interface: Ethernet - management: false - driver: mlx_core - name: eno1 - rate: 10000000000 - mac: <%= mac_eth0_list[i - 1] %> - storage_devices: - disk0: - storage: SSD # Common value, will be replaced by g5k-checks - model: unknown # fake value, - size: 8 # Fake value, will be replaced by g5k-checks -<% } %> diff --git a/input/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.yaml b/input/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.yaml new file mode 100644 index 00000000000..480e3bad57e --- /dev/null +++ b/input/grid5000/sites/rennes/clusters/abacus28/nodes/abacus28-1.yaml @@ -0,0 +1,170 @@ +# Generated by g5k-checks (g5k-checks -m api) +--- +abacus28-1: + architecture: + cpu_core_numbering: round-robin + nb_cores: 32 + nb_procs: 2 + nb_threads: 64 + platform_type: x86_64 + bios: + release_date: '08/27/2020' + vendor: Dell Inc. + version: 2.8.2 + bmc_version: 4.20.20.20 + chassis: + manufacturer: Dell Inc. + name: PowerEdge C4140 + serial: JYLR393 + gpu_devices: + nvidia0: + cpu_affinity: 0 + device: "/dev/nvidia0" + memory: 34359738368 + model: Tesla V100-SXM2-32GB + power_default_limit: 300.00 W + vbios_version: 88.00.80.00.01 + vendor: Nvidia + nvidia1: + cpu_affinity: 0 + device: "/dev/nvidia1" + memory: 34359738368 + model: Tesla V100-SXM2-32GB + power_default_limit: 300.00 W + vbios_version: 88.00.80.00.01 + vendor: Nvidia + nvidia2: + cpu_affinity: 1 + device: "/dev/nvidia2" + memory: 34359738368 + model: Tesla V100-SXM2-32GB + power_default_limit: 300.00 W + vbios_version: 88.00.80.00.01 + vendor: Nvidia + nvidia3: + cpu_affinity: 1 + device: "/dev/nvidia3" + memory: 34359738368 + model: Tesla V100-SXM2-32GB + power_default_limit: 300.00 W + vbios_version: 88.00.80.00.01 + vendor: Nvidia + main_memory: + ram_size: 412316860416 + memory_devices: + dimm_a1: + size: 34359738368 + technology: dram + dimm_a2: + size: 34359738368 + technology: dram + dimm_a3: + size: 34359738368 + technology: dram + dimm_a4: + size: 34359738368 + technology: dram + dimm_a5: + size: 34359738368 + technology: dram + dimm_a6: + size: 34359738368 + technology: dram + dimm_b1: + size: 34359738368 + technology: dram + dimm_b2: + size: 34359738368 + technology: dram + dimm_b3: + size: 34359738368 + technology: dram + dimm_b4: + size: 34359738368 + technology: dram + dimm_b5: + size: 34359738368 + technology: dram + dimm_b6: + size: 34359738368 + technology: dram + network_adapters: + bmc: + ip: 172.17.109.31 + mac: 70:b5:e8:e3:e0:d8 + management: true + eth0: + driver: i40e + firmware_version: 7.10 0x800075da 19.5.12 + interface: Ethernet + ip: 172.16.109.31 + mac: 78:ac:44:15:dc:cc + management: false + model: Ethernet Controller X710 for 10GbE SFP+ + name: eno1 + rate: 10000000000 + sriov: false + sriov_totalvfs: 0 + vendor: Intel + eth1: + driver: igb + firmware_version: 1.67, 0x80000fa8, 19.5.12 + interface: Ethernet + mac: 78:ac:44:15:dc:ec + management: false + model: I350 Gigabit Network Connection + name: eno3 + sriov: false + sriov_totalvfs: 0 + vendor: Intel + eth2: + driver: igb + firmware_version: 1.67, 0x80000fa8, 19.5.12 + interface: Ethernet + mac: 78:ac:44:15:dc:ed + management: false + model: I350 Gigabit Network Connection + name: eno4 + sriov: false + sriov_totalvfs: 0 + vendor: Intel + eth3: + driver: i40e + firmware_version: 7.10 0x800075da 19.5.12 + interface: Ethernet + mac: 78:ac:44:15:dc:ce + management: false + model: Ethernet Controller X710 for 10GbE SFP+ + name: eno2 + sriov: false + sriov_totalvfs: 0 + vendor: Intel + operating_system: + cstate_driver: intel_idle + cstate_governor: menu + ht_enabled: true + pstate_driver: intel_cpufreq + pstate_governor: performance + turboboost_enabled: true + processor: + cache_l1d: 32768 + cache_l1i: 32768 + cache_l2: 1048576 + cache_l3: 23068672 + ht_capable: true + instruction_set: x86-64 + microcode: '0x5003707' + model: Intel Xeon + other_description: Intel(R) Xeon(R) Silver 4216 CPU @ 2.10GHz + vendor: Intel + version: Silver 4216 + storage_devices: + pci-0000:04:00.0-ata-1: + by_id: "/dev/disk/by-id/wwn-0x500a075129665976" + by_path: "/dev/disk/by-path/pci-0000:04:00.0-ata-1" + firmware_version: D3DJ004 + model: MTFDDAV480TDS + size: 480103981056 + storage: SSD + supported_job_types: + virtual: ivt -- GitLab