Mentions légales du service

Skip to content
Snippets Groups Projects
Commit 6bdf177e authored by PAULIN Nathan
Browse files

Merge branch 'testing-esterel24' into 'master'

[sophia][esterel24] add esterel24 to testing queue

See merge request !1175
parents 8ab65936 6586704a
No related branches found
No related tags found
1 merge request: !1175 [sophia][esterel24] add esterel24 to testing queue
Pipeline #1150564 passed
Pipeline: Resources Explorer

#1150566

    Showing
    with 709 additions and 1 deletion
    {
    "boot_type": "bios",
    "created_at": "Thu, 27 Mar 2025 00:00:00 GMT",
    "exotic": false,
    "kavlan": false,
    "manufactured_at": "2020-09-27",
    "metrics": [
    {
    "description": "Default subset of metrics from Prometheus Node Exporter",
    "name": "prom_default_metrics",
    "optional_period": 15000,
    "period": 0,
    "source": {
    "id": [
    "node_boot_time_seconds",
    "node_cpu_scaling_frequency_hertz",
    "node_cpu_seconds_total",
    "node_filesystem_free_bytes",
    "node_filesystem_size_bytes",
    "node_load1",
    "node_load15",
    "node_load5",
    "node_memory_Buffers_bytes",
    "node_memory_Cached_bytes",
    "node_memory_MemAvailable_bytes",
    "node_memory_MemFree_bytes",
    "node_memory_MemTotal_bytes",
    "node_memory_Shmem_bytes",
    "node_memory_SwapFree_bytes",
    "node_memory_SwapTotal_bytes",
    "node_network_receive_bytes_total",
    "node_network_receive_packets_total",
    "node_network_transmit_bytes_total",
    "node_network_transmit_packets_total",
    "node_procs_blocked",
    "node_procs_running",
    "kwollect_custom"
    ],
    "port": 9100,
    "protocol": "prometheus"
    }
    },
    {
    "description": "All metrics from Prometheus Node Exporter",
    "name": "prom_all_metrics",
    "optional_period": 15000,
    "period": 0,
    "source": {
    "port": 9100,
    "protocol": "prometheus"
    }
    },
    {
    "description": "Default subset of metrics from Prometheus Nvidia DCGM Exporter",
    "name": "prom_nvgpu_default_metrics",
    "optional_period": 15000,
    "period": 0,
    "source": {
    "id": [
    "DCGM_FI_DEV_SM_CLOCK",
    "DCGM_FI_DEV_MEM_CLOCK",
    "DCGM_FI_DEV_GPU_TEMP",
    "DCGM_FI_DEV_POWER_USAGE",
    "DCGM_FI_DEV_MEM_COPY_UTIL"
    ],
    "port": 9400,
    "protocol": "prometheus"
    }
    },
    {
    "description": "All metrics from Prometheus Nvidia DCGM Exporter",
    "name": "prom_nvgpu_all_metrics",
    "optional_period": 15000,
    "period": 0,
    "source": {
    "port": 9400,
    "protocol": "prometheus"
    }
    }
    ],
    "model": "Dell PowerEdge T640",
    "nodes_count": 1,
    "nodes_description": "2 CPUs Intel Xeon Gold 6240R, 24 cores/CPU, 4 GPUs Quadro RTX 8000, 384GB RAM, 558GB HDD, 4468GB HDD, 1 x 1Gb Ethernet, 1 x 40Gb InfiniBand",
    "priority": 202109,
    "queues": [
    "admin",
    "testing"
    ],
    "redfish": true,
    "type": "cluster",
    "uid": "esterel24",
    "warranty_end": "2027-09-29"
    }
    \ No newline at end of file
    {
    "architecture": {
    "cpu_core_numbering": "round-robin",
    "nb_cores": 48,
    "nb_procs": 2,
    "nb_threads": 96,
    "platform_type": "x86_64"
    },
    "bios": {
    "release_date": "01/09/2025",
    "vendor": "Dell Inc.",
    "version": "2.23.0"
    },
    "bmc_version": "7.00.00.181",
    "chassis": {
    "manufactured_at": "2020-09-27",
    "manufacturer": "Dell Inc.",
    "name": "PowerEdge T640",
    "serial": "F51GY63",
    "warranty_end": "2027-09-29"
    },
    "exotic": false,
    "gpu_devices": {
    "nvidia0": {
    "compute_capability": "7.5",
    "cores": 4608,
    "cpu_affinity": 0,
    "device": "/dev/nvidia0",
    "memory": 48318382080,
    "microarchitecture": "Turing",
    "model": "Quadro RTX 8000",
    "performance": {
    "fp-16": 32620000000000,
    "fp-32": 16310000000000,
    "fp-64": 510000000000
    },
    "power_default_limit": "250.00 W",
    "vbios_version": "90.02.4E.00.03",
    "vendor": "Nvidia"
    },
    "nvidia1": {
    "compute_capability": "7.5",
    "cores": 4608,
    "cpu_affinity": 0,
    "device": "/dev/nvidia1",
    "memory": 48318382080,
    "microarchitecture": "Turing",
    "model": "Quadro RTX 8000",
    "performance": {
    "fp-16": 32620000000000,
    "fp-32": 16310000000000,
    "fp-64": 510000000000
    },
    "power_default_limit": "250.00 W",
    "vbios_version": "90.02.4E.00.03",
    "vendor": "Nvidia"
    },
    "nvidia2": {
    "compute_capability": "7.5",
    "cores": 4608,
    "cpu_affinity": 1,
    "device": "/dev/nvidia2",
    "memory": 48318382080,
    "microarchitecture": "Turing",
    "model": "Quadro RTX 8000",
    "performance": {
    "fp-16": 32620000000000,
    "fp-32": 16310000000000,
    "fp-64": 510000000000
    },
    "power_default_limit": "250.00 W",
    "vbios_version": "90.02.4E.00.03",
    "vendor": "Nvidia"
    },
    "nvidia3": {
    "compute_capability": "7.5",
    "cores": 4608,
    "cpu_affinity": 1,
    "device": "/dev/nvidia3",
    "memory": 48318382080,
    "microarchitecture": "Turing",
    "model": "Quadro RTX 8000",
    "performance": {
    "fp-16": 32620000000000,
    "fp-32": 16310000000000,
    "fp-64": 510000000000
    },
    "power_default_limit": "250.00 W",
    "vbios_version": "90.02.4E.00.03",
    "vendor": "Nvidia"
    }
    },
    "main_memory": {
    "ram_size": 412316860416
    },
    "management_tools": {
    "bmc_vendor_tool": "racadm",
    "ipmitool": {
    "retries": 5
    }
    },
    "memory_devices": [
    {
    "device": "dimm_a1",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_a2",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_a3",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_a4",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_a5",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_a6",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_b1",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_b2",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_b3",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_b4",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_b5",
    "size": 34359738368,
    "technology": "dram"
    },
    {
    "device": "dimm_b6",
    "size": 34359738368,
    "technology": "dram"
    }
    ],
    "network_adapters": [
    {
    "device": "eth0",
    "driver": "bnxt_en",
    "enabled": true,
    "firmware_version": "218.0.219.13/pkg 21.85.21.92",
    "interface": "Ethernet",
    "ip": "172.16.131.31",
    "ip6": "2001:660:4406:800:4::1f",
    "kavlan": false,
    "mac": "70:b5:e8:c9:ff:d2",
    "management": false,
    "model": "BCM57416 NetXtreme-E Dual-Media 10G RDMA Ethernet Controller",
    "mountable": true,
    "mounted": true,
    "name": "enp1s0f0np0",
    "network_address": "esterel24-1.sophia.grid5000.fr",
    "rate": 1000000000,
    "sriov": false,
    "sriov_totalvfs": 0,
    "switch": "sw-5",
    "switch_port": "1/1/1",
    "vendor": "Broadcom Inc. and subsidiaries"
    },
    {
    "device": "eth1",
    "driver": "bnxt_en",
    "enabled": false,
    "firmware_version": "218.0.219.13/pkg 21.85.21.92",
    "interface": "Ethernet",
    "kavlan": false,
    "mac": "70:b5:e8:c9:ff:d3",
    "management": false,
    "model": "BCM57416 NetXtreme-E Dual-Media 10G RDMA Ethernet Controller",
    "mountable": false,
    "mounted": false,
    "name": "eno2np1",
    "sriov": false,
    "sriov_totalvfs": 0,
    "vendor": "Broadcom Inc. and subsidiaries"
    },
    {
    "device": "ib0",
    "driver": "mlx4_core",
    "enabled": true,
    "firmware_version": "2.7.626",
    "guid": "0x0002c903000ceab3",
    "interface": "InfiniBand",
    "ip": "172.18.131.31",
    "kavlan": false,
    "mac": "00:02:c9:03:00:0c:ea:b3",
    "management": false,
    "model": "MT25408A0-FCC-QI ConnectX, Dual Port 40Gb/s InfiniBand / 10GigE Adapter IC with PCIe 2.0 x8 5.0GT/s Interface",
    "mountable": true,
    "mounted": true,
    "name": "ib0",
    "netmask": "255.255.240.0",
    "network_address": "esterel24-1-ib0.sophia.grid5000.fr",
    "rate": 40000000000,
    "vendor": "Mellanox Technologies"
    },
    {
    "device": "bmc",
    "enabled": true,
    "interface": "Ethernet",
    "ip": "172.17.131.31",
    "kavlan": false,
    "mac": "70:b5:e8:c9:ff:e2",
    "management": true,
    "mountable": false,
    "mounted": false,
    "network_address": "esterel24-1-bmc.sophia.grid5000.fr"
    }
    ],
    "nodeset": "esterel24",
    "operating_system": {
    "cstate_driver": "intel_idle",
    "cstate_governor": "menu",
    "ht_enabled": true,
    "pstate_driver": "intel_pstate",
    "pstate_governor": "performance",
    "turboboost_enabled": true
    },
    "performance": {
    "core_flops": 76800000000,
    "node_flops": 3686400000000
    },
    "processor": {
    "cache_l1": null,
    "cache_l1d": 32768,
    "cache_l1i": 32768,
    "cache_l2": 1048576,
    "cache_l3": 37486592,
    "clock_speed": 2400000000,
    "ht_capable": true,
    "instruction_set": "x86-64",
    "microarchitecture": "Cascade Lake-SP",
    "microcode": "0x5003801",
    "model": "Intel Xeon",
    "other_description": "Intel(R) Xeon(R) Gold 6240R CPU @ 2.40GHz",
    "vendor": "Intel",
    "version": "Gold 6240R"
    },
    "redfish": true,
    "software": {
    "forced-deployment-timestamp": 202007300948,
    "postinstall-version": "1.2025032008",
    "standard-environment": "debian11-x64-std"
    },
    "storage_devices": [
    {
    "by_id": "/dev/disk/by-id/wwn-0x62cea7f06670a0002790bcc0151d50db",
    "by_path": "/dev/disk/by-path/pci-0000:19:00.0-scsi-0:2:0:0",
    "firmware_version": 4.3,
    "id": "disk0",
    "interface": "SAS",
    "model": "PERC H730P Adp",
    "size": 599550590976,
    "storage": "HDD",
    "vendor": "Dell"
    },
    {
    "by_id": "/dev/disk/by-id/wwn-0x62cea7f06670a0002790bca813ab564d",
    "by_path": "/dev/disk/by-path/pci-0000:19:00.0-scsi-0:2:63:0",
    "firmware_version": 4.3,
    "id": "disk1",
    "interface": "SATA",
    "model": "PERC H730P Adp",
    "size": 4798283776000,
    "storage": "HDD",
    "vendor": "Dell"
    }
    ],
    "supported_job_types": {
    "besteffort": true,
    "deploy": true,
    "max_walltime": 0,
    "queues": [
    "admin",
    "testing"
    ],
    "virtual": "ivt"
    },
    "type": "node",
    "uid": "esterel24-1"
    }
    \ No newline at end of file
    ......@@ -11,6 +11,10 @@
    {
    },
    {
    "kind": "node",
    "port": "eth0",
    "snmp_name": "1/1/1",
    "uid": "esterel24-1"
    },
    {
    },
    ......
    ......@@ -11,6 +11,9 @@
    {
    },
    {
    "kind": "other",
    "snmp_name": "1/1/1",
    "uid": "esterel24-1-bmc"
    },
    {
    },
    ......
    ......@@ -2256,6 +2256,12 @@ sites:
    chassis:
    manufactured_at: 2016-05-04
    warranty_end: 2021-05-04
    esterel24:
    nodes:
    esterel24-1:
    chassis:
    manufactured_at: 2020-09-27
    warranty_end: 2027-09-29
    esterel26:
    nodes:
    esterel26-1:
    ......
    ......@@ -186,7 +186,8 @@ ipv4:
    sophia esterel21 eth0 0 0 3 26
    sophia esterel22 eth0 0 0 3 27
    sophia esterel23 eth0 0 0 3 28
    sophia esterel24 eth0 0 0 3 29
    sophia esterel24 eth0 0 0 3 30
    sophia esterel24 ib0 0 0 3 30
    sophia esterel25 eth0 0 0 3 31
    sophia esterel26 eth0 0 0 3 32
    sophia esterel26 ib0 0 0 3 32
    ......
    ---
    model: Dell PowerEdge T640
    created_at: 2025-03-27
    kavlan: false
    boot_type: bios
    exotic: false
    queues:
    - admin
    - testing
    nodes:
    esterel24-1:
    supported_job_types:
    deploy: true
    besteffort: true
    max_walltime: 0
    processor:
    microarchitecture: Cascade Lake-SP
    clock_speed: 2_400_000_000
    network_adapters:
    bmc:
    interface: Ethernet
    enabled: true
    mountable: false
    mounted: false
    eth0:
    enabled: true
    mountable: true
    mounted: true
    eth1:
    enabled: false
    mountable: false
    mounted: false
    storage_devices:
    pci-0000:19:00.0-scsi-0:2:0:0:
    id: disk0
    interface: SAS
    pci-0000:19:00.0-scsi-0:2:63:0:
    id: disk1
    interface: SATA
    software:
    standard-environment: debian11-x64-std
    management_tools:
    bmc_vendor_tool: racadm
    nodeset: esterel24
    ---
    nodes:
    esterel24-1:
    network_adapters:
    ib0:
    enabled: true
    mountable: true
    mounted: true
    netmask: 255.255.240.0
    \ No newline at end of file
    ---
    metrics:
    - name: prom_default_metrics
    description: Default subset of metrics from Prometheus Node Exporter
    period: 0
    optional_period: 15000
    source:
    protocol: prometheus
    port: 9100
    id:
    - node_boot_time_seconds
    - node_cpu_scaling_frequency_hertz
    - node_cpu_seconds_total
    - node_filesystem_free_bytes
    - node_filesystem_size_bytes
    - node_load1
    - node_load15
    - node_load5
    - node_memory_Buffers_bytes
    - node_memory_Cached_bytes
    - node_memory_MemAvailable_bytes
    - node_memory_MemFree_bytes
    - node_memory_MemTotal_bytes
    - node_memory_Shmem_bytes
    - node_memory_SwapFree_bytes
    - node_memory_SwapTotal_bytes
    - node_network_receive_bytes_total
    - node_network_receive_packets_total
    - node_network_transmit_bytes_total
    - node_network_transmit_packets_total
    - node_procs_blocked
    - node_procs_running
    - kwollect_custom
    - name: prom_all_metrics
    description: All metrics from Prometheus Node Exporter
    period: 0
    optional_period: 15000
    source:
    protocol: prometheus
    port: 9100
    - name: prom_nvgpu_default_metrics
    description: Default subset of metrics from Prometheus Nvidia DCGM Exporter
    period: 0
    optional_period: 15000
    source:
    protocol: prometheus
    port: 9400
    id:
    - DCGM_FI_DEV_SM_CLOCK
    - DCGM_FI_DEV_MEM_CLOCK
    - DCGM_FI_DEV_GPU_TEMP
    - DCGM_FI_DEV_POWER_USAGE
    - DCGM_FI_DEV_MEM_COPY_UTIL
    - name: prom_nvgpu_all_metrics
    description: All metrics from Prometheus Nvidia DCGM Exporter
    period: 0
    optional_period: 15000
    source:
    protocol: prometheus
    port: 9400
    \ No newline at end of file
    # Generated by g5k-checks (g5k-checks -m api)
    ---
    esterel24-1:
    architecture:
    cpu_core_numbering: round-robin
    nb_cores: 48
    nb_procs: 2
    nb_threads: 96
    platform_type: x86_64
    bios:
    release_date: 01/09/2025
    vendor: Dell Inc.
    version: 2.23.0
    bmc_version: 7.00.00.181
    chassis:
    manufacturer: Dell Inc.
    name: PowerEdge T640
    serial: F51GY63
    gpu_devices:
    nvidia0:
    cpu_affinity: 0
    device: "/dev/nvidia0"
    memory: 48318382080
    model: Quadro RTX 8000
    power_default_limit: 250.00 W
    vbios_version: 90.02.4E.00.03
    vendor: Nvidia
    nvidia1:
    cpu_affinity: 0
    device: "/dev/nvidia1"
    memory: 48318382080
    model: Quadro RTX 8000
    power_default_limit: 250.00 W
    vbios_version: 90.02.4E.00.03
    vendor: Nvidia
    nvidia2:
    cpu_affinity: 1
    device: "/dev/nvidia2"
    memory: 48318382080
    model: Quadro RTX 8000
    power_default_limit: 250.00 W
    vbios_version: 90.02.4E.00.03
    vendor: Nvidia
    nvidia3:
    cpu_affinity: 1
    device: "/dev/nvidia3"
    memory: 48318382080
    model: Quadro RTX 8000
    power_default_limit: 250.00 W
    vbios_version: 90.02.4E.00.03
    vendor: Nvidia
    main_memory:
    ram_size: 412316860416
    memory_devices:
    dimm_a1:
    size: 34359738368
    technology: dram
    dimm_a2:
    size: 34359738368
    technology: dram
    dimm_a3:
    size: 34359738368
    technology: dram
    dimm_a4:
    size: 34359738368
    technology: dram
    dimm_a5:
    size: 34359738368
    technology: dram
    dimm_a6:
    size: 34359738368
    technology: dram
    dimm_b1:
    size: 34359738368
    technology: dram
    dimm_b2:
    size: 34359738368
    technology: dram
    dimm_b3:
    size: 34359738368
    technology: dram
    dimm_b4:
    size: 34359738368
    technology: dram
    dimm_b5:
    size: 34359738368
    technology: dram
    dimm_b6:
    size: 34359738368
    technology: dram
    network_adapters:
    bmc:
    ip: 172.17.131.31
    mac: 70:b5:e8:c9:ff:e2
    management: true
    eth0:
    driver: bnxt_en
    firmware_version: 218.0.219.13/pkg 21.85.21.92
    interface: Ethernet
    ip: 172.16.131.31
    mac: 70:b5:e8:c9:ff:d2
    management: false
    model: BCM57416 NetXtreme-E Dual-Media 10G RDMA Ethernet Controller
    name: enp1s0f0np0
    rate: 1000000000
    sriov: false
    sriov_totalvfs: 0
    vendor: Broadcom Inc. and subsidiaries
    eth1:
    driver: bnxt_en
    firmware_version: 218.0.219.13/pkg 21.85.21.92
    interface: Ethernet
    mac: 70:b5:e8:c9:ff:d3
    management: false
    model: BCM57416 NetXtreme-E Dual-Media 10G RDMA Ethernet Controller
    name: eno2np1
    sriov: false
    sriov_totalvfs: 0
    vendor: Broadcom Inc. and subsidiaries
    ib0:
    driver: mlx4_core
    firmware_version: 2.7.626
    guid: '0x0002c903000ceab3'
    interface: InfiniBand
    ip: 172.18.131.31
    mac: 00:02:c9:03:00:0c:ea:b3
    management: false
    model: MT25408A0-FCC-QI ConnectX, Dual Port 40Gb/s InfiniBand / 10GigE Adapter
    IC with PCIe 2.0 x8 5.0GT/s Interface
    name: ib0
    rate: 40000000000
    vendor: Mellanox Technologies
    operating_system:
    cstate_driver: intel_idle
    cstate_governor: menu
    ht_enabled: true
    pstate_driver: intel_pstate
    pstate_governor: performance
    turboboost_enabled: true
    processor:
    cache_l1d: 32768
    cache_l1i: 32768
    cache_l2: 1048576
    cache_l3: 37486592
    ht_capable: true
    instruction_set: x86-64
    microcode: '0x5003801'
    model: Intel Xeon
    other_description: Intel(R) Xeon(R) Gold 6240R CPU @ 2.40GHz
    vendor: Intel
    version: Gold 6240R
    storage_devices:
    pci-0000:19:00.0-scsi-0:2:0:0:
    by_id: "/dev/disk/by-id/wwn-0x62cea7f06670a0002790bcc0151d50db"
    by_path: "/dev/disk/by-path/pci-0000:19:00.0-scsi-0:2:0:0"
    firmware_version: 4.3
    model: PERC H730P Adp
    size: 599550590976
    storage: HDD
    pci-0000:19:00.0-scsi-0:2:63:0:
    by_id: "/dev/disk/by-id/wwn-0x62cea7f06670a0002790bca813ab564d"
    by_path: "/dev/disk/by-path/pci-0000:19:00.0-scsi-0:2:63:0"
    firmware_version: 4.3
    model: PERC H730P Adp
    size: 4798283776000
    storage: HDD
    supported_job_types:
    virtual: ivt
    ......@@ -14,6 +14,8 @@ sw-5:
    rate: 1000000000
    kind: node
    ports:
    1:
    uid: esterel24-1
    25:
    uid: gw
    kind: router
    ......
    ......@@ -14,6 +14,9 @@ swadmin-5:
    rate: 1000000000
    kind: node
    ports:
    1:
    uid: esterel24-1-bmc
    kind: other
    25:
    uid: sw-5
    kind: switch
    ......
    ......@@ -431,6 +431,10 @@ esterel10:
    enp1s0f0: eth0
    enp1s0f1: eth1
    ibp130s0: ib0
    esterel24:
    enp1s0f0np0: eth0
    eno2np1: eth1
    ibp137s0: ib0
    esterel26:
    enp1s0f0np0: eth0
    eno2np1: eth1
    ......
    0% Loading or .
    You are about to add 0 people to the discussion. Proceed with caution.
    Finish editing this message first!
    Please register or sign in to comment