From 0cb216e4259b29ec61f3d0dda4cd241d5c55bfea Mon Sep 17 00:00:00 2001 From: Bruno Travouillon Date: Mon, 5 Aug 2024 11:26:03 -0400 Subject: [PATCH] L40S does not support FP64 (#27) --- slurm-job-exporter.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/slurm-job-exporter.py b/slurm-job-exporter.py index 0577e71..8c3ee3f 100644 --- a/slurm-job-exporter.py +++ b/slurm-job-exporter.py @@ -161,7 +161,7 @@ def __init__(self, dcgm_update_interval=10): device = pydcgm.dcgm_agent.dcgmGetDeviceAttributes(self.handle.handle, gpu_id) name = device.identifiers.deviceName print('Detected gpu {} with ID {}'.format(name, gpu_id)) - if name in ['NVIDIA RTX A6000', 'NVIDIA L4']: + if name in ['NVIDIA RTX A6000', 'NVIDIA L4', 'NVIDIA L40S']: # This GPU does not supports fp64, we don't support a mix of fp64 and non-fp64 GPUs in the same node print('Removing fp64 metrics since {} does not support fp64'.format(name)) del self.fieldIds_dict[dcgm_fields.DCGM_FI_PROF_PIPE_FP64_ACTIVE]