fix: available GPU models should be filtered by VO

ai4os · IgnacioHeredia · Aug 5, 2024 · Nov 23, 2023 · Nov 23, 2023 · Nov 23, 2023
commit dae82d2c29b5c740a9842f217f8e62fb53c6a5d3
diff --git a/ai4papi/nomad/common.py b/ai4papi/nomad/common.py
@@ -17,6 +17,7 @@
 from nomad.api import exceptions
 import requests
 
+import ai4papi.conf as papiconf
 import ai4papi.nomad.patches as nomad_patches
 
 
@@ -367,13 +368,19 @@ def delete_deployment(
     return {'status': 'success'}
 
 
-def get_gpu_models():
+@cached(cache=TTLCache(maxsize=1024, ttl=1*60*60))
+def get_gpu_models(vo):
     """
-    Retrieve available GPU models in the cluster.
+    Retrieve available GPU models in the cluster, filtering nodes by VO.
     """
     gpu_models = set()
     nodes = Nomad.nodes.get_nodes(resources=True)
     for node in nodes:
+        # Discard nodes that don't belong to the requested VO
+        meta = Nomad.node.get_node(node['ID'])['Meta']
+        if papiconf.MAIN_CONF['nomad']['namespaces'][vo] not in meta['namespace']:
+            continue
+
         # Discard GPU models of nodes that are not eligible
         if node['SchedulingEligibility'] != 'eligible':
             continue

diff --git a/ai4papi/routers/v1/catalog/modules.py b/ai4papi/routers/v1/catalog/modules.py
@@ -73,7 +73,7 @@ def get_config(
     )
 
     # Fill with available GPU models in the cluster
-    models = nomad.common.get_gpu_models()
+    models = nomad.common.get_gpu_models(vo)
     if models:
         conf["hardware"]["gpu_type"]["options"] += models