We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 70bd83e commit ef4b74d Copy full SHA for ef4b74d
keras_remote/backend/gke_client.py
@@ -461,6 +461,14 @@ def _check_node_pool_exists_cached(selector_items) -> bool:
461
"cloud.google.com/gke-tpu-topology", ""
462
)
463
464
+ # Infer accelerator count from machine type using registry
465
+ # This is robust because it uses the same source of truth as the Pod spec generation
466
+ for tpu_spec in accelerators.TPUS.values():
467
+ for chips, topo_spec in tpu_spec.topologies.items():
468
+ if topo_spec.machine_type == machine_type:
469
+ pool_labels["cloud.google.com/gke-accelerator-count"] = str(chips)
470
+ break
471
+
472
if all(pool_labels.get(k) == str(v) for k, v in selector.items()):
473
return True
474
return False
0 commit comments