Conditionally set default TPU settings in __init__.py #5696

Merged · 3 commits · Oct 10, 2023
Changes from 2 commits
1 change: 0 additions & 1 deletion torch_xla/__init__.py
@@ -40,7 +40,6 @@ def _setup_default_env():
  _set_missing_env('GRPC_VERBOSITY', 'ERROR')
  _set_missing_env('ALLOW_MULTIPLE_LIBTPU_LOAD', '1')
  _set_missing_env('TPU_ML_PLATFORM', 'PyTorch/XLA')
- _set_missing_env('TPU_MEGACORE', 'megacore_dense')


_fd, _tmp_fname = -1, ''
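For context, the `_set_missing_env` helper used in this hunk presumably applies a default only when the user has not already exported the variable; a minimal sketch under that assumption:

```python
import os

def _set_missing_env(name: str, value: str) -> None:
    # Assumed behavior: fill in a default, but never override a value
    # the user has already exported in the environment.
    if name not in os.environ:
        os.environ[name] = value
```

So before this change, merely importing torch_xla defaulted TPU_MEGACORE to megacore_dense on every platform unless the user had set it explicitly.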
3 changes: 3 additions & 0 deletions torch_xla/_internal/tpu.py
@@ -266,6 +266,9 @@ def configure_topology(local_rank: int,
  os.environ.setdefault(xenv.TPU_VISIBLE_CHIPS, str(local_rank))
  os.environ.setdefault(xenv.TPU_PROCESS_PORT, str(ports[local_rank]))

+ if version() == 4:
Collaborator:

Is it guaranteed that this will always be called, and that it runs before any modeling code touches the TPU?

Collaborator Author:

Actually, this is only guaranteed to get called when using torchrun or xmp.spawn. Good catch.

It makes the most logical sense to me to set these up during client initialization, but that happens in C++ and all of the TPU utilities are in Python. I'll make this setting conditional in __init__.py for now.

+   os.environ.setdefault(xenv.TPU_MEGACORE, 'megacore_dense')


def discover_master_worker_ip(use_localhost: bool = True) -> str:
"""Find the IP of the TPU host with TPU:0.
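As a rough illustration of the plan described in the reply above (gating the default at import time rather than only in configure_topology), the check might look like the sketch below. The version-detection argument is hypothetical; this two-commit view does not include the follow-up commit the author describes.

```python
import os

def _maybe_set_tpu_megacore(tpu_version: int) -> None:
    # Hypothetical sketch: only v4 TPUs should default to megacore_dense,
    # and an explicit user setting always wins (setdefault semantics).
    if tpu_version == 4:
        os.environ.setdefault('TPU_MEGACORE', 'megacore_dense')
```

At import time, __init__.py would call something like this with whatever TPU-version detection is available to it, which is exactly the wrinkle raised in the thread: client initialization happens in C++, while the TPU utilities live in the Python tpu module.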
1 change: 1 addition & 0 deletions torch_xla/core/xla_env_vars.py
@@ -22,6 +22,7 @@
TPU_PROCESS_ADDRESSES = 'TPU_PROCESS_ADDRESSES'
TPU_VISIBLE_CHIPS = 'TPU_VISIBLE_CHIPS'
TPU_PROCESS_PORT = 'TPU_PROCESS_PORT'
+TPU_MEGACORE = 'TPU_MEGACORE'
PJRT_CPU_ASYNC_CLIENT = 'PJRT_CPU_ASYNC_CLIENT'
PJRT_GPU_ASYNC_CLIENT = 'PJRT_GPU_ASYNC_CLIENT'
PJRT_DIST_SERVICE_ADDR = 'PJRT_DIST_SERVICE_ADDR'