diff --git a/pyproject.toml b/pyproject.toml index 15b8391cdbfcf..91e2eaa8b70d1 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -82,7 +82,6 @@ module = [ "pytorch_lightning.profiler.pytorch", "pytorch_lightning.profiler.simple", "pytorch_lightning.trainer.callback_hook", - "pytorch_lightning.trainer.connectors.accelerator_connector", "pytorch_lightning.trainer.connectors.callback_connector", "pytorch_lightning.trainer.connectors.data_connector", "pytorch_lightning.trainer.data_loading", diff --git a/pytorch_lightning/callbacks/gpu_stats_monitor.py b/pytorch_lightning/callbacks/gpu_stats_monitor.py index 2d10b17acdc95..a871bfa309c96 100644 --- a/pytorch_lightning/callbacks/gpu_stats_monitor.py +++ b/pytorch_lightning/callbacks/gpu_stats_monitor.py @@ -29,7 +29,6 @@ import pytorch_lightning as pl from pytorch_lightning.callbacks.base import Callback -from pytorch_lightning.utilities import _AcceleratorType from pytorch_lightning.utilities.exceptions import MisconfigurationException from pytorch_lightning.utilities.parsing import AttributeDict from pytorch_lightning.utilities.rank_zero import rank_zero_deprecation, rank_zero_only @@ -127,7 +126,7 @@ def setup(self, trainer: "pl.Trainer", pl_module: "pl.LightningModule", stage: O if not trainer.logger: raise MisconfigurationException("Cannot use GPUStatsMonitor callback with Trainer that has no logger.") - if trainer._device_type != _AcceleratorType.GPU: + if trainer.strategy.root_device.type != "cuda": raise MisconfigurationException( "You are using GPUStatsMonitor but are not running on GPU" f" since gpus attribute in Trainer is set to {trainer.gpus}." diff --git a/pytorch_lightning/lite/lite.py b/pytorch_lightning/lite/lite.py index 218decdddd969..117125f29d8db 100644 --- a/pytorch_lightning/lite/lite.py +++ b/pytorch_lightning/lite/lite.py @@ -82,7 +82,7 @@ def __init__( self._check_strategy_support(strategy) gpu_ids, tpu_cores = _parse_devices(gpus=gpus, auto_select_gpus=False, tpu_cores=tpu_cores) self._accelerator_connector = AcceleratorConnector( - num_processes=1, + num_processes=None, devices=devices, tpu_cores=tpu_cores, ipus=None, diff --git a/pytorch_lightning/strategies/bagua.py b/pytorch_lightning/strategies/bagua.py index 3c1520a712ea4..17318331b840d 100644 --- a/pytorch_lightning/strategies/bagua.py +++ b/pytorch_lightning/strategies/bagua.py @@ -13,7 +13,6 @@ from pytorch_lightning.strategies.ddp import DDPStrategy from pytorch_lightning.strategies.strategy import TBroadcast from pytorch_lightning.utilities.distributed import ReduceOp -from pytorch_lightning.utilities.enums import _StrategyType from pytorch_lightning.utilities.exceptions import MisconfigurationException from pytorch_lightning.utilities.imports import _BAGUA_AVAILABLE from pytorch_lightning.utilities.seed import reset_seed @@ -58,7 +57,7 @@ def __init__(self, pl_module: "pl.LightningModule") -> None: class BaguaStrategy(DDPStrategy): - distributed_backend = _StrategyType.BAGUA + strategy_name = "bagua" def __init__( self, @@ -180,8 +179,12 @@ def _setup_model(self, model: Module) -> BaguaDistributedDataParallel: ) @classmethod - def register_plugins(cls, plugin_registry: Dict) -> None: - plugin_registry.register("bagua", cls, description="Default Bagua Plugin") + def register_strategies(cls, strategy_registry: Dict) -> None: + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) def teardown(self) -> None: # abort the background communication for async algorithm diff --git 
a/pytorch_lightning/strategies/ddp.py b/pytorch_lightning/strategies/ddp.py index 6444e489c9b2f..b5d83478101f1 100644 --- a/pytorch_lightning/strategies/ddp.py +++ b/pytorch_lightning/strategies/ddp.py @@ -45,7 +45,6 @@ from pytorch_lightning.utilities.distributed import _revert_sync_batchnorm, distributed_available from pytorch_lightning.utilities.distributed import group as _group from pytorch_lightning.utilities.distributed import init_dist_connection, ReduceOp, sync_ddp_if_available -from pytorch_lightning.utilities.enums import _StrategyType from pytorch_lightning.utilities.exceptions import DeadlockDetectedException from pytorch_lightning.utilities.rank_zero import rank_zero_only, rank_zero_warn from pytorch_lightning.utilities.seed import reset_seed @@ -63,7 +62,7 @@ class DDPStrategy(ParallelStrategy): """Strategy for multi-process single-device training on one or multiple nodes.""" - distributed_backend = _StrategyType.DDP + strategy_name = "ddp" def __init__( self, @@ -96,7 +95,6 @@ def __init__( self._pids: Optional[List[int]] = None self._sync_dir: Optional[str] = None self._rank_0_will_call_children_scripts: bool = False - self.set_world_ranks() @property def is_distributed(self) -> bool: @@ -114,7 +112,6 @@ def num_nodes(self) -> int: def num_nodes(self, num_nodes: int) -> None: # note that world ranks is related to num_nodes, when resetting it, need to reset world ranks self._num_nodes = num_nodes - self.set_world_ranks() @property def num_processes(self): @@ -346,6 +343,11 @@ def register_strategies(cls, strategy_registry: Dict) -> None: description="DDP Strategy with `find_unused_parameters` as False", find_unused_parameters=False, ) + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) def _should_run_deadlock_detection(self) -> bool: """Determines whether the plugin will perform process reconciliation in case of errors. diff --git a/pytorch_lightning/strategies/ddp2.py b/pytorch_lightning/strategies/ddp2.py index 9bde0f67e1b1a..2023316e0e118 100644 --- a/pytorch_lightning/strategies/ddp2.py +++ b/pytorch_lightning/strategies/ddp2.py @@ -11,18 +11,19 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
+from typing import Dict + import torch from pytorch_lightning.strategies.ddp import DDPStrategy from pytorch_lightning.utilities.apply_func import apply_to_collection -from pytorch_lightning.utilities.enums import _StrategyType from pytorch_lightning.utilities.types import _METRIC_COLLECTION class DDP2Strategy(DDPStrategy): """DDP2 behaves like DP in one node, but synchronization across nodes behaves like in DDP.""" - distributed_backend = _StrategyType.DDP2 + strategy_name = "ddp2" @property def global_rank(self) -> int: @@ -73,3 +74,11 @@ def set_world_ranks(self) -> None: return self.cluster_environment.set_global_rank(self.node_rank) self.cluster_environment.set_world_size(self.num_nodes) + + @classmethod + def register_strategies(cls, strategy_registry: Dict) -> None: + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) diff --git a/pytorch_lightning/strategies/ddp_spawn.py b/pytorch_lightning/strategies/ddp_spawn.py index 9b58137d2719d..0eb4b68651aa8 100644 --- a/pytorch_lightning/strategies/ddp_spawn.py +++ b/pytorch_lightning/strategies/ddp_spawn.py @@ -33,7 +33,6 @@ from pytorch_lightning.utilities.distributed import _revert_sync_batchnorm, distributed_available from pytorch_lightning.utilities.distributed import group as _group from pytorch_lightning.utilities.distributed import init_dist_connection, ReduceOp, sync_ddp_if_available -from pytorch_lightning.utilities.enums import _StrategyType from pytorch_lightning.utilities.rank_zero import rank_zero_only, rank_zero_warn from pytorch_lightning.utilities.seed import reset_seed from pytorch_lightning.utilities.types import STEP_OUTPUT @@ -48,7 +47,7 @@ class DDPSpawnStrategy(ParallelStrategy): """Spawns processes using the :func:`torch.multiprocessing.spawn` method and joins processes after training finishes.""" - distributed_backend = _StrategyType.DDP_SPAWN + strategy_name = "ddp_spawn" def __init__( self, @@ -76,7 +75,6 @@ def __init__( self._ddp_comm_hook = ddp_comm_hook self._ddp_comm_wrapper = ddp_comm_wrapper self._local_rank = 0 - self.set_world_ranks() @property def num_nodes(self) -> int: @@ -86,7 +84,6 @@ def num_nodes(self) -> int: def num_nodes(self, num_nodes: int) -> None: # note that world ranks is related to num_nodes, when resetting it, need to reset world ranks self._num_nodes = num_nodes - self.set_world_ranks() @property def local_rank(self) -> int: @@ -264,6 +261,11 @@ def register_strategies(cls, strategy_registry: Dict) -> None: description="DDPSpawn Strategy with `find_unused_parameters` as False", find_unused_parameters=False, ) + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) def teardown(self) -> None: super().teardown() diff --git a/pytorch_lightning/strategies/deepspeed.py b/pytorch_lightning/strategies/deepspeed.py index fa9c4d5376ff8..cbf66b7040d22 100644 --- a/pytorch_lightning/strategies/deepspeed.py +++ b/pytorch_lightning/strategies/deepspeed.py @@ -35,7 +35,7 @@ from pytorch_lightning.utilities import GradClipAlgorithmType from pytorch_lightning.utilities.apply_func import apply_to_collection from pytorch_lightning.utilities.distributed import log -from pytorch_lightning.utilities.enums import _StrategyType, AMPType, PrecisionType +from pytorch_lightning.utilities.enums import AMPType, PrecisionType from pytorch_lightning.utilities.exceptions import MisconfigurationException from pytorch_lightning.utilities.imports import _DEEPSPEED_AVAILABLE from pytorch_lightning.utilities.model_helpers 
import is_overridden @@ -82,7 +82,7 @@ def _move_float_tensors_to_half(self, batch: Any): class DeepSpeedStrategy(DDPStrategy): - distributed_backend = _StrategyType.DEEPSPEED + strategy_name = "deepspeed" DEEPSPEED_ENV_VAR = "PL_DEEPSPEED_CONFIG_PATH" def __init__( diff --git a/pytorch_lightning/strategies/dp.py b/pytorch_lightning/strategies/dp.py index 0c9723c183a5e..484f7b474b02f 100644 --- a/pytorch_lightning/strategies/dp.py +++ b/pytorch_lightning/strategies/dp.py @@ -11,7 +11,7 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. -from typing import Any, List, Optional +from typing import Any, Dict, List, Optional import torch from torch.nn import DataParallel, Module @@ -22,7 +22,6 @@ from pytorch_lightning.plugins.precision import PrecisionPlugin from pytorch_lightning.strategies.parallel import ParallelStrategy from pytorch_lightning.utilities.apply_func import apply_to_collection -from pytorch_lightning.utilities.enums import _StrategyType from pytorch_lightning.utilities.model_helpers import is_overridden from pytorch_lightning.utilities.types import _METRIC_COLLECTION, STEP_OUTPUT @@ -31,7 +30,7 @@ class DataParallelStrategy(ParallelStrategy): """Implements data-parallel training in a single process, i.e., the model gets replicated to each device and each gets a split of the data.""" - distributed_backend = _StrategyType.DP + strategy_name = "dp" def __init__( self, @@ -149,6 +148,14 @@ def training_step_end(self, output): return output + @classmethod + def register_strategies(cls, strategy_registry: Dict) -> None: + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) + def teardown(self) -> None: super().teardown() if self.root_device.type == "cuda": diff --git a/pytorch_lightning/strategies/fully_sharded.py b/pytorch_lightning/strategies/fully_sharded.py index 9a24197c6c33d..af2d6d74bfdd2 100644 --- a/pytorch_lightning/strategies/fully_sharded.py +++ b/pytorch_lightning/strategies/fully_sharded.py @@ -23,7 +23,7 @@ from pytorch_lightning.plugins.precision import PrecisionPlugin from pytorch_lightning.strategies.ddp import DDPStrategy from pytorch_lightning.utilities import _FAIRSCALE_FULLY_SHARDED_AVAILABLE -from pytorch_lightning.utilities.enums import _StrategyType, PrecisionType +from pytorch_lightning.utilities.enums import PrecisionType from pytorch_lightning.utilities.exceptions import MisconfigurationException from pytorch_lightning.utilities.types import STEP_OUTPUT @@ -36,7 +36,7 @@ class DDPFullyShardedStrategy(DDPStrategy): - distributed_backend = _StrategyType.DDP_FULLY_SHARDED + strategy_name = "ddp_fully_sharded" def __init__( self, @@ -212,3 +212,9 @@ def register_strategies(cls, strategy_registry: Dict) -> None: strategy_registry.register( "fsdp", cls, description="Fully sharded training with checkpointing the full state dict." ) + + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) diff --git a/pytorch_lightning/strategies/horovod.py b/pytorch_lightning/strategies/horovod.py index a69850b60f9c0..f4a733909651e 100644 --- a/pytorch_lightning/strategies/horovod.py +++ b/pytorch_lightning/strategies/horovod.py @@ -12,7 +12,7 @@ # See the License for the specific language governing permissions and # limitations under the License. 
from contextlib import ExitStack -from typing import Any, List, Optional, Tuple, Union +from typing import Any, Dict, List, Optional, Tuple, Union import torch import torch.nn as nn @@ -26,7 +26,6 @@ from pytorch_lightning.utilities.distributed import distributed_available from pytorch_lightning.utilities.distributed import group as dist_group from pytorch_lightning.utilities.distributed import ReduceOp -from pytorch_lightning.utilities.enums import _StrategyType from pytorch_lightning.utilities.imports import _HOROVOD_AVAILABLE from pytorch_lightning.utilities.rank_zero import rank_zero_only @@ -37,7 +36,7 @@ class HorovodStrategy(ParallelStrategy): """Plugin for Horovod distributed training integration.""" - distributed_backend = _StrategyType.HOROVOD + strategy_name = "horovod" def __init__( self, @@ -196,6 +195,14 @@ def _filter_named_parameters(model: nn.Module, optimizer: Optimizer) -> List[Tup opt_params = {p for group in optimizer.param_groups for p in group.get("params", [])} return [(name, p) for name, p in model.named_parameters() if p in opt_params] + @classmethod + def register_strategies(cls, strategy_registry: Dict) -> None: + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) + def teardown(self) -> None: super().teardown() # teardown may be called before `_exit_stack` is set diff --git a/pytorch_lightning/strategies/ipu.py b/pytorch_lightning/strategies/ipu.py index 6b6433841d5ae..6f6f4dd92a1f9 100644 --- a/pytorch_lightning/strategies/ipu.py +++ b/pytorch_lightning/strategies/ipu.py @@ -13,7 +13,7 @@ # limitations under the License. import json import os -from typing import Any, Callable, List, Optional, Union +from typing import Any, Callable, Dict, List, Optional, Union import torch from torch.utils.data import DataLoader @@ -62,6 +62,8 @@ def _move_float_tensors_to_half(self, batch: Any) -> Any: class IPUStrategy(ParallelStrategy): """Plugin for training on IPU devices.""" + strategy_name = "ipu_strategy" + def __init__( self, accelerator: Optional["pl.accelerators.accelerator.Accelerator"] = None, @@ -360,3 +362,11 @@ def all_gather(self, tensor: torch.Tensor, group: Optional[Any] = None, sync_gra def broadcast(self, obj: object, src: int = 0) -> object: return obj + + @classmethod + def register_strategies(cls, strategy_registry: Dict) -> None: + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) diff --git a/pytorch_lightning/strategies/sharded.py b/pytorch_lightning/strategies/sharded.py index 2d1584a2e15e5..6811721ecaab7 100644 --- a/pytorch_lightning/strategies/sharded.py +++ b/pytorch_lightning/strategies/sharded.py @@ -22,7 +22,7 @@ from pytorch_lightning.core.optimizer import LightningOptimizer from pytorch_lightning.strategies.ddp import DDPStrategy from pytorch_lightning.trainer.states import TrainerFn -from pytorch_lightning.utilities.enums import _StrategyType, PrecisionType +from pytorch_lightning.utilities.enums import PrecisionType from pytorch_lightning.utilities.exceptions import MisconfigurationException from pytorch_lightning.utilities.imports import _FAIRSCALE_AVAILABLE, _FAIRSCALE_OSS_FP16_BROADCAST_AVAILABLE from pytorch_lightning.utilities.rank_zero import rank_zero_only @@ -37,7 +37,7 @@ class DDPShardedStrategy(DDPStrategy): """Optimizer and gradient sharded training provided by FairScale.""" - distributed_backend = _StrategyType.DDP_SHARDED + strategy_name = "ddp_sharded" _REDUCE_BUFFER_SIZE_DEFAULT: int = 2 ** 23 # 8M def 
configure_ddp(self) -> None: @@ -135,3 +135,8 @@ def register_strategies(cls, strategy_registry: Dict) -> None: description="DDP Sharded Strategy with `find_unused_parameters` as False", find_unused_parameters=False, ) + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) diff --git a/pytorch_lightning/strategies/sharded_spawn.py b/pytorch_lightning/strategies/sharded_spawn.py index 289e3491be0b4..8cb6ca8b62028 100644 --- a/pytorch_lightning/strategies/sharded_spawn.py +++ b/pytorch_lightning/strategies/sharded_spawn.py @@ -21,7 +21,6 @@ import pytorch_lightning as pl from pytorch_lightning.strategies.ddp_spawn import DDPSpawnStrategy from pytorch_lightning.trainer.states import TrainerFn -from pytorch_lightning.utilities.enums import _StrategyType from pytorch_lightning.utilities.exceptions import MisconfigurationException from pytorch_lightning.utilities.imports import _FAIRSCALE_AVAILABLE from pytorch_lightning.utilities.rank_zero import rank_zero_only @@ -36,7 +35,7 @@ class DDPSpawnShardedStrategy(DDPSpawnStrategy): """Optimizer sharded training provided by FairScale.""" - distributed_backend = _StrategyType.DDP_SHARDED_SPAWN + strategy_name = "ddp_sharded_spawn" def configure_ddp(self) -> None: self.model, self.optimizers = self._setup_model_and_optimizers( @@ -118,3 +117,8 @@ def register_strategies(cls, strategy_registry: Dict) -> None: description="DDP Spawn Sharded Strategy with `find_unused_parameters` as False", find_unused_parameters=False, ) + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) diff --git a/pytorch_lightning/strategies/single_device.py b/pytorch_lightning/strategies/single_device.py index 440c73afce8fc..da80bad32ad13 100644 --- a/pytorch_lightning/strategies/single_device.py +++ b/pytorch_lightning/strategies/single_device.py @@ -27,9 +27,11 @@ class SingleDeviceStrategy(Strategy): """Strategy that handles communication on a single device.""" + strategy_name = "single_device" + def __init__( self, - device: _DEVICE, + device: _DEVICE = "cpu", accelerator: pl.accelerators.accelerator.Accelerator | None = None, checkpoint_io: CheckpointIO | None = None, precision_plugin: PrecisionPlugin | None = None, @@ -79,6 +81,14 @@ def barrier(self, *args, **kwargs) -> None: def broadcast(self, obj: object, src: int = 0) -> object: return obj + @classmethod + def register_strategies(cls, strategy_registry: dict) -> None: + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) + def teardown(self) -> None: super().teardown() if self.root_device.type == "cuda": diff --git a/pytorch_lightning/strategies/single_tpu.py b/pytorch_lightning/strategies/single_tpu.py index 8465656f034ab..757b335e5ae2c 100644 --- a/pytorch_lightning/strategies/single_tpu.py +++ b/pytorch_lightning/strategies/single_tpu.py @@ -12,7 +12,7 @@ # See the License for the specific language governing permissions and # limitations under the License. 
import os -from typing import Optional +from typing import Dict, Optional import pytorch_lightning as pl from pytorch_lightning.plugins.io.xla_plugin import XLACheckpointIO @@ -28,6 +28,8 @@ class SingleTPUStrategy(SingleDeviceStrategy): """Strategy for training on a single TPU device.""" + strategy_name = "single_tpu" + def __init__( self, device: int, @@ -71,6 +73,14 @@ def setup(self, trainer: "pl.Trainer") -> None: def model_to_device(self) -> None: self.model.to(self.root_device) + @classmethod + def register_strategies(cls, strategy_registry: Dict) -> None: + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) + def teardown(self) -> None: super().teardown() # TPU teardown diff --git a/pytorch_lightning/strategies/strategy.py b/pytorch_lightning/strategies/strategy.py index 37b9b435b7413..e4d8827e9a3c0 100644 --- a/pytorch_lightning/strategies/strategy.py +++ b/pytorch_lightning/strategies/strategy.py @@ -449,7 +449,7 @@ def teardown(self) -> None: self.precision_plugin.teardown() @classmethod - def register_strategies(cls, strategies_registry) -> None: + def register_strategies(cls, strategy_registry) -> None: pass def on_train_start(self) -> None: diff --git a/pytorch_lightning/strategies/strategy_registry.py b/pytorch_lightning/strategies/strategy_registry.py index b0d7995053a30..17e08acb23bcc 100644 --- a/pytorch_lightning/strategies/strategy_registry.py +++ b/pytorch_lightning/strategies/strategy_registry.py @@ -75,7 +75,7 @@ def register( def do_register(strategy: Callable) -> Callable: data["strategy"] = strategy - data["distributed_backend"] = strategy.distributed_backend + data["strategy_name"] = strategy.strategy_name self[name] = data return strategy diff --git a/pytorch_lightning/strategies/tpu_spawn.py b/pytorch_lightning/strategies/tpu_spawn.py index f3d855b43f8a6..d97797f92daa2 100644 --- a/pytorch_lightning/strategies/tpu_spawn.py +++ b/pytorch_lightning/strategies/tpu_spawn.py @@ -48,6 +48,8 @@ class TPUSpawnStrategy(DDPSpawnStrategy): """Strategy for training multiple TPU devices using the :func:`torch.multiprocessing.spawn` method.""" + strategy_name = "tpu_spawn" + def __init__( self, accelerator: Optional["pl.accelerators.accelerator.Accelerator"] = None, @@ -296,3 +298,9 @@ def register_strategies(cls, strategy_registry: Dict) -> None: strategy_registry.register( "tpu_spawn_debug", cls, description="TPUSpawn Strategy with `debug` as True", debug=True ) + + strategy_registry.register( + cls.strategy_name, + cls, + description=f"{cls.__class__.__name__}", + ) diff --git a/pytorch_lightning/trainer/connectors/accelerator_connector.py b/pytorch_lightning/trainer/connectors/accelerator_connector.py index 8f770feb790c3..20c5f485b4e71 100644 --- a/pytorch_lightning/trainer/connectors/accelerator_connector.py +++ b/pytorch_lightning/trainer/connectors/accelerator_connector.py @@ -14,8 +14,7 @@ import logging import os -from typing import List, Optional, Sequence, Union -from weakref import proxy +from typing import List, Optional, Union import torch @@ -32,6 +31,7 @@ FullyShardedNativeMixedPrecisionPlugin, IPUPrecisionPlugin, NativeMixedPrecisionPlugin, + PLUGIN_INPUT, PrecisionPlugin, ShardedNativeMixedPrecisionPlugin, TPUBf16PrecisionPlugin, @@ -47,7 +47,6 @@ TorchElasticEnvironment, ) from pytorch_lightning.strategies import ( - BaguaStrategy, DataParallelStrategy, DDP2Strategy, DDPFullyShardedStrategy, @@ -58,975 +57,805 @@ DeepSpeedStrategy, HorovodStrategy, IPUStrategy, + ParallelStrategy, SingleDeviceStrategy, 
SingleTPUStrategy, Strategy, StrategyRegistry, TPUSpawnStrategy, ) -from pytorch_lightning.utilities import _AcceleratorType, _StrategyType, AMPType, device_parser -from pytorch_lightning.utilities.enums import PrecisionType -from pytorch_lightning.utilities.exceptions import MisconfigurationException -from pytorch_lightning.utilities.imports import ( - _HOROVOD_AVAILABLE, - _IPU_AVAILABLE, - _TORCH_GREATER_EQUAL_1_8, - _TPU_AVAILABLE, +from pytorch_lightning.utilities import ( + _StrategyType, + AMPType, + device_parser, + LightningEnum, + rank_zero_deprecation, + rank_zero_info, + rank_zero_warn, ) -from pytorch_lightning.utilities.rank_zero import rank_zero_deprecation, rank_zero_info, rank_zero_warn +from pytorch_lightning.utilities.exceptions import MisconfigurationException +from pytorch_lightning.utilities.imports import _HOROVOD_AVAILABLE, _IPU_AVAILABLE, _TPU_AVAILABLE + +log = logging.getLogger(__name__) if _HOROVOD_AVAILABLE: import horovod.torch as hvd -log = logging.getLogger(__name__) - class AcceleratorConnector: def __init__( self, - num_processes, - devices, - tpu_cores, - ipus, - accelerator, - strategy: Optional[Union[str, Strategy]], - gpus, - gpu_ids, - num_nodes, - sync_batchnorm, - benchmark, - replace_sampler_ddp, - deterministic: bool, - precision, - amp_type, - amp_level, - plugins, - ): - # initialization - self._device_type = _AcceleratorType.CPU - self._strategy_type = None - self._accelerator_type = None - - self._strategy_flag = strategy.lower() if isinstance(strategy, str) else strategy - # TODO: Rename this to something else once all the distributed flags are moved to strategy - self.distributed_backend = accelerator - - self._init_deterministic(deterministic) - - self.num_processes = num_processes - self.devices = devices - # `gpus` is the input passed to the Trainer, whereas `gpu_ids` is a list of parsed gpu ids. - self.gpus = gpus - self.parallel_device_ids = gpu_ids - self.tpu_cores = tpu_cores - self.ipus = ipus - self.num_nodes = num_nodes - self.sync_batchnorm = sync_batchnorm - self.benchmark = benchmark + devices: Optional[Union[List[int], str, int]] = None, + num_nodes: int = 1, + accelerator: Optional[Union[str, Accelerator]] = None, + strategy: Optional[Union[str, Strategy]] = None, + plugins: Optional[Union[PLUGIN_INPUT, List[PLUGIN_INPUT]]] = None, + precision: Union[int, str] = 32, + amp_type: str = "native", + amp_level: Optional[str] = None, + sync_batchnorm: bool = False, + benchmark: bool = False, + replace_sampler_ddp: bool = True, + deterministic: bool = False, + num_processes: Optional[int] = None, # deprecated + tpu_cores: Optional[Union[List[int], int]] = None, # deprecated + ipus: Optional[int] = None, # deprecated + gpus: Optional[Union[List[int], str, int]] = None, # deprecated + gpu_ids: Optional[List[int]] = None, # TODO can be removed + ) -> None: + """The AcceleratorConnector parses several Trainer arguments and instantiates the Strategy including other + components such as the Accelerator and Precision plugins. + + A. accelerator flag could be: + 1. strategy class (deprecated in 1.5 will be removed in 1.7) + 2. strategy str (deprecated in 1.5 will be removed in 1.7) + 3. accelerator class + 4. accelerator str + 5. accelerator auto + + B. strategy flag could be : + 1. strategy class + 2. strategy str registered with StrategyRegistry + 3. strategy str in _strategy_type enum which listed in each strategy as + backend (registed these too, and _strategy_type could be deprecated) + + C. plugins flag could be: + 1. 
List of str, which could contain: + i. strategy str + ii. precision str (Not supported in the old accelerator_connector version) + iii. checkpoint_io str (Not supported in the old accelerator_connector version) + iv. cluster_environment str (Not supported in the old accelerator_connector version) + 2. List of class, which could contains: + i. strategy class (deprecated in 1.5 will be removed in 1.7) + ii. precision class (should be removed, and precision flag should allow user pass classes) + iii. checkpoint_io class + iv. cluster_environment class + + + priorities which to take when: + A. Class > str + B. Strategy > Accelerator/precision/plugins + C. TODO When multiple flag set to the same thing + """ + # TODO: move to gpu accelerator + torch.backends.cudnn.benchmark = benchmark self.replace_sampler_ddp = replace_sampler_ddp - if not PrecisionType.supported_type(precision): - raise MisconfigurationException( - f"Precision {repr(precision)} is invalid. Allowed precision values: {PrecisionType.supported_types()}" - ) - self.precision = precision - self.amp_type = amp_type.lower() if isinstance(amp_type, str) else None - self.amp_level = amp_level - - self._precision_plugin: Optional[PrecisionPlugin] = None - self._strategy: Optional[Strategy] = None - self._cluster_environment: Optional[ClusterEnvironment] = None - self._checkpoint_io: Optional[CheckpointIO] = None - - plugins = plugins if plugins is not None else [] - - if isinstance(plugins, str): - plugins = [plugins] - - if not isinstance(plugins, Sequence): - plugins = [plugins] - - self.plugins = plugins - - self._handle_accelerator_and_strategy() - - self._validate_accelerator_and_devices() - - self._warn_if_devices_flag_ignored() - - self.select_accelerator_type() - - if self._strategy_flag is not None: - self._set_strategy() - else: - self.set_distributed_mode() - - self.handle_given_plugins() - self._set_strategy_type_if_strategy_passed() + self.sync_batchnorm = sync_batchnorm - self._cluster_environment = self.select_cluster_environment() + # 1. Parsing flags + # Get registered strategies, built-in accelerators and precision plugins + self._registered_strategies = StrategyRegistry.available_strategies() + self._accelerator_types = ("tpu", "ipu", "gpu", "cpu") + self._precision_types = ("16", "32", "64", "bf16", "mixed") + + # Raise an exception if there are conflicts between flags + # Set each valid flag to `self._x_flag` after validation + # Example: If accelerator is set to a strategy type, set `self._strategy_flag = accelerator`. + # For devices: Assign gpus, ipus, etc. to the accelerator flag and devices flag + self._strategy_flag: Optional[Union[Strategy, str]] = None + self._accelerator_flag: Optional[Union[Accelerator, str]] = None + self._precision_flag: Optional[Union[int, str]] = None + self._precision_plugin_flag: Optional[PrecisionPlugin] = None + self._cluster_environment_flag: Optional[Union[ClusterEnvironment, str]] = None + self.checkpoint_io: Optional[CheckpointIO] = None + self._amp_type_flag: Optional[LightningEnum] = None + self._amp_level_flag: Optional[str] = amp_level + + self._check_config_and_set_final_flags( + strategy=strategy, + accelerator=accelerator, + precision=precision, + plugins=plugins, + amp_type=amp_type, + amp_level=amp_level, + ) + self._check_device_config_and_set_final_flags( + devices=devices, num_nodes=num_nodes, num_processes=num_processes, gpus=gpus, ipus=ipus, tpu_cores=tpu_cores + ) - self.update_device_type_if_ipu_plugin() - self.update_device_type_if_strategy_passed() + # 2. 
Instantiate Accelerator + # handle `auto` and `None` + self._set_accelerator_if_ipu_strategy_is_passed() + if self._accelerator_flag == "auto" or self._accelerator_flag is None: + self._accelerator_flag = self._choose_accelerator() + self._set_parallel_devices_and_init_accelerator() - self._validate_accelerator_type() - self._set_devices_if_none() + # 3. Instantiate ClusterEnvironment + self.cluster_environment: ClusterEnvironment = self._choose_and_init_cluster_environment() - self.strategy = self.final_strategy() - self.strategy._configure_launcher() - self.accelerator = self.strategy.accelerator - self._check_plugin_compatibility() + # 4. Instantiate Strategy - Part 1 + if self._strategy_flag is None: + self._strategy_flag = self._choose_strategy() + # In specific cases, ignore user selection and fall back to a different strategy + self._check_strategy_and_fallback() + self._init_strategy() - # benchmarking - # TODO: should this be moved to GPU accelerator? - torch.backends.cudnn.benchmark = self.benchmark + # 5. Instantiate Precision Plugin + self.precision_plugin = self._check_and_init_precision() - self.replace_sampler_ddp = replace_sampler_ddp + # 6. Instantiate Strategy - Part 2 + self._lazy_init_strategy() - def _init_deterministic(self, deterministic: bool) -> None: - self.deterministic = deterministic - if _TORCH_GREATER_EQUAL_1_8: - torch.use_deterministic_algorithms(deterministic) - else: - torch.set_deterministic(deterministic) - if deterministic: - # fixing non-deterministic part of horovod - # https://github.com/PyTorchLightning/pytorch-lightning/pull/1572/files#r420279383 - os.environ["HOROVOD_FUSION_THRESHOLD"] = str(0) - # https://docs.nvidia.com/cuda/cublas/index.html#cublasApi_reproducibility - os.environ["CUBLAS_WORKSPACE_CONFIG"] = ":4096:8" - - def select_accelerator_type(self) -> None: - if self.distributed_backend == "auto": - if self.has_tpu: - self._accelerator_type = _AcceleratorType.TPU - elif self.has_ipu: - self._accelerator_type = _AcceleratorType.IPU - elif self.has_gpu: - self._accelerator_type = _AcceleratorType.GPU - else: - self._set_devices_to_cpu_num_processes() - self._accelerator_type = _AcceleratorType.CPU - elif self.distributed_backend == _AcceleratorType.TPU: - if not self.has_tpu: - msg = "TPUs are not available" if not _TPU_AVAILABLE else "you didn't pass `tpu_cores` to `Trainer`" - raise MisconfigurationException(f"You passed `accelerator='tpu'`, but {msg}.") - self._accelerator_type = _AcceleratorType.TPU - elif self.distributed_backend == _AcceleratorType.IPU: - if not self.has_ipu: - msg = "IPUs are not available" if not _IPU_AVAILABLE else "you didn't pass `ipus` to `Trainer`" - raise MisconfigurationException(f"You passed `accelerator='ipu'`, but {msg}.") - self._accelerator_type = _AcceleratorType.IPU - elif self.distributed_backend == _AcceleratorType.GPU: - if not self.has_gpu: - msg = "you didn't pass `gpus` to `Trainer`" if torch.cuda.is_available() else "GPUs are not available" - raise MisconfigurationException(f"You passed `accelerator='gpu'`, but {msg}.") - self._accelerator_type = _AcceleratorType.GPU - elif self.distributed_backend == _AcceleratorType.CPU: - self._set_devices_to_cpu_num_processes() - self._accelerator_type = _AcceleratorType.CPU - - if self.distributed_backend in self.accelerator_types: - self.distributed_backend = None - - def _validate_accelerator_and_devices(self) -> None: - if self.distributed_backend not in self.accelerator_types and self.devices is not None: - raise MisconfigurationException( - f"You 
passed `devices={self.devices}` but haven't specified" - " `accelerator=('auto'|'tpu'|'gpu'|'ipu'|'cpu')` for the devices mapping," - f" got `accelerator={self.distributed_backend!r}`." - ) + def _check_config_and_set_final_flags( + self, + strategy: Optional[Union[str, Strategy]], + accelerator: Optional[Union[str, Accelerator]], + precision: Union[int, str], + plugins: Optional[Union[PLUGIN_INPUT, List[PLUGIN_INPUT]]], + amp_type: str, + amp_level: Optional[str], + ) -> None: + """This method checks: + + 1. strategy: strategy, accelerator and plugin can all be set to strategies + 2. accelerator: if the value of the accelerator argument is a type of accelerator (instance or string), + set self._accelerator_flag accordingly. If the value is strategy related (instance or string), + it gets handled by 1. + 3. precision: The final value of the precision flag may be determined either by the precision argument or + by a plugin instance. + 4. plugins: a plugin could occur as a value of the strategy argument (handled by 1), or the precision + argument (handled by 3). We also extract the CheckpointIO and ClusterEnvironment plugins. + """ + if plugins is not None: + plugins = [plugins] if not isinstance(plugins, list) else plugins - def _validate_accelerator_type(self) -> None: - if self._accelerator_type and self._accelerator_type != self._device_type: - # internal error: should not happen. - raise ValueError( - f"Mismatch between the requested accelerator type ({self._accelerator_type})" - f" and assigned device type ({self._device_type})." - ) - self._accelerator_type = self._device_type - - def _warn_if_devices_flag_ignored(self) -> None: - if self.devices is None: - return - devices_warning = f"The flag `devices={self.devices}` will be ignored, as you have set" - if self.distributed_backend in ("auto", _AcceleratorType.TPU): - if self.tpu_cores is not None: - rank_zero_warn(f"{devices_warning} `tpu_cores={self.tpu_cores}`") - elif self.distributed_backend in ("auto", _AcceleratorType.IPU): - if self.ipus is not None: - rank_zero_warn(f"{devices_warning} `ipus={self.ipus}`") - elif self.distributed_backend in ("auto", _AcceleratorType.GPU): - if self.gpus is not None: - rank_zero_warn(f"{devices_warning} `gpus={self.gpus}`") - elif self.distributed_backend in ("auto", _AcceleratorType.CPU): - if self.num_processes != 1: - rank_zero_warn(f"{devices_warning} `num_processes={self.num_processes}`") - - def _set_devices_if_none(self) -> None: - if self.devices is not None: - return - if self._accelerator_type == _AcceleratorType.TPU: - self.devices = self.tpu_cores - elif self._accelerator_type == _AcceleratorType.IPU: - self.devices = self.ipus - elif self._accelerator_type == _AcceleratorType.GPU: - self.devices = self.gpus - elif self._accelerator_type == _AcceleratorType.CPU: - self.devices = self.num_processes - - def _handle_accelerator_and_strategy(self) -> None: - deprecated_types = [t for t in _StrategyType if t not in (_StrategyType.TPU_SPAWN, _StrategyType.DDP_CPU)] - if self.distributed_backend is not None and self.distributed_backend in deprecated_types: - rank_zero_deprecation( - f"Passing `Trainer(accelerator={self.distributed_backend!r})` has been deprecated" - f" in v1.5 and will be removed in v1.7. Use `Trainer(strategy={self.distributed_backend!r})` instead." 
- ) - if self._strategy_flag is not None: + if strategy is not None: + self._strategy_flag = strategy + if strategy == "ddp_cpu": raise MisconfigurationException( - f"You have passed `Trainer(strategy={self._strategy_flag!r})` but have" - f" also passed `Trainer(accelerator={self.distributed_backend!r})`." - f" HINT: Use just `Trainer(strategy={self._strategy_flag!r})` instead." + "`Trainer(strategy='ddp_cpu')` is not a valid strategy," + " you can use `Trainer(strategy='ddp'|'ddp_spawn', accelerator='cpu')` instead." ) - if self._strategy_flag == _StrategyType.TPU_SPAWN: - raise MisconfigurationException( - "`Trainer(strategy='tpu_spawn')` is not a valid strategy," - " you can use `Trainer(strategy='ddp_spawn', accelerator='tpu')` instead." - ) - if self._strategy_flag == _StrategyType.DDP_CPU: - raise MisconfigurationException( - "`Trainer(strategy='ddp_cpu')` is not a valid strategy," - " you can use `Trainer(strategy='ddp'|'ddp_spawn', accelerator='cpu')` instead." - ) - - def _set_strategy(self) -> None: - if isinstance(self._strategy_flag, str) and self._strategy_flag in StrategyRegistry: - self._strategy = StrategyRegistry.get(self._strategy_flag) - if isinstance(self._strategy_flag, str): - self.set_distributed_mode(self._strategy_flag) - elif isinstance(self._strategy_flag, Strategy): - self._strategy = self._strategy_flag - - def handle_given_plugins(self) -> None: - - for plug in self.plugins: - if self._strategy_flag is not None and self._is_plugin_training_type(plug): + if strategy == "tpu_spawn": + raise MisconfigurationException( + "`Trainer(strategy='tpu_spawn')` is not a valid strategy," + " you can use `Trainer(strategy='ddp_spawn', accelerator='tpu')` instead." + ) + # handle duplications and conflict + if isinstance(accelerator, Strategy) and strategy != accelerator: raise MisconfigurationException( - f"You have passed `Trainer(strategy={self._strategy_flag!r})`" - f" and you can only specify one training type plugin, but you have passed {plug} as a plugin." + f"Incompatible values set in `strategy` and `accelerator` arguments." + f"Received both strategy={strategy} and accelerator={accelerator}" ) - if self._is_plugin_training_type(plug): + if isinstance(accelerator, str) and accelerator in self._registered_strategies and strategy != accelerator: + raise MisconfigurationException( + f"strategy {strategy} already set through `strategy` flag," + f" but have also passed {accelerator} in through the accelerator flag." + ) + if plugins: + for plugin in plugins: + if isinstance(plugin, Strategy): + raise MisconfigurationException( + f"You have passed `Trainer(strategy={strategy})`" + f" and you can only specify one strategy, but you have passed {plugin} as a plugin." + ) + if isinstance(plugin, str) and plugin in self._registered_strategies: + raise MisconfigurationException( + f"You have passed `Trainer(strategy={strategy})`" + f" and you can only specify one strategy, but you have passed {plugin} as a plugin." + ) + + if accelerator is not None: + if accelerator in self._accelerator_types or accelerator == "auto" or isinstance(accelerator, Accelerator): + self._accelerator_flag = accelerator + elif accelerator in self._registered_strategies or isinstance(accelerator, Strategy): rank_zero_deprecation( - f"Passing {plug} `strategy` to the `plugins` flag in Trainer has been deprecated" - f" in v1.5 and will be removed in v1.7. Use `Trainer(strategy={plug})` instead." 
+ f"Passing `Trainer(accelerator={accelerator!r})` has been deprecated" + f" in v1.5 and will be removed in v1.7. Use `Trainer(strategy={accelerator!r})` instead." ) + self._strategy_flag = accelerator + elif accelerator == "ddp_cpu" and not self._strategy_flag: + self._strategy_flag = accelerator - strategy = self._strategy or None - checkpoint = None - precision = None - cluster_environment = None + if precision is not None: + if str(precision) not in self._precision_types: + raise MisconfigurationException( + f"Precision {repr(precision)} is invalid. Allowed precision values: {self._precision_types}" + ) + self._precision_flag = precision + + if plugins: + for plugin in plugins: + if isinstance(plugin, Strategy) or isinstance(plugin, str) and plugin in self._registered_strategies: + self._strategy_flag = plugin + rank_zero_deprecation( + f"Passing {plugin} `strategy` to the `plugins` flag in Trainer has been deprecated" + f" in v1.5 and will be removed in v1.7. Use `Trainer(strategy={plugin})` instead." + ) - for plug in self.plugins: - if isinstance(plug, str) and plug in StrategyRegistry: - if strategy is None: - strategy = StrategyRegistry.get(plug) + elif isinstance(plugin, PrecisionPlugin): + self._precision_plugin_flag = plugin + elif isinstance(plugin, str) and plugin in self._precision_types: + self._precision_flag = plugin + elif isinstance(plugin, CheckpointIO): + self.checkpoint_io = plugin + elif isinstance(plugin, ClusterEnvironment): + self._cluster_environment_flag = plugin else: raise MisconfigurationException( - "You can only specify one precision and one training type plugin." - " Found more than 1 training type plugin:" - f' {StrategyRegistry[plug]["strategy"]} registered to {plug}' + f"Found invalid type for plugin {plugin}. Expected a precision plugin or training strategy." ) - if isinstance(plug, str): - # Reset the distributed type as the user has overridden training type - # via the plugins argument - self._strategy_type = None - self.set_distributed_mode(plug) - elif isinstance(plug, Strategy): - if strategy is None: - strategy = plug - - else: + # handle the case when the user passes in a strategy instance which has an accelerator, precision, + # checkpoint io or cluster env set up + # TODO: @awaelchli improve the error messages below + if self._strategy_flag and isinstance(self._strategy_flag, Strategy): + if self._strategy_flag._accelerator: + if self._accelerator_flag: raise MisconfigurationException( - "You can only specify one training type plugin." - f" Available: {type(strategy).__name__}, given: {type(plug).__name__}" + "accelerator set through both strategy class and accelerator flag, choose one" ) - elif isinstance(plug, PrecisionPlugin): - if precision is None: - precision = plug else: - raise MisconfigurationException( - "You can only specify one precision plugin." - f" Available: {type(precision).__name__}, given: {type(plug).__name__}" - ) - elif isinstance(plug, CheckpointIO): - if checkpoint is None: - checkpoint = plug + self._accelerator_flag = self._strategy_flag._accelerator + if self._strategy_flag._precision_plugin: + # [RFC] handle precision plugin set up conflict? + if self._precision_plugin_flag: + raise MisconfigurationException("precision set through both strategy class and plugins, choose one") else: + self._precision_plugin_flag = self._strategy_flag._precision_plugin + if self._strategy_flag._checkpoint_io: + if self.checkpoint_io: raise MisconfigurationException( - "You can only specify one checkpoint plugin." 
- f" Available: {type(checkpoint).__name__}, given: {type(plug).__name__}" + "checkpoint_io set through both strategy class and plugins, choose one" ) - elif isinstance(plug, ClusterEnvironment): - if cluster_environment is None: - cluster_environment = plug else: + self.checkpoint_io = self._strategy_flag._checkpoint_io + if getattr(self._strategy_flag, "cluster_environment", None): + if self._cluster_environment_flag: raise MisconfigurationException( - "You can only specify one cluster environment. Found more than 1 cluster environment plugin" + "cluster_environment set through both strategy class and plugins, choose one" ) - else: - raise MisconfigurationException( - f"Found invalid type for plugin {plug}. Expected a precision or training type plugin." - ) - - self._strategy = strategy - self._precision_plugin = precision - self._checkpoint_io = checkpoint - self._cluster_environment = cluster_environment - - @property - def accelerator_types(self) -> List[str]: - return ["auto"] + list(_AcceleratorType) - - @property - def precision_plugin(self) -> PrecisionPlugin: - if self._precision_plugin is None: - self._precision_plugin = self.select_precision_plugin() - return self._precision_plugin - - def final_strategy(self) -> Strategy: - if self._strategy is None: - self._strategy = self.select_strategy() - self._strategy = self.resolve_strategy(self._strategy) - # attach checkpoint plugin to the training type plugin - if self._checkpoint_io is not None: - self._strategy.checkpoint_io = self._checkpoint_io - if ( - isinstance(self._strategy_flag, Strategy) and self._strategy_flag._precision_plugin is None - ) or not isinstance(self._strategy_flag, Strategy): - precision_plugin = self.precision_plugin - if precision_plugin is not None: - self._strategy.precision_plugin = precision_plugin - if (isinstance(self._strategy_flag, Strategy) and self._strategy_flag.accelerator is None) or not isinstance( - self._strategy_flag, Strategy - ): - self._strategy.accelerator = self.select_accelerator() - return self._strategy - - @property - def cluster_environment(self) -> ClusterEnvironment: - if self._cluster_environment is None: - self._cluster_environment = self.select_cluster_environment() - return self._cluster_environment - - @property - def has_cpu(self) -> bool: - return True + else: + self._cluster_environment_flag = getattr(self._strategy_flag, "cluster_environment") - @property - def use_cpu(self) -> bool: - return self._accelerator_type == _AcceleratorType.CPU + # TODO: RFC existing accel_conn doesn't handle this, should we add conflict check? + # eg: parallel_device is torch.device(cpu) but accelerator=gpu + if hasattr(self._strategy_flag, "parallel_devices"): + if self._strategy_flag.parallel_devices: + if self._strategy_flag.parallel_devices[0].type == "cpu": + self._accelerator_flag = "cpu" + if self._strategy_flag.parallel_devices[0].type == "cuda": + self._accelerator_flag = "gpu" - @property - def has_gpu(self) -> bool: - # Here, we are not checking for GPU availability, but instead if User has passed - # `gpus` to Trainer for training. 
- gpus = self.parallel_device_ids - if gpus is not None and len(gpus) > 0: - return True - return self._map_devices_to_accelerator(_AcceleratorType.GPU) + amp_type = amp_type if isinstance(amp_type, str) else None + self._amp_type_flag = AMPType.from_str(amp_type) - @property - def use_gpu(self) -> bool: - return self._accelerator_type == _AcceleratorType.GPU and self.has_gpu + if amp_level is not None and self._amp_type_flag != AMPType.APEX: + raise MisconfigurationException( + f"You have asked for `amp_level={amp_level!r}` but it's only supported with `amp_backend='apex'`." + ) - @property - def has_tpu(self) -> bool: - # Here, we are not checking for TPU availability, but instead if User has passed - # `tpu_cores` to Trainer for training. - if self.tpu_cores is not None: - return True - return self._map_devices_to_accelerator(_AcceleratorType.TPU) + def _check_device_config_and_set_final_flags( + self, + devices: Optional[Union[List[int], str, int]], + num_nodes: int, + num_processes: Optional[int], + gpus: Optional[Union[List[int], str, int]], + ipus: Optional[int], + tpu_cores: Optional[Union[List[int], int]], + ) -> None: + self._num_nodes_flag = int(num_nodes) if num_nodes is not None else 1 + self._devices_flag = devices + + # TODO: Delete this method when num_processes, gpus, ipus and tpu_cores gets removed + self._map_deprecated_devices_specfic_info_to_accelerator_and_device_flag( + devices, num_processes, gpus, ipus, tpu_cores + ) - @property - def use_tpu(self) -> bool: - return self._accelerator_type == _AcceleratorType.TPU and self.has_tpu + if self._devices_flag in ([], 0, "0", "0,"): + rank_zero_warn(f"You passed `devices={devices}`, switching to `cpu` accelerator") + self._accelerator_flag = "cpu" - @property - def tpu_id(self) -> Optional[int]: - if self.use_tpu and isinstance(self.tpu_cores, list): - return self.tpu_cores[0] - return None - - @property - def has_ipu(self) -> bool: - # Here, we are not checking for IPU availability, but instead if User has passed - # `ipus` to Trainer for training. 
- if self.ipus is not None or isinstance(self._strategy, IPUStrategy): - return True - return self._map_devices_to_accelerator(_AcceleratorType.IPU) + if self._devices_flag == "auto" and self._accelerator_flag is None: + raise MisconfigurationException( + f"You passed `devices={devices}` but haven't specified" + " `accelerator=('auto'|'tpu'|'gpu'|'ipu'|'cpu')` for the devices mapping" + ) - @property - def use_ipu(self) -> bool: - return self._accelerator_type == _AcceleratorType.IPU and self.has_ipu + def _map_deprecated_devices_specfic_info_to_accelerator_and_device_flag( + self, + devices: Optional[Union[List[int], str, int]], + num_processes: Optional[int], + gpus: Optional[Union[List[int], str, int]], + ipus: Optional[int], + tpu_cores: Optional[Union[List[int], str, int]], + ) -> None: + """Sets the `devices_flag` and `accelerator_flag` based on num_processes, gpus, ipus, tpu_cores.""" + self._gpus: Optional[Union[List[int], str, int]] = gpus + self._tpu_cores: Optional[Union[List[int], str, int]] = tpu_cores + gpus = device_parser.parse_gpu_ids(gpus) + tpu_cores = device_parser.parse_tpu_cores(tpu_cores) + deprecated_devices_specific_flag = num_processes or gpus or ipus or tpu_cores + if deprecated_devices_specific_flag and deprecated_devices_specific_flag not in (0, "0"): + if devices: + # TODO: @awaelchli improve error message + rank_zero_warn( + f"The flag `devices={devices}` will be ignored, " + f"instead the device specific number {deprecated_devices_specific_flag} will be used" + ) - def _set_devices_to_cpu_num_processes(self) -> None: - if self.num_processes == 1: - self._map_devices_to_accelerator(_AcceleratorType.CPU) + if [(num_processes is not None), (gpus is not None), (ipus is not None), (tpu_cores is not None)].count( + True + ) > 1: + # TODO: @awaelchli improve error message + rank_zero_warn("more than one device specific flag has been set") + self._devices_flag = deprecated_devices_specific_flag + + if self._accelerator_flag is None: + # set accelerator type based on num_processes, gpus, ipus, tpu_cores + if ipus: + self._accelerator_flag = "ipu" + if tpu_cores: + self._accelerator_flag = "tpu" + if gpus: + self._accelerator_flag = "gpu" + if num_processes: + self._accelerator_flag = "cpu" + + def _set_accelerator_if_ipu_strategy_is_passed(self) -> None: + # current logic only apply to object config + # TODO this logic should apply to both str and object config + if isinstance(self._strategy_flag, IPUStrategy): + self._accelerator_flag = "ipu" + + def _choose_accelerator(self) -> str: + """Choose the accelerator type (str) based on availability when ``accelerator='auto'``.""" + if self._accelerator_flag == "auto": + if _TPU_AVAILABLE: + return "tpu" + if _IPU_AVAILABLE: + return "ipu" + if torch.cuda.is_available() and torch.cuda.device_count() > 0: + return "gpu" + return "cpu" + + def _set_parallel_devices_and_init_accelerator(self) -> None: + # TODO add device availability check + self._parallel_devices: List[Union[int, torch.device]] = [] + + if isinstance(self._accelerator_flag, Accelerator): + self.accelerator: Accelerator = self._accelerator_flag + elif self._accelerator_flag == "tpu": + self.accelerator = TPUAccelerator() + self._set_devices_flag_if_auto_passed() + if isinstance(self._devices_flag, int): + self._parallel_devices = list(range(self._devices_flag)) + else: + self._parallel_devices = self._devices_flag # type: ignore[assignment] + + elif self._accelerator_flag == "ipu": + self.accelerator = IPUAccelerator() + 
self._set_devices_flag_if_auto_passed() + if isinstance(self._devices_flag, int): + self._parallel_devices = list(range(self._devices_flag)) + + elif self._accelerator_flag == "gpu": + self.accelerator = GPUAccelerator() + self._set_devices_flag_if_auto_passed() + if isinstance(self._devices_flag, int) or isinstance(self._devices_flag, str): + self._devices_flag = int(self._devices_flag) + self._parallel_devices = ( + [torch.device("cuda", i) for i in device_parser.parse_gpu_ids(self._devices_flag)] # type: ignore + if self._devices_flag != 0 + else [] + ) + else: + self._parallel_devices = [torch.device("cuda", i) for i in self._devices_flag] # type: ignore - def _map_devices_to_accelerator(self, accelerator: str) -> bool: - if self.devices is None: - return False - if accelerator == _AcceleratorType.TPU and _TPU_AVAILABLE: - if self.devices == "auto": - self.devices = TPUAccelerator.auto_device_count() - self.tpu_cores = device_parser.parse_tpu_cores(self.devices) - return True - if accelerator == _AcceleratorType.IPU and _IPU_AVAILABLE: - if self.devices == "auto": - self.devices = IPUAccelerator.auto_device_count() - self.ipus = self.devices - return True - if accelerator == _AcceleratorType.GPU and torch.cuda.is_available(): - if self.devices == "auto": - self.devices = GPUAccelerator.auto_device_count() - self.gpus = self.devices - self.parallel_device_ids = device_parser.parse_gpu_ids(self.devices) - return True - if accelerator == _AcceleratorType.CPU: - if self.devices == "auto": - self.devices = CPUAccelerator.auto_device_count() - if not isinstance(self.devices, int): - raise MisconfigurationException( + elif self._accelerator_flag == "cpu": + self.accelerator = CPUAccelerator() + self._set_devices_flag_if_auto_passed() + if isinstance(self._devices_flag, int): + self._parallel_devices = [torch.device("cpu")] * self._devices_flag + else: + rank_zero_warn( "The flag `devices` must be an int with `accelerator='cpu'`," - f" got `devices={self.devices}` instead." + f" got `devices={self._devices_flag}` instead." 
) - self.num_processes = self.devices - return True - return False - @property - def use_dp(self) -> bool: - return self._strategy_type == _StrategyType.DP + self._gpus = self._devices_flag if not self._gpus else self._gpus + self._tpu_cores = self._devices_flag if not self._tpu_cores else self._tpu_cores - @property - def use_ddp(self) -> bool: - return self._strategy_type in ( - _StrategyType.BAGUA, - _StrategyType.DDP, - _StrategyType.DDP_SPAWN, - _StrategyType.DDP_SHARDED, - _StrategyType.DDP_SHARDED_SPAWN, - _StrategyType.DDP_FULLY_SHARDED, - _StrategyType.DEEPSPEED, - _StrategyType.TPU_SPAWN, - ) + def _set_devices_flag_if_auto_passed(self) -> None: + if self._devices_flag == "auto" or not self._devices_flag: + self._devices_flag = self.accelerator.auto_device_count() - @property - def use_ddp2(self) -> bool: - return self._strategy_type == _StrategyType.DDP2 - - @property - def use_horovod(self) -> bool: - return self._strategy_type == _StrategyType.HOROVOD - - @property - def use_deepspeed(self) -> bool: - return self._strategy_type == _StrategyType.DEEPSPEED - - @property - def use_bagua(self) -> bool: - return self._strategy_type == _StrategyType.BAGUA - - @property - def _is_sharded_training_type(self) -> bool: - return isinstance(self._strategy, (DDPShardedStrategy, DDPSpawnShardedStrategy)) - - @property - def _is_fully_sharded_training_type(self) -> bool: - return isinstance(self._strategy, DDPFullyShardedStrategy) + def _choose_and_init_cluster_environment(self) -> ClusterEnvironment: + if isinstance(self._cluster_environment_flag, ClusterEnvironment): + return self._cluster_environment_flag + if self._is_slurm_managing_tasks(): + rank_zero_info("Multiprocessing is handled by SLURM.") + return SLURMEnvironment() + for env_type in (BaguaEnvironment, TorchElasticEnvironment, KubeflowEnvironment, LSFEnvironment): + if env_type.detect(): + return env_type() + return LightningEnvironment() - @property - def is_distributed(self) -> bool: - # Used for custom plugins. - # Custom plugins should implement is_distributed property. 
- if hasattr(self.strategy, "is_distributed") and not self.use_tpu: - return self.strategy.is_distributed - is_distributed = self.use_ddp or self.use_ddp2 or self.use_horovod - if self.use_tpu: - is_distributed |= self.strategy.is_distributed - return is_distributed + def _is_slurm_managing_tasks(self) -> bool: + """used by choosing cluster enviroment.""" + if not SLURMEnvironment.detect() or SLURMEnvironment.job_name() == "bash": + return False - @property - def num_gpus(self) -> int: - gpus = self.parallel_device_ids - if gpus is None: - return 0 - return len(gpus) + total_requested_devices = len(self._parallel_devices) * self._num_nodes_flag + num_slurm_tasks = int(os.environ["SLURM_NTASKS"], 0) + return num_slurm_tasks == total_requested_devices - @property - def num_ipus(self) -> int: - if isinstance(self.ipus, int): - return self.ipus - if isinstance(self._strategy, IPUStrategy): - return self._strategy.replication_factor - return 0 + def _choose_strategy(self) -> Union[Strategy, str]: + if self._accelerator_flag == "ipu": + return IPUStrategy.strategy_name + if self._accelerator_flag == "tpu": + if self._parallel_devices and len(self._parallel_devices) > 1: + return TPUSpawnStrategy.strategy_name + else: + # TODO: lazy initialized device, then here could be self._strategy_flag = "single_tpu_device" + return SingleTPUStrategy(device=self._parallel_devices[0]) # type: ignore + if _HOROVOD_AVAILABLE and ("OMPI_COMM_WORLD_RANK" in os.environ or "HOROVOD_RANK" in os.environ): + return HorovodStrategy.strategy_name + if self._num_nodes_flag > 1: + return DDPStrategy.strategy_name + if len(self._parallel_devices) <= 1: + device = ( + device_parser.determine_root_gpu_device(self._parallel_devices) # type: ignore + if self._accelerator_flag == "gpu" + else "cpu" + ) + # TODO: lazy initialized device, then here could be self._strategy_flag = "single_device" + return SingleDeviceStrategy(device=device) # type: ignore + if len(self._parallel_devices) > 1: + return DDPSpawnStrategy.strategy_name - @property - def parallel_devices(self) -> List[Union[torch.device, int]]: - if self.use_gpu: - devices = [torch.device("cuda", i) for i in self.parallel_device_ids] - elif self.use_tpu: - # explicitly don't make a tpu device here! 
- # https://github.com/PyTorchLightning/pytorch-lightning/issues/3169 - if isinstance(self.tpu_cores, int): - devices = list(range(self.tpu_cores)) - elif self.use_ipu: - devices = list(range(self.num_ipus)) - else: - devices = [torch.device("cpu")] * self.num_processes - return devices + return DDPStrategy.strategy_name - @property - def root_gpu(self) -> Optional[int]: - return ( - self.strategy.root_device.index - if not isinstance(self.accelerator, (IPUAccelerator, TPUAccelerator)) - else None - ) + def _check_strategy_and_fallback(self) -> None: + """Checks edge cases when the strategy selection was a string input, and we need to fall back to a + different choice depending on other parameters or the environment.""" + # current fallback and check logic only apply to user pass in str config and object config + # TODO this logic should apply to both str and object config + strategy_flag = "" if isinstance(self._strategy_flag, Strategy) else self._strategy_flag - @staticmethod - def _is_plugin_training_type(plugin: Union[str, Strategy]) -> bool: - if isinstance(plugin, str) and (plugin in StrategyRegistry or plugin in list(_StrategyType)): - return True - return isinstance(plugin, Strategy) + if strategy_flag == "ddp_cpu": + if _TPU_AVAILABLE: + raise MisconfigurationException( + "`accelerator='ddp_cpu'` is not supported on TPU machines. " + "Learn more: https://github.com/PyTorchLightning/pytorch-lightning/issues/7810" + ) + if self._devices_flag == 1 and self._num_nodes_flag > 1: + strategy_flag = DDPStrategy.strategy_name + else: + strategy_flag = "ddp_spawn" + if self._accelerator_flag == "gpu": + rank_zero_warn( + "You requested one or more GPUs, but set `accelerator='ddp_cpu'`. Training will not use GPUs." + ) + self._accelerator_flag = "cpu" + self.accelerator = CPUAccelerator() + if strategy_flag in ("ddp_spawn", "ddp_spawn_find_unused_parameters_false") and ( + TorchElasticEnvironment.detect() or KubeflowEnvironment.detect() or self._is_slurm_managing_tasks() + ): + strategy_flag = "ddp" + if strategy_flag in ("dp", "ddp2") and self._accelerator_flag == "cpu": + rank_zero_warn(f"{strategy_flag!r} is not supported on CPUs, hence setting `strategy='ddp'`.") + strategy_flag = "ddp" - @property - def is_training_type_in_plugins(self) -> bool: - return any( - (isinstance(plug, str) and plug in StrategyRegistry) or isinstance(plug, Strategy) for plug in self.plugins - ) + if strategy_flag: + self._strategy_flag = strategy_flag - def select_precision_plugin(self) -> PrecisionPlugin: - # set precision type - self.amp_type = AMPType.from_str(self.amp_type) + def _handle_horovod(self) -> None: + if self._num_nodes_flag > 1: + raise MisconfigurationException( + "Horovod does not support setting num_nodes / num_gpus explicitly. Use " + "horovodrun / mpirun to configure the number of processes." + ) - # validation for all plugins - if self.amp_level is not None and self.amp_type != AMPType.APEX: + if not _HOROVOD_AVAILABLE: raise MisconfigurationException( - f"You have asked for `amp_level={self.amp_level!r}` but it's only supported with `amp_backend='apex'`." + 'Requested `accelerator="horovod"`, but Horovod is not installed.' + "Install with \n $HOROVOD_WITH_PYTORCH=1 pip install horovod[pytorch]" ) - if self.use_ipu: - if self.precision not in (16, 32): - raise MisconfigurationException( - f"`Trainer(accelerator='ipu', precision={self.precision!r})` is not supported." 
- ) - return IPUPrecisionPlugin(self.precision) - if self.use_tpu: - if self.precision == 32: + hvd.init() + if isinstance(self.accelerator, GPUAccelerator): + # Horovod assigns one local GPU per process + self._parallel_devices = list(range(hvd.local_size())) + else: + self._parallel_devices = [torch.device("cpu")] * hvd.local_size() + + def _init_strategy(self) -> None: + """Instantiate the Strategy given depending on the setting of ``_strategy_flag``.""" + if isinstance(self._strategy_flag, HorovodStrategy) or self._strategy_flag == "horovod": + # handle horovod has to happen before initialize strategy because HorovodStrategy needs hvd.init() first. + # TODO lazy initialized and setup horovod strategy `global_rank` + self._handle_horovod() + if isinstance(self._strategy_flag, str): + self.strategy = StrategyRegistry.get(self._strategy_flag) + elif isinstance(self._strategy_flag, Strategy): + self.strategy = self._strategy_flag + else: + raise RuntimeError(f"{self.strategy} is not valid type: {self.strategy}") + + def _check_and_init_precision(self) -> PrecisionPlugin: + self._validate_precision_choice() + if isinstance(self._precision_plugin_flag, PrecisionPlugin): + return self._precision_plugin_flag + + if isinstance(self.accelerator, IPUAccelerator): + return IPUPrecisionPlugin(self._precision_flag) # type: ignore + if isinstance(self.accelerator, TPUAccelerator): + if self._precision_flag == 32: return TPUPrecisionPlugin() - elif self.precision == 64: - raise MisconfigurationException( - "`Trainer(accelerator='tpu', precision=64)` is not implemented." - " Please, open an issue in `https://github.com/PyTorchLightning/pytorch-lightning/issues`" - " requesting this feature." - ) - elif self.precision in (16, "bf16"): - if self.precision == 16: - # this is not deprecated to ease transition between accelerator environments + elif self._precision_flag in (16, "bf16"): + if self._precision_flag == 16: rank_zero_warn( - f"You passed `Trainer(accelerator='tpu', precision=16)` but {self.amp_type.value} AMP" - f" is not supported with TPUs. Using `precision='bf16'` instead." + "You passed `Trainer(accelerator='tpu', precision=16)` but AMP" + " is not supported with TPUs. Using `precision='bf16'` instead." ) return TPUBf16PrecisionPlugin() + if isinstance(self.strategy, DeepSpeedStrategy): + return DeepSpeedPrecisionPlugin( + self._precision_flag, self._amp_type_flag, self._amp_level_flag # type: ignore + ) - if self._strategy_type == _StrategyType.DEEPSPEED or isinstance(self._strategy, DeepSpeedStrategy): - return DeepSpeedPrecisionPlugin(self.precision, self.amp_type, self.amp_level) - - if self.precision == 32: + if self._precision_flag == 32: return PrecisionPlugin() - if self.precision == 64: + if self._precision_flag == 64: return DoublePrecisionPlugin() - # maybe convert the precision value - if self.precision == 16 and self.use_cpu: - if self.amp_type == AMPType.APEX: - # apex was explicitly passed, not a good idea to silently switch to native AMP - raise MisconfigurationException( - "You passed `Trainer(accelerator='cpu', precision=16, amp_type='apex')`" - " but apex AMP not supported on CPU." - ) - # this automatic switch is to ease transition between accelerator environments + if self._precision_flag == 16 and self._accelerator_flag == "cpu": rank_zero_warn( "You passed `Trainer(accelerator='cpu', precision=16)` but native AMP is not supported on CPU." " Using `precision='bf16'` instead." 
) - self.precision = "bf16" - - if self.precision in (16, "bf16"): - if self.precision == "bf16" and self.amp_type != AMPType.NATIVE: - raise MisconfigurationException( - f"You passed `Trainer(amp_type={self.amp_type.value!r}, precision='bf16')` but it's not supported." - " Try using `amp_type='native'` instead." - ) + self._precision_flag = "bf16" + if self._precision_flag in (16, "bf16"): rank_zero_info( - f"Using 16bit {self.amp_type.value} Automatic Mixed Precision (AMP)" - if self.precision == 16 + f"Using 16bit {self._amp_type_flag.value} Automatic Mixed Precision (AMP)" # type: ignore + if self._precision_flag == 16 else "Using bfloat16 Automatic Mixed Precision (AMP)" ) - if self.amp_type == AMPType.NATIVE: - device = "cpu" if self.use_cpu else "cuda" + if self._amp_type_flag == AMPType.NATIVE: + device = "cpu" if self._accelerator_flag == "cpu" else "cuda" - if self._is_sharded_training_type: - return ShardedNativeMixedPrecisionPlugin(self.precision, device) - if self._is_fully_sharded_training_type: - return FullyShardedNativeMixedPrecisionPlugin(self.precision, device) - return NativeMixedPrecisionPlugin(self.precision, device) + if isinstance(self.strategy, (DDPShardedStrategy, DDPSpawnShardedStrategy)): + return ShardedNativeMixedPrecisionPlugin(self._precision_flag, device) + if isinstance(self.strategy, DDPFullyShardedStrategy): + return FullyShardedNativeMixedPrecisionPlugin(self._precision_flag, device) + return NativeMixedPrecisionPlugin(self._precision_flag, device) - if self.amp_type == AMPType.APEX: - if self._is_sharded_training_type or self._is_fully_sharded_training_type: - raise MisconfigurationException( - "Sharded plugins are not supported with apex, please switch to `amp_backend='native'`." - ) - self.amp_level = self.amp_level or "O2" - return ApexMixedPrecisionPlugin(self.amp_level) + if self._amp_type_flag == AMPType.APEX: + self._amp_level_flag = self._amp_level_flag or "O2" + return ApexMixedPrecisionPlugin(self._amp_level_flag) raise RuntimeError("No precision set") - def select_strategy(self) -> Strategy: - if isinstance(self.distributed_backend, Accelerator) and self.distributed_backend.strategy is not None: - plugin = self.distributed_backend.strategy - elif self.use_ddp2: - plugin = DDP2Strategy(parallel_devices=self.parallel_devices, cluster_environment=self.cluster_environment) - elif self.use_ddp and self.use_deepspeed: - plugin = DeepSpeedStrategy( - cluster_environment=self.select_cluster_environment(), parallel_devices=self.parallel_devices - ) - elif self.use_ddp and self.use_bagua: - plugin = BaguaStrategy(parallel_devices=self.parallel_devices, cluster_environment=self.cluster_environment) - elif self.use_ddp: - use_slurm_ddp = self.use_ddp and self._is_slurm_managing_tasks() - use_torchelastic_ddp = self.use_ddp and TorchElasticEnvironment.detect() - use_kubeflow_ddp = self.use_ddp and KubeflowEnvironment.detect() - use_ddp_spawn = self._strategy_type == _StrategyType.DDP_SPAWN - use_ddp_cpu_spawn = use_ddp_spawn and self.use_cpu - use_tpu_spawn = self.use_tpu and self._strategy_type == _StrategyType.TPU_SPAWN - use_ddp_cpu_torch_elastic = use_ddp_cpu_spawn and TorchElasticEnvironment.detect() - use_ddp_cpu_kubeflow = use_ddp_cpu_spawn and KubeflowEnvironment.detect() - use_ddp_cpu_slurm = use_ddp_cpu_spawn and self._is_slurm_managing_tasks() - use_ddp_sharded = self._strategy_type == _StrategyType.DDP_SHARDED - use_ddp_sharded_spawn = self._strategy_type == _StrategyType.DDP_SHARDED_SPAWN - use_ddp_fully_sharded = self._strategy_type == 
_StrategyType.DDP_FULLY_SHARDED - - if use_tpu_spawn: - ddp_strategy_cls = TPUSpawnStrategy - elif use_ddp_sharded: - ddp_strategy_cls = DDPShardedStrategy - elif use_ddp_sharded_spawn: - ddp_strategy_cls = DDPSpawnShardedStrategy - elif ( - use_ddp_cpu_slurm - or use_slurm_ddp - or use_ddp_cpu_torch_elastic - or use_torchelastic_ddp - or use_kubeflow_ddp - or use_ddp_cpu_kubeflow - ): - ddp_strategy_cls = DDPStrategy - elif use_ddp_spawn or use_ddp_cpu_spawn: - ddp_strategy_cls = DDPSpawnStrategy - elif use_ddp_fully_sharded: - ddp_strategy_cls = DDPFullyShardedStrategy - else: - ddp_strategy_cls = DDPStrategy - - plugin = ddp_strategy_cls( - parallel_devices=self.parallel_devices, cluster_environment=self.cluster_environment - ) - elif self.use_dp: - plugin = DataParallelStrategy(parallel_devices=self.parallel_devices) - elif self.use_horovod: - plugin = HorovodStrategy(parallel_devices=self.parallel_devices) - elif self.use_tpu and isinstance(self.tpu_cores, list): - plugin = SingleTPUStrategy(self.tpu_id) - elif self.use_ipu: - plugin = IPUStrategy(parallel_devices=self.parallel_devices) - else: - single_gpu_ordinal = device_parser.determine_root_gpu_device(self.parallel_device_ids) - plugin = SingleDeviceStrategy(device=single_gpu_ordinal if self.use_gpu else "cpu") - return plugin - - def resolve_strategy(self, training_type: Strategy) -> Strategy: - # necessary for when the user has passed in a plugin - if hasattr(training_type, "parallel_devices") and getattr(training_type, "parallel_devices") is None: - training_type.parallel_devices = self.parallel_devices - - if hasattr(training_type, "cluster_environment") and getattr(training_type, "cluster_environment") is None: - # transfer ownership of the cluster environment to the training type - training_type.cluster_environment = self.cluster_environment - self._cluster_environment = proxy(self.cluster_environment) - - if hasattr(training_type, "num_nodes"): - # set num_nodes for training_type from trainer setting - training_type.num_nodes = self.num_nodes - - if hasattr(training_type, "sync_batchnorm"): - # set sync_batchnorm for training_type from trainer setting - training_type.sync_batchnorm = self.sync_batchnorm - - return training_type - - def select_accelerator(self) -> Accelerator: - if isinstance(self.distributed_backend, Accelerator): - # custom accelerator from user - if self._precision_plugin is not None or self._strategy is not None: - # plugins also specified by user - rank_zero_warn( - "Specified `Precision` and `TrainingType` plugins will be ignored," - " since an `Accelerator` instance was provided." 
- ) - return self.distributed_backend - - if self.use_gpu: - acc_cls = GPUAccelerator - elif self.use_tpu: - acc_cls = TPUAccelerator - elif self.use_ipu: - acc_cls = IPUAccelerator - else: - acc_cls = CPUAccelerator - - accelerator = acc_cls() - return accelerator - - def select_cluster_environment(self) -> ClusterEnvironment: - if self._cluster_environment is not None: - return self._cluster_environment - if self._is_slurm_managing_tasks(): - rank_zero_info("Multiprocessing is handled by SLURM.") - return SLURMEnvironment() - - for env_type in (BaguaEnvironment, TorchElasticEnvironment, KubeflowEnvironment, LSFEnvironment): - if env_type.detect(): - return env_type() - - return LightningEnvironment() - - def set_distributed_mode(self, strategy: Optional[str] = None): - - if strategy is None and self.is_training_type_in_plugins: - return - - if strategy is not None and strategy in StrategyRegistry: - self.distributed_backend = StrategyRegistry[strategy]["distributed_backend"] - elif strategy is not None: - self.distributed_backend = strategy - - if isinstance(self.distributed_backend, Accelerator): - return - - is_cpu_accelerator_type = self._accelerator_type and self._accelerator_type == _AcceleratorType.CPU - _use_cpu = is_cpu_accelerator_type or self.distributed_backend and "cpu" in self.distributed_backend - - if self.distributed_backend is None: - if self.has_horovodrun(): - self._set_horovod_backend() - elif self.num_gpus == 0 and self.num_nodes > 1: - self._strategy_type = _StrategyType.DDP - elif self.num_gpus == 0 and self.num_processes > 1: - self.distributed_backend = _StrategyType.DDP_SPAWN - elif self.num_gpus > 1 and not _use_cpu: - rank_zero_warn( - "You requested multiple GPUs but did not specify a backend, e.g." - ' `Trainer(strategy="dp"|"ddp"|"ddp2")`. Setting `strategy="ddp_spawn"` for you.' + def _validate_precision_choice(self) -> None: + """Validate the combination of choices for precision, AMP type, and accelerator.""" + # TODO: change exception type to ImpactableConfigurationException + if isinstance(self.accelerator, IPUAccelerator): + if self._precision_flag not in (16, 32): + raise MisconfigurationException( + f"`Trainer(accelerator='ipu', precision={self._precision_flag!r})` is not supported." ) - self.distributed_backend = _StrategyType.DDP_SPAWN - - # special case with DDP on CPUs - if self.distributed_backend == _StrategyType.DDP_CPU: - if _TPU_AVAILABLE: + if isinstance(self.accelerator, TPUAccelerator): + if self._precision_flag == 64: raise MisconfigurationException( - "`accelerator='ddp_cpu'` is not supported on TPU machines. " - "Learn more: https://github.com/PyTorchLightning/pytorch-lightning/issues/7810" + "`Trainer(accelerator='tpu', precision=64)` is not implemented." + " Please, open an issue in `https://github.com/PyTorchLightning/pytorch-lightning/issues`" + " requesting this feature." ) - if self.num_processes == 1 and self.num_nodes > 1: - self._strategy_type = _StrategyType.DDP - else: - self._strategy_type = _StrategyType.DDP_SPAWN - if self.num_gpus > 0: - rank_zero_warn( - "You requested one or more GPUs, but set `accelerator='ddp_cpu'`. Training will not use GPUs." + if self._precision_plugin_flag and not isinstance( + self._precision_plugin_flag, (TPUPrecisionPlugin, TPUBf16PrecisionPlugin) + ): + raise ValueError( + f"The `TPUAccelerator` can only be used with a `TPUPrecisionPlugin`," + f" found: {self._precision_plugin_flag}." 
) - self.parallel_device_ids = None - if self.num_processes is None: - # define the max CPU available - self.num_processes = os.cpu_count() - # special case with TPUs - elif self.has_tpu and not _use_cpu: - self._device_type = _AcceleratorType.TPU - if isinstance(self.tpu_cores, int): - self._strategy_type = _StrategyType.TPU_SPAWN - elif self.has_ipu and not _use_cpu: - self._device_type = _AcceleratorType.IPU - elif self.distributed_backend and self._strategy_type is None: - self._strategy_type = _StrategyType(self.distributed_backend) - - if self.num_gpus > 0 and not _use_cpu: - self._device_type = _AcceleratorType.GPU - - _gpu_strategy_types = (_StrategyType.DP, _StrategyType.DDP, _StrategyType.DDP_SPAWN, _StrategyType.DDP2) - # DP and DDP2 cannot run without GPU - if self.num_gpus == 0 and self._strategy_type in _gpu_strategy_types and not _use_cpu: - - if (self.num_nodes and self.num_nodes > 1) or (self.num_processes and self.num_processes > 1): - if self._strategy_type in (_StrategyType.DP, _StrategyType.DDP2): - rank_zero_warn( - f"{self._strategy_type.value!r} is not supported on CPUs, hence setting `strategy='ddp'`." - ) - self._strategy_type = _StrategyType.DDP - else: - rank_zero_warn("You are running on single node with no parallelization, so distributed has no effect.") - self._strategy_type = None - - # finished configuring self._strategy_type, check ipython environment - self.check_interactive_compatibility() - - # for DDP overwrite nb processes by requested GPUs - if self._device_type == _AcceleratorType.GPU and self._strategy_type in ( - _StrategyType.DDP, - _StrategyType.DDP_SPAWN, + if ( + self._precision_flag == 16 + and isinstance(self.accelerator, CPUAccelerator) + and self._amp_type_flag == AMPType.APEX ): - self.num_processes = self.num_gpus - - if self._device_type == _AcceleratorType.GPU and self._strategy_type == _StrategyType.DDP2: - self.num_processes = self.num_nodes - - # Horovod is an extra case... - if self.distributed_backend == _StrategyType.HOROVOD: - self._set_horovod_backend() - - using_valid_distributed = self.use_ddp or self.use_ddp2 - if self.num_nodes > 1 and not using_valid_distributed: - # throw error to force user to choose a supported strategy type such as ddp or ddp2 raise MisconfigurationException( - "Your chosen strategy does not support `num_nodes > 1`. Please set `strategy=('ddp'|'ddp2')`." + "You passed `Trainer(accelerator='cpu', precision=16, amp_type='apex')`" + " but apex AMP not supported on CPU." ) + if self._precision_flag == "bf16" and self._amp_type_flag != AMPType.NATIVE: + raise MisconfigurationException( + f"You passed `Trainer(amp_type={self._amp_type_flag.value!r}, precision='bf16')` but " # type: ignore + "it's not supported. Try using `amp_type='native'` instead." + ) + if self._precision_flag in (16, "bf16") and self._amp_type_flag == AMPType.APEX: + if isinstance(self.strategy, (DDPShardedStrategy, DDPSpawnShardedStrategy, DDPFullyShardedStrategy)): + raise MisconfigurationException( + "Sharded plugins are not supported with apex, please switch to `amp_backend='native'`." 
+ ) - def _set_horovod_backend(self): - self.check_horovod() - self._strategy_type = _StrategyType.HOROVOD - - # Initialize Horovod to get rank / size info - hvd.init() - if self.has_gpu: - # Horovod assigns one local GPU per process - self.parallel_device_ids = list(range(hvd.local_size())) - else: - self.num_processes = hvd.local_size() + def _lazy_init_strategy(self) -> None: + """Lazily set missing attributes on the previously instantiated strategy.""" + self.strategy.accelerator = self.accelerator + if self.precision_plugin: + self.strategy.precision_plugin = self.precision_plugin + if self.checkpoint_io: + self.strategy.checkpoint_io = self.checkpoint_io + if hasattr(self.strategy, "cluster_environment"): + self.strategy.cluster_environment = self.cluster_environment + if hasattr(self.strategy, "parallel_devices"): + if self.strategy.parallel_devices: + self._parallel_devices = self.strategy.parallel_devices + else: + self.strategy.parallel_devices = self._parallel_devices + if hasattr(self.strategy, "num_nodes"): + self.strategy._num_nodes = self._num_nodes_flag + if hasattr(self.strategy, "sync_batchnorm"): + self.strategy.sync_batchnorm = self.sync_batchnorm + if hasattr(self.strategy, "set_world_ranks"): + self.strategy.set_world_ranks() + self.strategy._configure_launcher() - def check_interactive_compatibility(self): - """Raises a `MisconfigurationException` if the accelerator and/or plugin is not compatible with an - interactive environment.""" from pytorch_lightning.utilities import _IS_INTERACTIVE - if _IS_INTERACTIVE and self._strategy_type is not None and not self._strategy_type.is_interactive_compatible(): + # TODO move is_compatible logic to strategy API + interactive_compatible_strategy = ( + DataParallelStrategy.strategy_name, + DDPSpawnStrategy.strategy_name, + DDPSpawnShardedStrategy.strategy_name, + TPUSpawnStrategy.strategy_name, + ) + if _IS_INTERACTIVE and self.strategy.strategy_name not in interactive_compatible_strategy: raise MisconfigurationException( - f"`Trainer(strategy={self._strategy_type.value!r})` or" - f" `Trainer(accelerator={self._strategy_type.value!r})` is not compatible with an interactive" + f"`Trainer(strategy={self.strategy.strategy_name!r})` or" + f" `Trainer(accelerator={self.strategy.strategy_name!r})` is not compatible with an interactive" " environment. Run your code as a script, or choose one of the compatible backends:" - f" {', '.join(_StrategyType.interactive_compatible_types())}." + f" {', '.join(interactive_compatible_strategy)}." " In case you are spawning processes yourself, make sure to include the Trainer" " creation inside the worker function." ) - def check_horovod(self): - """Raises a `MisconfigurationException` if the Trainer is not configured correctly for Horovod.""" - if not _HOROVOD_AVAILABLE: - raise MisconfigurationException( - 'Requested `accelerator="horovod"`, but Horovod is not installed.' - "Install with \n $HOROVOD_WITH_PYTORCH=1 pip install horovod[pytorch]" + # TODO: should be moved to _check_strategy_and_fallback(). + # Current test check precision first, so keep this check here to meet error order + if isinstance(self.accelerator, TPUAccelerator) and not isinstance( + self.strategy, (SingleTPUStrategy, TPUSpawnStrategy) + ): + raise ValueError( + "The `TPUAccelerator` can only be used with a `SingleTPUStrategy` or `TPUSpawnStrategy`," + f" found {self.strategy}." 
) - if self.num_gpus > 1 or self.num_nodes > 1: - raise MisconfigurationException( - "Horovod does not support setting num_nodes / num_gpus explicitly. Use " - "horovodrun / mpirun to configure the number of processes." - ) + """The following properties are here for backward-compatibility and will be deprecated and removed in favor + of accessing this information through the strategy/accelerator directly.""" + # TODO: deprecate all properties below - @staticmethod - def has_horovodrun() -> bool: - """Returns True if running with `horovodrun` using Gloo or OpenMPI.""" - return _HOROVOD_AVAILABLE and ("OMPI_COMM_WORLD_RANK" in os.environ or "HOROVOD_RANK" in os.environ) - - def update_device_type_if_ipu_plugin(self) -> None: - # This allows the poptorch.Options that are passed into the IPUStrategy to be the source of truth, - # which gives users the flexibility to not have to pass `ipus` flag directly to Trainer - if isinstance(self._strategy, IPUStrategy) and self._device_type != _AcceleratorType.IPU: - self._device_type = _AcceleratorType.IPU - - def update_device_type_if_strategy_passed(self) -> None: - if isinstance(self._strategy_flag, Strategy) or any(isinstance(plug, Strategy) for plug in self.plugins): - if self._accelerator_type is not None: - if self.use_ipu: - self._device_type = _AcceleratorType.IPU - elif self.use_tpu: - self._device_type = _AcceleratorType.TPU - elif self.use_gpu: - self._device_type = _AcceleratorType.GPU - else: - if self.has_ipu: - self._device_type = _AcceleratorType.IPU - elif self.has_tpu: - self._device_type = _AcceleratorType.TPU - elif self.has_gpu: - self._device_type = _AcceleratorType.GPU - - def _set_strategy_type_if_strategy_passed(self): - # This is required as when `Strategy` instance is passed to either `strategy` - # or `plugins` flag, `AcceleratorConnector.set_distributed_mode` is not required to be - # called and `_strategy_type` is not set. - if self._strategy_type is not None: - return - if self._strategy is not None: - self._strategy_type = getattr(self._strategy, "distributed_backend", None) + @property + def parallel_devices(self) -> List[Union[torch.device, int]]: + return self._parallel_devices - def _is_slurm_managing_tasks(self) -> bool: - """Returns whether we let SLURM manage the processes or not. 
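The properties in this region are kept only for backward compatibility: rather than reading cached flags such as `_device_type` or `_strategy_type`, each one now derives its answer from the already-built `accelerator` and `strategy` objects. A small self-contained sketch of that delegation pattern, using hypothetical stand-in classes instead of the real Lightning types:

from dataclasses import dataclass, field
from typing import List

@dataclass
class _StubStrategy:
    parallel_devices: List[int] = field(default_factory=list)

class _StubGPUAccelerator:
    pass

@dataclass
class _StubConnector:
    accelerator: object
    strategy: _StubStrategy

    @property
    def device_type(self) -> str:
        # derived from the accelerator instance, not from a stored flag
        return "gpu" if isinstance(self.accelerator, _StubGPUAccelerator) else "cpu"

    @property
    def devices(self) -> int:
        return len(self.strategy.parallel_devices) or 1

    @property
    def num_gpus(self) -> int:
        return self.devices if isinstance(self.accelerator, _StubGPUAccelerator) else 0

conn = _StubConnector(_StubGPUAccelerator(), _StubStrategy(parallel_devices=[0, 1]))
assert (conn.device_type, conn.devices, conn.num_gpus) == ("gpu", 2, 2)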
+ @property + def device_type(self) -> str: + if isinstance(self.accelerator, CPUAccelerator): + return "cpu" + if isinstance(self.accelerator, GPUAccelerator): + return "gpu" + if isinstance(self.accelerator, TPUAccelerator): + return "tpu" + if isinstance(self.accelerator, IPUAccelerator): + return "ipu" - Returns ``True`` if and only if these conditions match: + @property + def num_nodes(self) -> int: + return self._num_nodes_flag - - A SLURM cluster is detected - - A distributed plugin is being used - - The process is not launching in interactive mode - - The number of tasks in SLURM matches the requested number of devices and nodes in the Trainer - """ - if ( - (not self.use_ddp and not self.use_ddp2) - or not SLURMEnvironment.detect() - or SLURMEnvironment.job_name() == "bash" # in interactive mode we don't manage tasks - ): - return False + @property + def num_processes(self) -> int: + return self.devices if self.devices is not None else 1 - total_requested_devices = (self.num_gpus or self.num_processes) * self.num_nodes - num_slurm_tasks = int(os.environ["SLURM_NTASKS"], 0) - return num_slurm_tasks == total_requested_devices + @property + def root_gpu(self) -> Optional[int]: + return ( + self.strategy.root_device.index + if not isinstance(self.accelerator, (IPUAccelerator, TPUAccelerator)) + else None + ) - def _check_plugin_compatibility(self) -> None: - """Checks that selected plugins are compatible with each other. + @property + def devices(self) -> int: + if isinstance(self.strategy, SingleDeviceStrategy): + return 1 + elif isinstance(self.strategy, ParallelStrategy): + return len(self.strategy.parallel_devices) + return 0 - Raises: - ValueError: If an invalid combination of Accelerator, Strategy, PrecisionPlugin is found. - """ + @property + def tpu_cores(self) -> Optional[Union[List[int], int]]: if isinstance(self.accelerator, TPUAccelerator): - if not isinstance(self.strategy.precision_plugin, TPUPrecisionPlugin): - raise ValueError( - f"The `TPUAccelerator` can only be used with a `TPUPrecisionPlugin`," - f" found: {self.strategy.precision_plugin}." - ) - if not isinstance(self.strategy, (SingleTPUStrategy, TPUSpawnStrategy)): - raise ValueError( - "The `TPUAccelerator` can only be used with a `SingleTPUStrategy` or `TPUSpawnStrategy`," - f" found {self.strategy}." - ) + return self._tpu_cores # type: ignore + return 0 + + @property + def tpu_id(self) -> Optional[int]: + if isinstance(self.accelerator, TPUAccelerator): + if isinstance(self._tpu_cores, list): + return self._tpu_cores[0] + return None + + @property + def num_ipus(self) -> int: + if isinstance(self.accelerator, IPUAccelerator): + return self.devices + return 0 + + @property + def num_gpus(self) -> int: + if isinstance(self.accelerator, GPUAccelerator): + return self.devices + return 0 + + @property + def gpus(self) -> Optional[Union[List[int], str, int]]: + return self._gpus + + @property + def parallel_device_ids(self) -> List[int]: + return [i for i in range(len(self.parallel_devices))] if isinstance(self.accelerator, GPUAccelerator) else [] + + @property + def is_distributed(self) -> bool: + # Used for custom plugins. + # Custom plugins should implement is_distributed property. 
+ if hasattr(self.strategy, "is_distributed") and not isinstance(self.accelerator, TPUAccelerator): + return self.strategy.is_distributed + distributed_strategy = ( + DDP2Strategy, + DDPStrategy, + DDPSpawnShardedStrategy, + DDPShardedStrategy, + DDPFullyShardedStrategy, + DDPSpawnStrategy, + DeepSpeedStrategy, + TPUSpawnStrategy, + HorovodStrategy, + ) + is_distributed = isinstance(self.strategy, distributed_strategy) + if isinstance(self.accelerator, TPUAccelerator): + is_distributed |= self.strategy.is_distributed + return is_distributed + + @property + def has_ipu(self) -> bool: + return isinstance(self.accelerator, IPUAccelerator) and isinstance(self.strategy, IPUStrategy) + + @property + def use_ipu(self) -> bool: + return isinstance(self.accelerator, IPUAccelerator) + + @property + def has_tpu(self) -> bool: + return isinstance(self.accelerator, TPUAccelerator) + + @property + def use_dp(self) -> bool: + return isinstance(self.strategy, DataParallelStrategy) + + @property + def _strategy_type(self) -> _StrategyType: + return self.strategy.strategy_name diff --git a/pytorch_lightning/trainer/trainer.py b/pytorch_lightning/trainer/trainer.py index 658c7ed4d09ca..6ed5d6c31f719 100644 --- a/pytorch_lightning/trainer/trainer.py +++ b/pytorch_lightning/trainer/trainer.py @@ -138,7 +138,7 @@ def __init__( gradient_clip_algorithm: Optional[str] = None, process_position: int = 0, num_nodes: int = 1, - num_processes: int = 1, + num_processes: Optional[int] = None, devices: Optional[Union[List[int], str, int]] = None, gpus: Optional[Union[List[int], str, int]] = None, auto_select_gpus: bool = False, @@ -435,23 +435,23 @@ def __init__( self._data_connector = DataConnector(self, multiple_trainloader_mode) self._accelerator_connector = AcceleratorConnector( - num_processes, - devices, - tpu_cores, - ipus, - accelerator, - strategy, - gpus, - gpu_ids, - num_nodes, - sync_batchnorm, - benchmark, - replace_sampler_ddp, - deterministic, - precision, - amp_backend, - amp_level, - plugins, + num_processes=num_processes, + devices=devices, + tpu_cores=tpu_cores, + ipus=ipus, + accelerator=accelerator, + strategy=strategy, + gpus=gpus, + gpu_ids=gpu_ids, + num_nodes=num_nodes, + sync_batchnorm=sync_batchnorm, + benchmark=benchmark, + replace_sampler_ddp=replace_sampler_ddp, + deterministic=deterministic, + precision=precision, + amp_type=amp_backend, + amp_level=amp_level, + plugins=plugins, ) self.logger_connector = LoggerConnector(self, log_gpu_memory) self._callback_connector = CallbackConnector(self) @@ -1964,12 +1964,12 @@ def should_rank_save_checkpoint(self) -> bool: ) @property - def _strategy_type(self) -> _StrategyType: - return self._accelerator_connector._strategy_type + def _strategy_type(self) -> str: + return self.strategy.strategy_name @property def _device_type(self) -> _AcceleratorType: - return self._accelerator_connector._device_type + return self._accelerator_connector.device_type @property def num_nodes(self) -> int: @@ -2001,7 +2001,9 @@ def devices(self) -> Optional[Union[List[int], str, int]]: @property def data_parallel_device_ids(self) -> Optional[List[int]]: - return self._accelerator_connector.parallel_device_ids + return ( + self._accelerator_connector.parallel_device_ids if self._accelerator_connector.parallel_device_ids else None + ) @property def lightning_module(self) -> "pl.LightningModule": diff --git a/pytorch_lightning/utilities/device_parser.py b/pytorch_lightning/utilities/device_parser.py index 6fa9ace7f20ec..d7b8a319ea4d2 100644 --- 
a/pytorch_lightning/utilities/device_parser.py +++ b/pytorch_lightning/utilities/device_parser.py @@ -19,9 +19,10 @@ from pytorch_lightning.tuner.auto_gpu_select import pick_multiple_gpus from pytorch_lightning.utilities import _TPU_AVAILABLE from pytorch_lightning.utilities.exceptions import MisconfigurationException +from pytorch_lightning.utilities.types import _DEVICE -def determine_root_gpu_device(gpus: List[int]) -> Optional[int]: +def determine_root_gpu_device(gpus: List[_DEVICE]) -> Optional[_DEVICE]: """ Args: gpus: non-empty list of ints representing which gpus to use @@ -164,7 +165,7 @@ def _sanitize_gpu_ids(gpus: List[int]) -> List[int]: for gpu in gpus: if gpu not in all_available_gpus: raise MisconfigurationException( - f"You requested GPUs: {gpus}\n But your machine only has: {all_available_gpus}" + f"You requested gpu: {gpus}\n But your machine only has: {all_available_gpus}" ) return gpus diff --git a/tests/accelerators/test_accelerator_connector.py b/tests/accelerators/test_accelerator_connector.py index 8ceb2de96c59c..76fa6d64f5a56 100644 --- a/tests/accelerators/test_accelerator_connector.py +++ b/tests/accelerators/test_accelerator_connector.py @@ -445,18 +445,20 @@ def test_accelerator_choice_multi_node_gpu( assert isinstance(trainer.strategy, plugin) -@pytest.mark.skipif(torch.cuda.is_available(), reason="test doesn't require GPU") -def test_accelerator_cpu(): +@mock.patch("torch.cuda.is_available", return_value=False) +def test_accelerator_cpu(_): trainer = Trainer(accelerator="cpu") assert trainer._device_type == "cpu" assert isinstance(trainer.accelerator, CPUAccelerator) - with pytest.raises(MisconfigurationException, match="You passed `accelerator='gpu'`, but GPUs are not available"): - trainer = Trainer(accelerator="gpu") - - with pytest.raises(MisconfigurationException, match="You requested GPUs:"): + with pytest.raises(MisconfigurationException, match="You requested gpu:"): + trainer = Trainer(gpus=1) + # TODO enable this test when add device availability check + # with pytest.raises(MisconfigurationException, match="You requested gpu, but gpu is not available"): + # trainer = Trainer(accelerator="gpu") + with pytest.raises(MisconfigurationException, match="You requested gpu:"): trainer = Trainer(accelerator="cpu", gpus=1) @@ -468,10 +470,8 @@ def test_accelerator_gpu(): assert trainer._device_type == "gpu" assert isinstance(trainer.accelerator, GPUAccelerator) - with pytest.raises( - MisconfigurationException, match="You passed `accelerator='gpu'`, but you didn't pass `gpus` to `Trainer`" - ): - trainer = Trainer(accelerator="gpu") + trainer = Trainer(accelerator="gpu") + assert isinstance(trainer.accelerator, GPUAccelerator) trainer = Trainer(accelerator="auto", gpus=1) @@ -552,8 +552,9 @@ def test_accelerator_gpu_with_gpus_priority(): def test_validate_accelerator_and_devices(): - with pytest.raises(MisconfigurationException, match="You passed `devices=2` but haven't specified"): - Trainer(accelerator="ddp_cpu", devices=2) + trainer = Trainer(accelerator="ddp_cpu", devices=2) + assert isinstance(trainer.accelerator, CPUAccelerator) + assert trainer.num_processes == 2 def test_set_devices_if_none_cpu(): @@ -571,8 +572,10 @@ def test_set_devices_if_none_gpu(): def test_devices_with_cpu_only_supports_integer(): - with pytest.raises(MisconfigurationException, match="The flag `devices` must be an int"): - Trainer(accelerator="cpu", devices="1,3") + with pytest.warns(UserWarning, match="The flag `devices` must be an int"): + trainer = Trainer(accelerator="cpu", 
devices="1,3") + assert isinstance(trainer.accelerator, CPUAccelerator) + assert trainer.devices == 1 @pytest.mark.parametrize("training_type", ["ddp2", "dp"]) @@ -599,8 +602,9 @@ def test_exception_when_strategy_used_with_accelerator(): def test_exception_when_strategy_used_with_plugins(): - with pytest.raises(MisconfigurationException, match="only specify one training type plugin, but you have passed"): - Trainer(plugins="ddp_find_unused_parameters_false", strategy="ddp_spawn") + with pytest.raises(MisconfigurationException, match="only specify one strategy, but you have passed"): + with pytest.deprecated_call(match=r"`strategy` to the `plugins` flag in Trainer has been deprecated"): + Trainer(plugins="ddp_find_unused_parameters_false", strategy="ddp_spawn") def test_exception_invalid_strategy(): @@ -896,13 +900,14 @@ def test_unsupported_tpu_choice(monkeypatch): with pytest.raises(MisconfigurationException, match=r"accelerator='tpu', precision=64\)` is not implemented"): Trainer(accelerator="tpu", precision=64) + # if user didn't set strategy, AcceleratorConnector will choose the TPUSingleStrategy or TPUSpawnStrategy with pytest.raises(ValueError, match="TPUAccelerator` can only be used with a `SingleTPUStrategy`"): with pytest.warns(UserWarning, match=r"accelerator='tpu', precision=16\)` but native AMP is not supported"): - Trainer(accelerator="tpu", precision=16) + Trainer(accelerator="tpu", precision=16, strategy="ddp") with pytest.raises(ValueError, match="TPUAccelerator` can only be used with a `SingleTPUStrategy`"): with pytest.warns(UserWarning, match=r"accelerator='tpu', precision=16\)` but apex AMP is not supported"): - Trainer(accelerator="tpu", precision=16, amp_backend="apex") + Trainer(accelerator="tpu", precision=16, amp_backend="apex", strategy="single_device") def test_unsupported_ipu_choice(monkeypatch): @@ -934,3 +939,11 @@ def test_devices_auto_choice_gpu(is_gpu_available_mock, device_count_mock): trainer = Trainer(accelerator="auto", devices="auto") assert trainer.devices == 2 assert trainer.gpus == 2 + + +def test_passing_zero_and_empty_list_to_devices_flag(): + with pytest.warns(UserWarning, match=r"switching to `cpu` accelerator"): + Trainer(accelerator="gpu", devices=0) + + with pytest.warns(UserWarning, match=r"switching to `cpu` accelerator"): + Trainer(accelerator="gpu", devices=[]) diff --git a/tests/accelerators/test_ipu.py b/tests/accelerators/test_ipu.py index 861b149733c0c..b8f01815704f5 100644 --- a/tests/accelerators/test_ipu.py +++ b/tests/accelerators/test_ipu.py @@ -116,7 +116,7 @@ def test_accelerator_selected(tmpdir): @RunIf(ipu=True) def test_warning_if_ipus_not_used(tmpdir): with pytest.warns(UserWarning, match="IPU available but not used. 
Set the `ipus` flag in your trainer"): - Trainer(default_root_dir=tmpdir) + Trainer(default_root_dir=tmpdir, accelerator="cpu") @RunIf(ipu=True) @@ -505,10 +505,8 @@ def test_accelerator_ipu(): assert trainer._device_type == "ipu" assert isinstance(trainer.accelerator, IPUAccelerator) - with pytest.raises( - MisconfigurationException, match="You passed `accelerator='ipu'`, but you didn't pass `ipus` to `Trainer`" - ): - trainer = Trainer(accelerator="ipu") + trainer = Trainer(accelerator="ipu") + assert isinstance(trainer.accelerator, IPUAccelerator) trainer = Trainer(accelerator="auto", ipus=8) diff --git a/tests/accelerators/test_tpu.py b/tests/accelerators/test_tpu.py index 608d98304c757..d8f99ec4dcedb 100644 --- a/tests/accelerators/test_tpu.py +++ b/tests/accelerators/test_tpu.py @@ -13,7 +13,7 @@ # limitations under the License import collections from copy import deepcopy -from unittest.mock import Mock, patch +from unittest.mock import patch import pytest import torch @@ -23,7 +23,7 @@ from pytorch_lightning import Trainer from pytorch_lightning.accelerators.cpu import CPUAccelerator from pytorch_lightning.accelerators.tpu import TPUAccelerator -from pytorch_lightning.plugins import TPUPrecisionPlugin, XLACheckpointIO +from pytorch_lightning.plugins import PrecisionPlugin, TPUPrecisionPlugin, XLACheckpointIO from pytorch_lightning.strategies import DDPStrategy, TPUSpawnStrategy from pytorch_lightning.utilities import find_shared_parameters from pytorch_lightning.utilities.exceptions import MisconfigurationException @@ -90,10 +90,8 @@ def test_accelerator_tpu(): assert trainer._device_type == "tpu" assert isinstance(trainer.accelerator, TPUAccelerator) - with pytest.raises( - MisconfigurationException, match="You passed `accelerator='tpu'`, but you didn't pass `tpu_cores` to `Trainer`" - ): - trainer = Trainer(accelerator="tpu") + trainer = Trainer(accelerator="tpu") + assert isinstance(trainer.accelerator, TPUAccelerator) @RunIf(tpu=True) @@ -231,9 +229,14 @@ def test_ddp_cpu_not_supported_on_tpus(): @RunIf(tpu=True) -@pytest.mark.parametrize("strategy", ["ddp_spawn", "tpu_spawn_debug"]) -def test_strategy_choice_tpu_str(tmpdir, strategy): - trainer = Trainer(strategy=strategy, accelerator="tpu", devices=8) +def test_strategy_choice_tpu_str_ddp_spawn(tmpdir): + with pytest.raises(ValueError, match="TPUAccelerator` can only be used with a `SingleTPUStrategy`"): + Trainer(strategy="ddp_spawn", accelerator="tpu", devices=8) + + +@RunIf(tpu=True) +def test_strategy_choice_tpu_str_tpu_spawn_debug(tmpdir): + trainer = Trainer(strategy="tpu_spawn_debug", accelerator="tpu", devices=8) assert isinstance(trainer.strategy, TPUSpawnStrategy) @@ -290,27 +293,27 @@ def forward(self, x): def test_tpu_invalid_raises(): - training_type_plugin = TPUSpawnStrategy(accelerator=TPUAccelerator(), precision_plugin=Mock()) + strategy = TPUSpawnStrategy(accelerator=TPUAccelerator(), precision_plugin=PrecisionPlugin()) with pytest.raises(ValueError, match="TPUAccelerator` can only be used with a `TPUPrecisionPlugin"): - Trainer(strategy=training_type_plugin) + Trainer(strategy=strategy) - training_type_plugin = DDPStrategy(accelerator=TPUAccelerator(), precision_plugin=TPUPrecisionPlugin()) + strategy = DDPStrategy(accelerator=TPUAccelerator(), precision_plugin=TPUPrecisionPlugin()) with pytest.raises(ValueError, match="TPUAccelerator` can only be used with a `SingleTPUStrategy`"): - Trainer(strategy=training_type_plugin) + Trainer(strategy=strategy) def test_tpu_invalid_raises_set_precision_with_strategy(): 
accelerator = TPUAccelerator() - training_type_plugin = TPUSpawnStrategy(accelerator=accelerator, precision_plugin=object()) + strategy = TPUSpawnStrategy(accelerator=accelerator, precision_plugin=PrecisionPlugin()) with pytest.raises(ValueError, match="`TPUAccelerator` can only be used with a `TPUPrecisionPlugin`"): - Trainer(strategy=training_type_plugin) + Trainer(strategy=strategy) accelerator = TPUAccelerator() - training_type_plugin = DDPStrategy(accelerator=accelerator, precision_plugin=TPUPrecisionPlugin()) + strategy = DDPStrategy(accelerator=accelerator, precision_plugin=TPUPrecisionPlugin()) with pytest.raises( ValueError, match="The `TPUAccelerator` can only be used with a `SingleTPUStrategy` or `TPUSpawnStrategy" ): - Trainer(strategy=training_type_plugin) + Trainer(strategy=strategy) @RunIf(tpu=True) diff --git a/tests/models/test_gpu.py b/tests/models/test_gpu.py index c494c0c1c18e6..d17322e191ff1 100644 --- a/tests/models/test_gpu.py +++ b/tests/models/test_gpu.py @@ -242,7 +242,7 @@ def test_torchelastic_gpu_parsing(mocked_device_count, mocked_is_available, gpus sanitizing the gpus as only one of the GPUs is visible.""" trainer = Trainer(gpus=gpus) assert isinstance(trainer._accelerator_connector.cluster_environment, TorchElasticEnvironment) - assert trainer._accelerator_connector.parallel_device_ids == device_parser.parse_gpu_ids(gpus) + assert trainer.data_parallel_device_ids == device_parser.parse_gpu_ids(gpus) assert trainer.gpus == gpus diff --git a/tests/strategies/test_deepspeed_strategy.py b/tests/strategies/test_deepspeed_strategy.py index 5eed2578546ba..e5306b0942131 100644 --- a/tests/strategies/test_deepspeed_strategy.py +++ b/tests/strategies/test_deepspeed_strategy.py @@ -167,7 +167,12 @@ def test_deepspeed_precision_choice(amp_backend, precision, tmpdir): """ trainer = Trainer( - fast_dev_run=True, default_root_dir=tmpdir, strategy="deepspeed", amp_backend=amp_backend, precision=precision + fast_dev_run=True, + default_root_dir=tmpdir, + accelerator="gpu", + strategy="deepspeed", + amp_backend=amp_backend, + precision=precision, ) assert isinstance(trainer.strategy, DeepSpeedStrategy) diff --git a/tests/strategies/test_strategy_registry.py b/tests/strategies/test_strategy_registry.py index ab0629b28b698..89422b3719a29 100644 --- a/tests/strategies/test_strategy_registry.py +++ b/tests/strategies/test_strategy_registry.py @@ -31,7 +31,7 @@ def test_strategy_registry_with_new_strategy(): class TestStrategy: - distributed_backend = "test_strategy" + strategy_name = "test_strategy" def __init__(self, param1, param2): self.param1 = param1 @@ -45,7 +45,7 @@ def __init__(self, param1, param2): assert strategy_name in StrategyRegistry assert StrategyRegistry[strategy_name]["description"] == strategy_description assert StrategyRegistry[strategy_name]["init_params"] == {"param1": "abc", "param2": 123} - assert StrategyRegistry[strategy_name]["distributed_backend"] == "test_strategy" + assert StrategyRegistry[strategy_name]["strategy_name"] == "test_strategy" assert isinstance(StrategyRegistry.get(strategy_name), TestStrategy) StrategyRegistry.remove(strategy_name) diff --git a/tests/trainer/flags/test_env_vars.py b/tests/trainer/flags/test_env_vars.py index bbcc5447d03ce..0e9e6469d67a8 100644 --- a/tests/trainer/flags/test_env_vars.py +++ b/tests/trainer/flags/test_env_vars.py @@ -53,4 +53,4 @@ def test_passing_env_variables_devices(cuda_available_mock, device_count_mock): trainer = Trainer() assert trainer.devices == 2 trainer = Trainer(accelerator="gpu", devices=1) 
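The registry test changes above reflect the rename from `distributed_backend` to `strategy_name`: a strategy class now advertises its name via `strategy_name`, and the registry records it under that key. A hedged usage sketch for registering a custom strategy, assuming `StrategyRegistry` is importable from `pytorch_lightning.strategies` and that extra keyword arguments to `register()` are stored as `init_params`, as the assertions above imply:

from pytorch_lightning.strategies import DDPStrategy, StrategyRegistry

class MyDDPStrategy(DDPStrategy):
    strategy_name = "my_ddp"  # replaces the old `distributed_backend` class attribute

StrategyRegistry.register(
    "my_ddp_no_unused_params",
    MyDDPStrategy,
    description="custom DDP variant",
    find_unused_parameters=False,  # recorded under ["init_params"]
)

assert "my_ddp_no_unused_params" in StrategyRegistry
strategy = StrategyRegistry.get("my_ddp_no_unused_params")  # instantiated with the stored init_params
assert isinstance(strategy, MyDDPStrategy)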
- assert trainer.devices == 1 + assert trainer.devices == 2 diff --git a/tests/trainer/test_trainer.py b/tests/trainer/test_trainer.py index 587ff0b7b9f72..0d2d8bbdc55b6 100644 --- a/tests/trainer/test_trainer.py +++ b/tests/trainer/test_trainer.py @@ -47,7 +47,7 @@ DDPStrategy, ) from pytorch_lightning.trainer.states import TrainerFn -from pytorch_lightning.utilities import _AcceleratorType, _StrategyType +from pytorch_lightning.utilities import _AcceleratorType from pytorch_lightning.utilities.cloud_io import load as pl_load from pytorch_lightning.utilities.exceptions import DeadlockDetectedException, MisconfigurationException from pytorch_lightning.utilities.imports import _IS_WINDOWS, _OMEGACONF_AVAILABLE, _TORCH_GREATER_EQUAL_1_8 @@ -1177,81 +1177,75 @@ def val_dataloader(self): [ ( dict(accelerator=None, gpus=None), - dict(_strategy_type=None, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="single_device", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(accelerator="dp", gpus=None), - dict(_strategy_type=None, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(accelerator="ddp", gpus=None), - dict(_strategy_type=None, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(accelerator="ddp", num_processes=2, gpus=None), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(accelerator="ddp", num_nodes=2, gpus=None), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(accelerator="ddp_cpu", num_processes=2, gpus=None), - dict( - _strategy_type=_StrategyType.DDP_SPAWN, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2 - ), + dict(_strategy_type="ddp_spawn", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(accelerator="ddp2", gpus=None), - dict(_strategy_type=None, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(accelerator=None, gpus=1), - dict(_strategy_type=None, _device_type=_AcceleratorType.GPU, num_gpus=1, num_processes=1), + dict(_strategy_type="single_device", _device_type=_AcceleratorType.GPU, num_gpus=1), ), ( dict(accelerator="dp", gpus=1), - dict(_strategy_type=_StrategyType.DP, _device_type=_AcceleratorType.GPU, num_gpus=1, num_processes=1), + dict(_strategy_type="dp", _device_type=_AcceleratorType.GPU, num_gpus=1), ), ( dict(accelerator="ddp", gpus=1), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.GPU, num_gpus=1, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.GPU, num_gpus=1), ), ( dict(accelerator="ddp_cpu", num_processes=2, gpus=1), - dict( - _strategy_type=_StrategyType.DDP_SPAWN, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2 - ), + dict(_strategy_type="ddp_spawn", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(accelerator="ddp2", gpus=1), - dict(_strategy_type=_StrategyType.DDP2, _device_type=_AcceleratorType.GPU, num_gpus=1, num_processes=1), + dict(_strategy_type="ddp2", _device_type=_AcceleratorType.GPU, num_gpus=1), ), ( 
dict(accelerator=None, gpus=2), - dict( - _strategy_type=_StrategyType.DDP_SPAWN, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=2 - ), + dict(_strategy_type="ddp_spawn", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(accelerator="dp", gpus=2), - dict(_strategy_type=_StrategyType.DP, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=1), + dict(_strategy_type="dp", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(accelerator="ddp", gpus=2), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=2), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(accelerator="ddp2", gpus=2), - dict(_strategy_type=_StrategyType.DDP2, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=1), + dict(_strategy_type="ddp2", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(accelerator="ddp2", num_processes=2, gpus=None), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(accelerator="dp", num_processes=2, gpus=None), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ], ) @@ -1264,9 +1258,9 @@ def test_trainer_config(trainer_kwargs, expected, monkeypatch): else: with pytest.deprecated_call(match=r"accelerator='.*'\)` has been deprecated in v1.5"): trainer = Trainer(**trainer_kwargs) - assert len(expected) == 4 + assert len(expected) == 3 for k, v in expected.items(): - assert getattr(trainer, k) == v, f"Failed {k}: {v}" + assert getattr(trainer, k) == v, f"Failed on {trainer_kwargs}, where {k}={ getattr(trainer, k)}, not {v}" def test_trainer_subclassing(): @@ -2103,146 +2097,127 @@ def training_step(self, batch, batch_idx): [ ( dict(strategy=None, gpus=None), - dict(_strategy_type=None, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="single_device", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy="dp", gpus=None), - dict(_strategy_type=None, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy="ddp", gpus=None), - dict(_strategy_type=None, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy="ddp", num_processes=2, gpus=None), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy="ddp", num_nodes=2, gpus=None), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy="ddp2", gpus=None), - dict(_strategy_type=None, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy=None, gpus=1), - dict(_strategy_type=None, _device_type=_AcceleratorType.GPU, num_gpus=1, num_processes=1), + dict(_strategy_type="single_device", _device_type=_AcceleratorType.GPU, num_gpus=1), ), ( dict(strategy="dp", gpus=1), - dict(_strategy_type=_StrategyType.DP, 
_device_type=_AcceleratorType.GPU, num_gpus=1, num_processes=1), + dict(_strategy_type="dp", _device_type=_AcceleratorType.GPU, num_gpus=1), ), ( dict(strategy="ddp", gpus=1), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.GPU, num_gpus=1, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.GPU, num_gpus=1), ), ( dict(strategy="ddp_spawn", gpus=1), - dict( - _strategy_type=_StrategyType.DDP_SPAWN, _device_type=_AcceleratorType.GPU, num_gpus=1, num_processes=1 - ), + dict(_strategy_type="ddp_spawn", _device_type=_AcceleratorType.GPU, num_gpus=1), ), ( dict(strategy="ddp2", gpus=1), - dict(_strategy_type=_StrategyType.DDP2, _device_type=_AcceleratorType.GPU, num_gpus=1, num_processes=1), + dict(_strategy_type="ddp2", _device_type=_AcceleratorType.GPU, num_gpus=1), ), ( dict(strategy=None, gpus=2), - dict( - _strategy_type=_StrategyType.DDP_SPAWN, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=2 - ), + dict(_strategy_type="ddp_spawn", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(strategy="dp", gpus=2), - dict(_strategy_type=_StrategyType.DP, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=1), + dict(_strategy_type="dp", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(strategy="ddp", gpus=2), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=2), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(strategy="ddp2", gpus=2), - dict(_strategy_type=_StrategyType.DDP2, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=1), + dict(_strategy_type="ddp2", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(strategy="ddp2", num_processes=2, gpus=None), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy="dp", num_processes=2, gpus=None), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy="ddp_spawn", num_processes=2, gpus=None), - dict( - _strategy_type=_StrategyType.DDP_SPAWN, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2 - ), + dict(_strategy_type="ddp_spawn", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy="ddp_spawn", num_processes=1, gpus=None), - dict(_strategy_type=None, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=1), + dict(_strategy_type="ddp_spawn", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy="ddp_fully_sharded", gpus=1), - dict( - _strategy_type=_StrategyType.DDP_FULLY_SHARDED, - _device_type=_AcceleratorType.GPU, - num_gpus=1, - num_processes=1, - ), + dict(_strategy_type="ddp_fully_sharded", _device_type=_AcceleratorType.GPU, num_gpus=1), ), ( dict(strategy=DDPSpawnStrategy(), num_processes=2, gpus=None), - dict( - _strategy_type=_StrategyType.DDP_SPAWN, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2 - ), + dict(_strategy_type="ddp_spawn", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy=DDPSpawnStrategy(), gpus=2), - dict( - _strategy_type=_StrategyType.DDP_SPAWN, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=1 - ), + dict(_strategy_type="ddp_spawn", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(strategy=DDPStrategy(), num_processes=2, gpus=None), - 
dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.CPU, num_gpus=0, num_processes=2), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.CPU, num_gpus=0), ), ( dict(strategy=DDPStrategy(), gpus=2), - dict(_strategy_type=_StrategyType.DDP, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=1), + dict(_strategy_type="ddp", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(strategy=DDP2Strategy(), gpus=2), - dict(_strategy_type=_StrategyType.DDP2, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=1), + dict(_strategy_type="ddp2", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(strategy=DataParallelStrategy(), gpus=2), - dict(_strategy_type=_StrategyType.DP, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=1), + dict(_strategy_type="dp", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ( dict(strategy=DDPFullyShardedStrategy(), gpus=2), dict( - _strategy_type=_StrategyType.DDP_FULLY_SHARDED, + _strategy_type="ddp_fully_sharded", _device_type=_AcceleratorType.GPU, num_gpus=2, - num_processes=1, ), ), ( dict(strategy=DDPSpawnShardedStrategy(), gpus=2), dict( - _strategy_type=_StrategyType.DDP_SHARDED_SPAWN, + _strategy_type="ddp_sharded_spawn", _device_type=_AcceleratorType.GPU, num_gpus=2, - num_processes=1, ), ), ( dict(strategy=DDPShardedStrategy(), gpus=2), - dict( - _strategy_type=_StrategyType.DDP_SHARDED, _device_type=_AcceleratorType.GPU, num_gpus=2, num_processes=1 - ), + dict(_strategy_type="ddp_sharded", _device_type=_AcceleratorType.GPU, num_gpus=2), ), ], ) @@ -2251,6 +2226,6 @@ def test_trainer_config_strategy(trainer_kwargs, expected, monkeypatch): monkeypatch.setattr(torch.cuda, "is_available", lambda: True) monkeypatch.setattr(torch.cuda, "device_count", lambda: trainer_kwargs["gpus"]) trainer = Trainer(**trainer_kwargs) - assert len(expected) == 4 + assert len(expected) == 3 for k, v in expected.items(): - assert getattr(trainer, k) == v, f"Failed {k}: {v}" + assert getattr(trainer, k) == v, f"Failed on {trainer_kwargs}, where {k}={ getattr(trainer, k)}, not {v}" diff --git a/tests/trainer/test_trainer_cli.py b/tests/trainer/test_trainer_cli.py index 25221f8111f96..b5713893f769b 100644 --- a/tests/trainer/test_trainer_cli.py +++ b/tests/trainer/test_trainer_cli.py @@ -163,7 +163,7 @@ def test_argparse_args_parsing_fast_dev_run(cli_args, expected): @pytest.mark.parametrize( ["cli_args", "expected_parsed", "expected_device_ids"], - [("", None, None), ("--accelerator gpu --devices 1", "1", [0]), ("--accelerator gpu --devices 0,", "0,", [0])], + [("", None, None), ("--accelerator gpu --devices 1", "1", [0]), ("--accelerator gpu --devices 0,", "0,", None)], ) @RunIf(min_gpus=1) def test_argparse_args_parsing_devices(cli_args, expected_parsed, expected_device_ids): diff --git a/tests/utilities/test_cli.py b/tests/utilities/test_cli.py index 5ef2cf98cf3e7..2803c0c4601c1 100644 --- a/tests/utilities/test_cli.py +++ b/tests/utilities/test_cli.py @@ -324,7 +324,7 @@ def test_lightning_cli_args_cluster_environments(tmpdir): class TestModel(BoringModel): def on_fit_start(self): # Ensure SLURMEnvironment is set, instead of default LightningEnvironment - assert isinstance(self.trainer._accelerator_connector._cluster_environment, SLURMEnvironment) + assert isinstance(self.trainer._accelerator_connector.cluster_environment, SLURMEnvironment) self.trainer.ran_asserts = True with mock.patch("sys.argv", ["any.py", "fit", f"--trainer.plugins={json.dumps(plugins)}"]): @@ -580,8 +580,11 @@ def on_fit_start(self): 
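The `test_lightning_cli_args_cluster_environments` update below tracks the connector attribute rename from `_cluster_environment` to `cluster_environment`. A hedged sketch of inspecting which environment was chosen, assuming that a `ClusterEnvironment` instance passed through `plugins` is honored as-is (which is what `_choose_and_init_cluster_environment` earlier in this diff does):

from pytorch_lightning import Trainer
from pytorch_lightning.plugins.environments import SLURMEnvironment

# An explicitly passed ClusterEnvironment short-circuits auto-detection.
trainer = Trainer(plugins=[SLURMEnvironment()])
assert isinstance(trainer._accelerator_connector.cluster_environment, SLURMEnvironment)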
@pytest.mark.parametrize( "trainer_kwargs", ( - dict(strategy="ddp_spawn"), - dict(strategy="ddp"), + # dict(strategy="ddp_spawn") + # dict(strategy="ddp") + # the previous accl_conn will choose singleDeviceStrategy for both strategy=ddp/ddp_spawn + # TODO revisit this test as it never worked with DDP or DDPSpawn + dict(strategy="single_device"), pytest.param({"tpu_cores": 1}, marks=RunIf(tpu=True)), ), )