def configure_ddp(self, model: LightningModule, device_ids: List[int]) -> DistributedDataParallel:
    """ Override LightningModule DDP wrapping when using model parallelism.

    Args:
        model (LightningModule): the LightningModule currently being optimized
        device_ids (List[int]): the list of GPU ids.

    Returns:
        DistributedDataParallel: DDP wrapped model
    """
    app_state = AppState()

    if app_state.model_parallel_size is not None:
        logging.info("Configuring DDP for model parallelism.")
        logging.info(f"data_parallel_group: {app_state.data_parallel_group}")
        # with model parallelism, multiple GPUs form a large "logical GPU"
        # this means that data parallel groups span multiple GPUs
        # and are non-trivial
        model = LightningDistributedDataParallel(
            model,
            device_ids,
            output_device=device_ids[0],
            process_group=app_state.data_parallel_group,
        )
        return model
    else:
        logging.info("Did not detect model parallelism, using LightningModule.configure_ddp")
        return LightningModule.configure_ddp(self, model, device_ids)
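The snippet above only rewires gradient all-reduce onto the data-parallel process group; how that group is built is left to AppState. A minimal, self-contained sketch of the same idea using plain torch.distributed (the 4-rank layout and the helper name are illustrative, not taken from the original code):

import torch
import torch.distributed as dist
from torch.nn.parallel import DistributedDataParallel

def wrap_data_parallel(module: torch.nn.Module, local_rank: int) -> DistributedDataParallel:
    # Illustrative layout: world size 4, model-parallel size 2.
    # Ranks {0, 2} and {1, 3} hold identical shards, so they form the data-parallel groups.
    my_group = None
    for ranks in ([0, 2], [1, 3]):
        group = dist.new_group(ranks=ranks)  # must be called by every rank, in the same order
        if dist.get_rank() in ranks:
            my_group = group
    # gradients are all-reduced only within the data-parallel group,
    # never across model-parallel partners
    return DistributedDataParallel(
        module, device_ids=[local_rank], output_device=local_rank, process_group=my_group
    )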
def configure_ddp( self, model: "LightningModule", device_ids: List[int] ) -> DistributedDataParallel: model = LightningDistributedDataParallel( model, device_ids=device_ids, find_unused_parameters=True ) return model
def configure_ddp(self, model, device_ids): """Override to init DDP in a different way or use your own wrapper. :param model: :param device_ids: :return: DDP wrapped model Overwrite to define your own DDP implementation init. The only requirement is that: 1. On a validation batch the call goes to model.validation_step. 2. On a training batch the call goes to model.training_step. 3. On a testing batch, the call goes to model.test_step .. code-block:: python def configure_ddp(self, model, device_ids): # Lightning DDP simply routes to test_step, val_step, etc... model = LightningDistributedDataParallel( model, device_ids=device_ids, find_unused_parameters=True ) return model """ model = LightningDistributedDataParallel(model, device_ids=device_ids, find_unused_parameters=True) return model
def configure_ddp( self, model: LightningModule, device_ids: List[int]) -> LightningDistributedDataParallel: """ Pass through all customizations from constructor to `LightningDistributedDataParallel`. Override to define a custom DDP implementation. .. note:: Only requirement is that your DDP implementation subclasses LightningDistributedDataParallel The default implementation is:: def configure_ddp(self, model, device_ids): model = LightningDistributedDataParallel( model, device_ids=device_ids, find_unused_parameters=False ) return model Args: model: the lightningModule device_ids: the list of devices available Returns: the model wrapped in LightningDistributedDataParallel """ # if unset, default `find_unused_parameters` `False` self._ddp_kwargs["find_unused_parameters"] = self._ddp_kwargs.get( "find_unused_parameters", False) model = LightningDistributedDataParallel( model, device_ids=device_ids, **self._ddp_kwargs, ) return model
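Because configure_ddp forwards self._ddp_kwargs verbatim, DDP options can be set from the plugin constructor instead of overriding the method. A hedged usage sketch, assuming a PyTorch Lightning release around 1.1-1.2 where DDPPlugin accepts arbitrary DDP keyword arguments and is passed via Trainer(plugins=...):

from pytorch_lightning import Trainer
from pytorch_lightning.plugins import DDPPlugin

# kwargs given here end up in self._ddp_kwargs and are forwarded
# through configure_ddp into LightningDistributedDataParallel
trainer = Trainer(
    gpus=2,
    accelerator="ddp",
    plugins=[DDPPlugin(find_unused_parameters=False)],
)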
def block_backward_sync(self, model: LightningDistributedDataParallel):
    """
    Blocks DDP gradient synchronisation on the backward pass.
    This is useful for skipping the sync when accumulating gradients, reducing communication overhead.

    Returns:
        context manager with sync behaviour off
    """
    yield model.no_sync()
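The skip-sync behaviour ultimately comes from torch's DistributedDataParallel.no_sync() context manager. A minimal sketch of the gradient-accumulation pattern it enables (the helper and its arguments are illustrative, not part of the plugin API):

import torch
import torch.nn.functional as F
from torch.nn.parallel import DistributedDataParallel

def accumulate_then_step(ddp_model: DistributedDataParallel, optimizer, batches, accumulate_grad_batches: int):
    for i, (x, y) in enumerate(batches):
        loss = F.mse_loss(ddp_model(x), y)
        if (i + 1) % accumulate_grad_batches != 0:
            # intermediate micro-batch: skip the gradient all-reduce
            with ddp_model.no_sync():
                loss.backward()
        else:
            # last micro-batch of the window: sync gradients, then step
            loss.backward()
            optimizer.step()
            optimizer.zero_grad()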
def configure_ddp(self, model, device_ids):
    model = LightningDistributedDataParallel(
        model, device_ids=device_ids, find_unused_parameters=True
    )
    return model
def _distributed_model(self, model: pl.LightningModule) -> LightningDistributedDataParallel:
    model = LightningDistributedDataParallel(
        model, device_ids=[0], find_unused_parameters=True
    )
    return model
def configure_ddp( self, model: LightningModule, device_ids: List[int]) -> LightningDistributedDataParallel: """ Override to define a custom DDP implementation. .. note:: Only requirement is that your DDP implementation subclasses LightningDistributedDataParallel The default implementation is:: def configure_ddp(self, model, device_ids): model = LightningDistributedDataParallel( model, device_ids=device_ids, find_unused_parameters=True ) return model Args: model: the lightningModule device_ids: the list of devices available Returns: the model wrapped in LightningDistributedDataParallel """ model = LightningDistributedDataParallel(model, device_ids=device_ids, find_unused_parameters=True) return model
def _configure_ddp(self, models, device_ids, ddp_args=None):
    assert len(models) == 1
    model = models[0]
    assert isinstance(model, ptl.LightningModule)
    model = LightningDistributedDataParallel(
        model, device_ids=device_ids, find_unused_parameters=True
    )
    return [model]
def configure_ddp(self, model, device_ids):
    # if unset in kwargs, `find_unused_parameters` defaults to `False`
    self._ddp_kwargs["find_unused_parameters"] = self._ddp_kwargs.get(
        "find_unused_parameters", False
    )
    # unpack the whole kwargs dict, not just the `find_unused_parameters` entry
    model = LightningDistributedDataParallel(
        model,
        device_ids=device_ids,
        **self._ddp_kwargs,
    )
    return model
def configure_ddp(self, model: LightningModule, device_ids: List[int]) -> DistributedDataParallel:
    logging.info(
        f'overriding ddp to set find_unused_parameters to {self._cfg.find_unused_parameters}'
    )
    model = LightningDistributedDataParallel(
        model,
        device_ids=device_ids,
        find_unused_parameters=self._cfg.find_unused_parameters,
    )
    return model
def configure_ddp(self):
    # old, deprecated implementation
    with pytest.deprecated_call(
        match='`LightningDistributedDataParallel` is deprecated since v1.2 and will be removed in v1.4.'
    ):
        self._model = LightningDistributedDataParallel(
            module=self.lightning_module,
            device_ids=self.determine_ddp_device_ids(),
            **self._ddp_kwargs,
        )
        assert isinstance(self.model, torch.nn.parallel.DistributedDataParallel)
        assert isinstance(self.model.module, LightningDistributedModule)
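For contrast with the deprecated path exercised above, the replacement wraps the LightningModule in LightningDistributedModule and hands it to torch's own DistributedDataParallel. A rough sketch, assuming the PyTorch Lightning 1.2-era plugin attributes used in the test:

from torch.nn.parallel import DistributedDataParallel
from pytorch_lightning.overrides import LightningDistributedModule

def configure_ddp(self):
    # non-deprecated equivalent: plain torch DDP around a LightningDistributedModule
    self._model = DistributedDataParallel(
        LightningDistributedModule(self.lightning_module),
        device_ids=self.determine_ddp_device_ids(),
        **self._ddp_kwargs,
    )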
def configure_ddp(self, model, device_ids): r""" Override to init DDP in your own way or with your own wrapper. The only requirements are that: 1. On a validation batch the call goes to model.validation_step. 2. On a training batch the call goes to model.training_step. 3. On a testing batch, the call goes to model.test_step Args: model (LightningModule): the LightningModule currently being optimized device_ids (list): the list of GPU ids Return: DDP wrapped model Example ------- .. code-block:: python # default implementation used in Trainer def configure_ddp(self, model, device_ids): # Lightning DDP simply routes to test_step, val_step, etc... model = LightningDistributedDataParallel( model, device_ids=device_ids, find_unused_parameters=True ) return model """ model = LightningDistributedDataParallel( model, device_ids=device_ids, find_unused_parameters=True ) return model
def on_after_manual_backward(self, model: LightningDistributedDataParallel):
    model.reducer_reset_hooks()
def on_before_manual_backward(self, model: LightningDistributedDataParallel, output: Any):
    model.reducer_prepare_for_backwards(output)