Python Trainer.cumulative_training_time示例

编程语言: Python

命名空间/包名称: fairseq.trainer

类/类型: Trainer

方法/功能: cumulative_training_time

hotexamples.com的示例: 2

Python Trainer.cumulative_training_time - 已找到2个示例。以下是从开源项目中提取的、最受好评的 fairseq.trainer.Trainer.cumulative_training_time 真实 Python 用法示例。您可以为这些示例评分，以帮助我们提高示例质量。

常用方法

显示/隐藏

Trainer(30)

lr_step(30)

get_lr(30)

get_num_updates(25)

get_train_iterator(21)

get_model(16)

dummy_train_step(12)

load_checkpoint(4)

_prepare_sample(2)

get_valid_iterator(2)

begin_valid_epoch(2)

cumulative_training_time(2)

begin_epoch(2)

n_validations_since_best(1)

meters_to_device(1)

_model(1)

lr_reinit(1)

load_model_only(1)

init_meters(1)

get_meter(1)

_build_optimizer(1)

get_dec_lr(1)

freeze_old_model(1)

fim(1)

early_stopping(1)

dec_lr_step(1)

best_sari(1)

prepare_ewc(1)

示例#1

显示文件

文件： train.py 项目： lvassertail/natsum

def validate_and_save(
    cfg: DictConfig,
    trainer: Trainer,
    task: tasks.FairseqTask,
    epoch_itr,
    valid_subsets: List[str],
    end_of_epoch: bool,
) -> Tuple[List[Optional[float]], bool]:
    """Decide whether to validate, checkpoint and/or stop, then act on it.

    Training is flagged to stop when the update count reaches
    ``cfg.optimization.max_update``, when the cumulative training time
    (converted to hours) exceeds a positive ``cfg.optimization.stop_time_hours``,
    or when ``should_stop_early`` says so for the first validation loss.

    Args:
        cfg: configuration; the ``optimization``, ``checkpoint`` and
            ``dataset`` groups are read here.
        trainer: supplies the update count and the cumulative training time,
            and is forwarded to ``validate`` / ``save_checkpoint``.
        task: forwarded to ``validate``.
        epoch_itr: epoch iterator; only its ``epoch`` attribute is read here.
        valid_subsets: forwarded to ``validate``.
        end_of_epoch: whether this call happens at the end of an epoch.

    Returns:
        ``(valid_losses, should_stop)`` where ``valid_losses`` is whatever
        ``validate`` returned, or ``[None]`` when validation was skipped.
    """
    seconds_per_hour = 60 * 60
    updates_done = trainer.get_num_updates()
    # A falsy max_update means "no limit".
    update_limit = cfg.optimization.max_update or math.inf

    def _on_update_boundary(interval):
        # True when a positive interval evenly divides a non-zero update count.
        return interval > 0 and updates_done > 0 and updates_done % interval == 0

    # Stopping conditions known before validation; early stopping is added
    # further down once a validation loss is available.
    should_stop = False
    if updates_done >= update_limit:
        should_stop = True
        logger.info(
            f"Stopping training due to num_updates: {updates_done} >= max_update: {update_limit}"
        )

    hours_trained = trainer.cumulative_training_time() / seconds_per_hour
    hour_budget = cfg.optimization.stop_time_hours
    if hour_budget > 0 and hours_trained > hour_budget:
        should_stop = True
        logger.info(
            f"Stopping training due to cumulative_training_time: {hours_trained} > stop_time_hours: {hour_budget} hour(s)"
        )

    # Checkpoint on the epoch schedule, when stopping, or on the update schedule.
    if end_of_epoch and epoch_itr.epoch % cfg.checkpoint.save_interval == 0:
        do_save = True
    elif should_stop:
        do_save = True
    else:
        do_save = (
            _on_update_boundary(cfg.checkpoint.save_interval_updates)
            and updates_done >= cfg.dataset.validate_after_updates
        )

    # At the end of an epoch the epoch schedule decides; mid-epoch, any save
    # triggers a validation pass.
    if end_of_epoch:
        wants_validation = epoch_itr.epoch % cfg.dataset.validate_interval == 0
    else:
        wants_validation = do_save
    wants_validation = (
        wants_validation
        or should_stop
        or _on_update_boundary(cfg.dataset.validate_interval_updates)
    )
    do_validate = wants_validation and not cfg.dataset.disable_validation

    # When validating while keeping the N>0 best checkpoints, a save is
    # required regardless of the schedules above.
    if do_validate and not do_save:
        do_save = cfg.checkpoint.keep_best_checkpoints > 0

    # Validate
    valid_losses = (
        validate(cfg, trainer, task, epoch_itr, valid_subsets)
        if do_validate
        else [None]
    )
    first_loss = valid_losses[0]

    should_stop |= should_stop_early(cfg, first_loss)

    # Save checkpoint
    if do_save or should_stop:
        checkpoint_utils.save_checkpoint(
            cfg.checkpoint, trainer, epoch_itr, first_loss
        )

    return valid_losses, should_stop

示例#2

显示文件

文件： train.py 项目： killa1218/fairseq

def validate_and_save(
    cfg: DictConfig,
    trainer: Trainer,
    task: tasks.FairseqTask,
    epoch_itr,
    valid_subsets: List[str],
    end_of_epoch: bool,
) -> Tuple[List[Optional[float]], bool]:
    """Run validation and checkpointing for the current step as configured.

    Validation and saving follow the epoch and update intervals in ``cfg``
    and are also triggered once the update count reaches
    ``cfg.optimization.max_update``. The stop decision is made after
    validation: early stopping on the first validation loss, the update
    limit, or a positive ``cfg.optimization.stop_time_hours`` being exceeded
    by the cumulative training time (converted to hours).

    Args:
        cfg: configuration; the ``optimization``, ``checkpoint`` and
            ``dataset`` groups are read here.
        trainer: supplies the update count and the cumulative training time,
            and is forwarded to ``validate`` / ``save_checkpoint``.
        task: forwarded to ``validate``.
        epoch_itr: epoch iterator; only its ``epoch`` attribute is read here.
        valid_subsets: forwarded to ``validate``.
        end_of_epoch: whether this call happens at the end of an epoch.

    Returns:
        ``(valid_losses, should_stop)`` where ``valid_losses`` is whatever
        ``validate`` returned, or ``[None]`` when validation was skipped.
    """
    seconds_per_hour = 60 * 60
    updates_done = trainer.get_num_updates()
    # A falsy max_update means "no limit".
    update_limit = cfg.optimization.max_update or math.inf
    hit_update_cap = updates_done >= update_limit

    def _on_update_boundary(interval):
        # True when a positive interval evenly divides a non-zero update count.
        return interval > 0 and updates_done > 0 and updates_done % interval == 0

    # Checkpoint on the epoch schedule, at the update cap, or on the update
    # schedule.
    if end_of_epoch and epoch_itr.epoch % cfg.checkpoint.save_interval == 0:
        do_save = True
    elif hit_update_cap:
        do_save = True
    else:
        do_save = (
            _on_update_boundary(cfg.checkpoint.save_interval_updates)
            and updates_done >= cfg.dataset.validate_after_updates
        )

    # At the end of an epoch the epoch schedule decides; mid-epoch, any save
    # triggers a validation pass.
    if end_of_epoch:
        wants_validation = epoch_itr.epoch % cfg.dataset.validate_interval == 0
    else:
        wants_validation = do_save
    wants_validation = (
        wants_validation
        or hit_update_cap
        or _on_update_boundary(cfg.dataset.validate_interval_updates)
    )
    do_validate = wants_validation and not cfg.dataset.disable_validation

    # Validate
    valid_losses = (
        validate(cfg, trainer, task, epoch_itr, valid_subsets)
        if do_validate
        else [None]
    )

    # Stopping conditions: the early-stopping check always runs first; the
    # training-time budget is consulted only when nothing else has already
    # requested a stop.
    should_stop = should_stop_early(cfg, valid_losses[0]) or hit_update_cap
    if not should_stop:
        hour_budget = cfg.optimization.stop_time_hours
        should_stop = (
            hour_budget > 0
            and trainer.cumulative_training_time() / seconds_per_hour > hour_budget
        )

    # Save checkpoint
    if do_save or should_stop:
        logger.info("begin save checkpoint")
        checkpoint_utils.save_checkpoint(
            cfg.checkpoint, trainer, epoch_itr, valid_losses[0]
        )

    return valid_losses, should_stop