예제 #1
0
def test_aggregation_from_distributed_zero_full_precision_adam(
        device='cuda',
        checkpoint_dir='checkpoint_dir/distributed_zero/full_precision/adam/'):
    """Load the checkpoint in ``checkpoint_dir`` and check its aggregation.

    The checkpoint is loaded through ``create_orttrainer_and_load_checkpoint``
    with ``use_lamb=False``; the resulting state dictionary is then handed to
    ``test_zero_aggregation`` with ``is_mixedprecision=False``.

    Args:
        device: Device identifier stored under ``opts['device']['id']`` and
            passed to the loader.
        checkpoint_dir: Directory the checkpoint is read from.
    """
    trainer_options = {}
    trainer_options['device'] = {'id': device}
    trainer_options['debug'] = {'deterministic_compute': True}

    # Only the loaded state dictionary is compared; the second value returned
    # by the loader is not used by this test.
    loaded_state_dict, _ = create_orttrainer_and_load_checkpoint(
        device, trainer_options, checkpoint_dir, use_lamb=False)

    test_zero_aggregation(
        checkpoint_dir, loaded_state_dict, is_mixedprecision=False)
def test_aggregation_from_distributed_zero_full_precision_lamb(
        device="cuda",
        checkpoint_dir="checkpoint_dir/distributed_zero/full_precision/lamb/"):
    """Load the checkpoint in ``checkpoint_dir`` and check its aggregation.

    The checkpoint is loaded through ``create_orttrainer_and_load_checkpoint``
    with ``use_lamb=True``; the resulting state dictionary is then handed to
    ``test_zero_aggregation`` with ``is_mixedprecision=False``.

    Args:
        device: Device identifier stored under ``opts["device"]["id"]`` and
            passed to the loader.
        checkpoint_dir: Directory the checkpoint is read from.
    """
    trainer_options = {
        "device": {"id": device},
        "debug": {"deterministic_compute": True},
    }

    # The loader returns a pair; only its first element (the state
    # dictionary) is needed for the comparison below.
    load_result = create_orttrainer_and_load_checkpoint(
        device, trainer_options, checkpoint_dir, use_lamb=True)
    loaded_state_dict, _ = load_result

    test_zero_aggregation(
        checkpoint_dir, loaded_state_dict, is_mixedprecision=False)