Python ElasticRayExecutor.start示例

编程语言: Python

命名空间/包名称: horovod.ray.elastic

方法/功能: start

hotexamples.com的示例: 2

Python ElasticRayExecutor.start - 共找到2个示例。以下是从开源项目中提取的、最受好评的 horovod.ray.elastic.ElasticRayExecutor.start 真实Python代码示例。您可以为这些示例评分，以帮助我们提高示例质量。

常用方法

显示隐藏

ElasticRayExecutor(2)

create_settings(2)

run(2)

start(2)

示例#1

显示文件

文件： test_ray_elastic.py 项目： zuston/horovod

def test_gpu_e2e(ray_8_cpus_gpus):
    """End-to-end run of ElasticRayExecutor with one GPU per slot.

    Installs a SimpleTestDiscovery built from a three-stage host schedule,
    starts the executor, runs a 100-iteration training function, and checks
    that four results come back and that the fetched event log contains
    exactly four "started" and four "finished" entries.
    """
    # Each stage pairs a number (None for the last stage) with a list of
    # "host:slots" strings.
    # NOTE(review): the first element is presumably how long the stage lasts;
    # confirm against SimpleTestDiscovery.
    host_schedule = [
        (20, ['host-1:1']),
        (60, ['host-1:1', 'host-4:1', 'host-5:1']),
        (None, ['host-1:1', 'host-4:1', 'host-5:1', 'host-6:1']),
    ]

    with fault_tolerance_patches():
        # Use the first interface name psutil reports on this machine.
        first_nic = list(psutil.net_if_addrs())[0]

        elastic_settings = ElasticRayExecutor.create_settings(
            min_np=4, max_np=4, nics={first_nic})
        # Replace the discovery with the scripted one; override_discovery is
        # False below so the executor is asked not to override it.
        elastic_settings.discovery = SimpleTestDiscovery(host_schedule)

        executor = ElasticRayExecutor(
            elastic_settings,
            gpus_per_slot=1,
            use_gpu=True,
            override_discovery=False,
        )

        logger, training_fn = _create_training_function(iterations=100)
        executor.start()
        results = executor.run(training_fn)
        assert len(results) == 4

        events = ray.get(logger.fetch.remote())
        # "started" is verified before "finished", as two separate assertions.
        for marker in ("started", "finished"):
            matching = [e for e in events if marker in e]
            assert len(matching) == 4, events

示例#2

显示文件

def test_min_np(ray_8_cpus):
    """Run ElasticRayExecutor with min_np == max_np == 4 on CPU slots.

    Installs a SimpleTestDiscovery built from a three-stage host schedule,
    starts the executor, runs a 30-iteration training function with a
    StatusCallback attached, and checks that four results come back and that
    the callback's events contain exactly four "started" and four "finished"
    entries.
    """
    # Each stage pairs a number (None for the last stage) with a list of
    # "host:slots" strings.
    # NOTE(review): the first element is presumably how long the stage lasts;
    # confirm against SimpleTestDiscovery.
    host_schedule = [
        (10, ['host-1:1']),
        (10, ['host-1:1', 'host-4:1', 'host-5:1']),
        (None, ['host-1:1', 'host-4:1', 'host-5:1', 'host-6:1']),
    ]

    with fault_tolerance_patches():
        # Use the first interface name psutil reports on this machine.
        first_nic = list(psutil.net_if_addrs())[0]

        elastic_settings = ElasticRayExecutor.create_settings(
            min_np=4, max_np=4, nics={first_nic})
        # Replace the discovery with the scripted one; override_discovery is
        # False below so the executor is asked not to override it.
        elastic_settings.discovery = SimpleTestDiscovery(host_schedule)

        executor = ElasticRayExecutor(
            elastic_settings,
            cpus_per_slot=1,
            override_discovery=False,
        )

        training_fn = _create_training_function(iterations=30)
        executor.start()
        # The callback is created only after the executor has been started.
        trace = StatusCallback()
        results = executor.run(training_fn, callbacks=[trace])
        assert len(results) == 4

        events = trace.fetch()
        # "started" is verified before "finished", as two separate assertions.
        for marker in ("started", "finished"):
            matching = [e for e in events if marker in e]
            assert len(matching) == 4, events