def Prepare(benchmark_spec):
  """Prepare the VMs for the NCCL benchmark and write the host file.

  Flags the spec so cleanup is always called. When _NCCL_TESTS.value is
  truthy, PrepareVm is run over every VM through vm_util.RunThreaded.
  Finally the machine file is created at HOSTFILE, passing
  nvidia_driver.QueryNumberOfGpus as the second argument of
  hpc_util.CreateMachineFile.

  Args:
    benchmark_spec: The benchmark specification.
  """
  benchmark_spec.always_call_cleanup = True
  vms = benchmark_spec.vms
  if _NCCL_TESTS.value:
    vm_util.RunThreaded(PrepareVm, vms)
  hpc_util.CreateMachineFile(vms, nvidia_driver.QueryNumberOfGpus, HOSTFILE)
def Prepare(benchmark_spec):
  """Install IOR on all VMs and set up the machine file.

  Installs the 'ior' package on every VM through vm_util.RunThreaded, creates
  the machine file with hpc_util.CreateMachineFile, and then calls
  AuthenticateVm on the first VM.

  Args:
    benchmark_spec: The benchmark specification. Contains all data that is
      required to run the benchmark.
  """
  vms = benchmark_spec.vms
  # Resolved up front so an empty VM list fails before any install work.
  head_vm = vms[0]

  def _InstallIor(vm):
    return vm.Install('ior')

  vm_util.RunThreaded(_InstallIor, vms)
  hpc_util.CreateMachineFile(vms)
  head_vm.AuthenticateVm()
def Prepare(benchmark_spec):
  """Set up Horovod on every VM and write the machine file.

  Runs _PrepareHorovod over the VMs, applies the flag values to the spec via
  _UpdateBenchmarkSpecWithFlags, runs _CopyAndUpdateRunScripts for each VM
  with benchmark_spec.model, and creates the machine file at MACHINEFILE.

  Args:
    benchmark_spec: The benchmark specification.
  """
  vms = benchmark_spec.vms
  vm_util.RunThreaded(_PrepareHorovod, vms)
  _UpdateBenchmarkSpecWithFlags(benchmark_spec)

  def _CopyScripts(vm):
    # benchmark_spec.model is read at call time, after the flag update above.
    return _CopyAndUpdateRunScripts(benchmark_spec.model, vm)

  def _GpusPerNode(unused_vm):
    return benchmark_spec.gpus_per_node

  vm_util.RunThreaded(_CopyScripts, vms)
  hpc_util.CreateMachineFile(vms, _GpusPerNode, MACHINEFILE)
def Prepare(benchmark_spec):
  """Install SHOC on the VMs and push the machine file.

  Runs _InstallAndAuthenticateVm over every VM, stores the GPU count queried
  from the first VM on benchmark_spec.num_gpus, and creates the machine file
  at MACHINEFILE with a callback that returns that stored count.

  Args:
    benchmark_spec: The benchmark specification. Contains all data that is
      required to run the benchmark.
  """
  vms = benchmark_spec.vms
  vm_util.RunThreaded(_InstallAndAuthenticateVm, vms)
  benchmark_spec.num_gpus = cuda_toolkit_8.QueryNumberOfGpus(vms[0])

  def _NumGpus(unused_vm):
    # The same count, taken from the first VM, is reported for every VM.
    return benchmark_spec.num_gpus

  hpc_util.CreateMachineFile(vms, _NumGpus, MACHINEFILE)
def Prepare(benchmark_spec):
  """Set up HPCG on every VM and write the machine file.

  Runs _PrepareHpcg over the VMs, applies the flag values to the spec via
  _UpdateBenchmarkSpecWithFlags, calls _CopyAndUpdateRunScripts for each VM
  in turn, and creates the machine file under hpcg.HPCG_DIR.

  Args:
    benchmark_spec: The benchmark specification.
  """
  vms = benchmark_spec.vms
  vm_util.RunThreaded(_PrepareHpcg, vms)
  _UpdateBenchmarkSpecWithFlags(benchmark_spec)

  # Run scripts are copied one VM at a time, in list order.
  for vm in vms:
    _CopyAndUpdateRunScripts(vm, benchmark_spec)

  def _GpusPerNode(unused_vm):
    return benchmark_spec.gpus_per_node

  machinefile_path = os.path.join(hpcg.HPCG_DIR, MACHINEFILE)
  hpc_util.CreateMachineFile(vms, _GpusPerNode, machinefile_path)
def Prepare(benchmark_spec):
  """Install HPCC and stage what the benchmark run needs.

  The first VM is passed to PrepareHpcc and CreateHpccinf. The machine file
  is then created at MACHINEFILE for all VMs, and PrepareBinaries is called
  with the full VM list.

  Args:
    benchmark_spec: The benchmark specification. Contains all data that is
      required to run the benchmark.
  """
  all_vms = benchmark_spec.vms
  first_vm = all_vms[0]

  PrepareHpcc(first_vm)
  CreateHpccinf(first_vm, benchmark_spec)

  hpc_util.CreateMachineFile(all_vms, remote_path=MACHINEFILE)
  PrepareBinaries(all_vms)
def Prepare(benchmark_spec: bm_spec.BenchmarkSpec) -> None:
  """Install HPCC and stage what the benchmark run needs.

  The first VM is passed to PrepareHpcc and CreateHpccinf. The machine file
  is then created at MACHINEFILE for all VMs, AuthenticateVm is called on the
  first VM, and PrepareBinaries is called with the full VM list.

  Args:
    benchmark_spec: The benchmark specification. Contains all data that is
      required to run the benchmark.
  """
  all_vms = benchmark_spec.vms
  first_vm = all_vms[0]

  PrepareHpcc(first_vm)
  CreateHpccinf(first_vm, benchmark_spec)

  hpc_util.CreateMachineFile(all_vms, remote_path=MACHINEFILE)
  first_vm.AuthenticateVm()
  PrepareBinaries(all_vms)
def Prepare(benchmark_spec):
  """Prepare the VMs and other resources for running the benchmark.

  Installs 'openfoam' on every VM, authenticates the VMs, runs
  _SSH_CONFIG_CMD on each of them, and finally creates the machine file at
  _MACHINE_FILE.

  Args:
    benchmark_spec: The benchmark spec for this sample benchmark.
  """
  vms = benchmark_spec.vms

  # Each step is run over all VMs before the next step starts.
  per_vm_steps = (
      lambda vm: vm.Install('openfoam'),
      # Allow ssh access to other vms.
      lambda vm: vm.AuthenticateVm(),
      # Avoids printing ssh warnings and prevents too many auth errors.
      lambda vm: vm.RemoteCommand(_SSH_CONFIG_CMD),
  )
  for step in per_vm_steps:
    vm_util.RunThreaded(step, vms)

  # Tell mpirun about other nodes.
  hpc_util.CreateMachineFile(vms, remote_path=_MACHINE_FILE)
def Prepare(benchmark_spec):
  """Install and set up RoBERTa mmlm on the target VMs.

  Applies the flag values to the spec, flags the spec so cleanup is always
  called, and runs _PrepareVm through vm_util.RunThreaded with one
  ((benchmark_spec, rank), {}) entry per rank in
  range(benchmark_spec.num_vms). The host file is created at HOSTFILE only
  when nvidia_driver.CheckNvidiaGpuExists reports a GPU on the first VM.

  Args:
    benchmark_spec: The benchmark specification. Contains all data that is
      required to run the benchmark.
  """
  _UpdateBenchmarkSpecWithFlags(benchmark_spec)
  vms = benchmark_spec.vms
  benchmark_spec.always_call_cleanup = True

  prepare_args = [
      ((benchmark_spec, rank), {})
      for rank in range(benchmark_spec.num_vms)
  ]
  vm_util.RunThreaded(_PrepareVm, prepare_args)

  head_vm = vms[0]
  if not nvidia_driver.CheckNvidiaGpuExists(head_vm):
    return

  # The GPU count of the first VM is reported for every VM.
  gpus_per_vm = nvidia_driver.QueryNumberOfGpus(head_vm)
  hpc_util.CreateMachineFile(vms, lambda _: gpus_per_vm, HOSTFILE)