forked from yaroslavvb/stuff
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
1 parent
4640980
commit 32d4585
Showing
1 changed file
with
62 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,62 @@ | ||
import subprocess, re, os, sys | ||
|
||
# GPU picking | ||
# http://stackoverflow.com/a/41638727/419116 | ||
# Nvidia-smi GPU memory parsing. | ||
# Tested on nvidia-smi 370.23 | ||
|
||
def run_command(cmd): | ||
"""Run command, return output as string.""" | ||
|
||
output = subprocess.Popen(cmd, stdout=subprocess.PIPE, shell=True).communicate()[0] | ||
return output.decode("ascii") | ||
|
||
def list_available_gpus(): | ||
"""Returns list of available GPU ids.""" | ||
|
||
output = run_command("nvidia-smi -L") | ||
# lines of the form GPU 0: TITAN X | ||
gpu_regex = re.compile(r"GPU (?P<gpu_id>\d+):") | ||
result = [] | ||
for line in output.strip().split("\n"): | ||
m = gpu_regex.match(line) | ||
assert m, "Couldnt parse "+line | ||
result.append(int(m.group("gpu_id"))) | ||
return result | ||
|
||
def gpu_memory_map(): | ||
"""Returns map of GPU id to memory allocated on that GPU.""" | ||
|
||
output = run_command("nvidia-smi") | ||
gpu_output = output[output.find("GPU Memory"):] | ||
# lines of the form | ||
# | 0 8734 C python 11705MiB | | ||
memory_regex = re.compile(r"[|]\s+?(?P<gpu_id>\d+)\D+?(?P<pid>\d+).+[ ](?P<gpu_memory>\d+)MiB") | ||
rows = gpu_output.split("\n") | ||
result = {gpu_id: 0 for gpu_id in list_available_gpus()} | ||
for row in gpu_output.split("\n"): | ||
m = memory_regex.search(row) | ||
if not m: | ||
continue | ||
gpu_id = int(m.group("gpu_id")) | ||
gpu_memory = int(m.group("gpu_memory")) | ||
result[gpu_id] += gpu_memory | ||
return result | ||
|
||
def pick_gpu_lowest_memory(): | ||
"""Returns GPU with the least allocated memory""" | ||
|
||
memory_gpu_map = [(memory, gpu_id) for (gpu_id, memory) in gpu_memory_map().items()] | ||
best_memory, best_gpu = sorted(memory_gpu_map)[0] | ||
return best_gpu | ||
|
||
def setup_one_gpu(): | ||
assert not 'tensorflow' in sys.modules, "GPU setup must happen before importing TensorFlow" | ||
gpu_id = pick_gpu_lowest_memory() | ||
print("Picking GPU "+str(gpu_id)) | ||
os.environ["CUDA_VISIBLE_DEVICES"] = str(gpu_id) | ||
|
||
def setup_no_gpu(): | ||
if 'tensorflow' in sys.modules: | ||
print("Warning, GPU setup must happen before importing TensorFlow") | ||
os.environ["CUDA_VISIBLE_DEVICES"] = '' |