# _utils_internal.py (forked from pytorch/rl)
# Copyright (c) Meta Platforms, Inc. and affiliates.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.
import os
import time
from functools import wraps
# Get relative file path
# this returns relative path from current file.
import pytest
import torch.cuda
from torchrl._utils import seed_generator
from torchrl.data import CompositeSpec
from torchrl.data.tensordict.tensordict import TensorDictBase
from torchrl.envs import EnvBase
# Specified for test_utils.py
# NOTE(review): presumably a placeholder version string that test_utils.py reads - confirm there.
__version__ = "0.3"
def get_relative_path(curr_file, *path_components):
    """Build a path rooted at the directory that contains ``curr_file``.

    Args:
        curr_file: path of the reference file (e.g. ``__file__``).
        *path_components: path segments appended, in order, to the directory
            of ``curr_file``.

    Returns:
        The joined path as a string.
    """
    base_dir = os.path.dirname(curr_file)
    return os.path.join(base_dir, *path_components)
def get_available_devices():
    """List the devices tests can run on: the CPU first, then every CUDA device.

    Returns:
        A list of ``torch.device`` objects. The first entry is always
        ``torch.device("cpu")``; it is followed by ``cuda:0`` ... ``cuda:{n-1}``
        where ``n`` is ``torch.cuda.device_count()``.
    """
    devices = [torch.device("cpu")]
    # range(0) is empty, so no explicit "is there any GPU" guard is required.
    devices.extend(
        torch.device(f"cuda:{index}") for index in range(torch.cuda.device_count())
    )
    return devices
def generate_seeds(seed, repeat):
    """Produce a chain of seeds that starts with ``seed``.

    Each subsequent seed is obtained by feeding the previous one to
    ``seed_generator``.

    Args:
        seed: the initial seed; always the first element of the result.
        repeat: requested number of seeds. ``repeat - 1`` new seeds are
            derived, so any value below 2 yields just ``[seed]``.

    Returns:
        The list of seeds, in generation order.
    """
    seeds = [seed]
    # One derivation per additional seed: same count as range(repeat - 1).
    for _ in range(1, repeat):
        seeds.append(seed_generator(seeds[-1]))
    return seeds
def _test_fake_tensordict(env: EnvBase):
    """Assert that ``env.fake_tensordict()`` is consistent with a real rollout.

    Both tensordicts are flattened with ``"."`` as separator, then compared on:
    their key sets, their (zeroed) content, the shape of every entry, and
    finally the dtype of every rollout entry against the environment specs
    (through ``_check_dtype``).

    Args:
        env: the environment under test.

    Raises:
        AssertionError: if any of the comparisons fails.
    """
    fake = env.fake_tensordict().flatten_keys(".")
    real = env.rollout(3).flatten_keys(".")

    fake_keys = set(fake.keys())
    real_keys = set(real.keys())
    assert fake_keys == real_keys

    # Expand the fake tensordict with the same size (3) that was passed to
    # ``rollout``, then zero both sides so only structure is compared.
    fake = fake.expand(3).to_tensordict()
    fake.zero_()
    real.zero_()
    assert (fake == real).all()

    for name in real_keys:
        assert fake[name].shape == real[name].shape

    # test dtypes
    for name, entry in real.unflatten_keys(".").items():
        _check_dtype(name, entry, env.observation_spec, env.input_spec)
def _check_dtype(key, value, obs_spec, input_spec):
if key.startswith("next_"):
return
if isinstance(value, TensorDictBase):
for _key, _value in value.items():
if isinstance(obs_spec, CompositeSpec) and "next_" + key in obs_spec.keys():
_check_dtype(_key, _value, obs_spec["next_" + key], input_spec=None)
elif isinstance(input_spec, CompositeSpec) and key in input_spec.keys():
_check_dtype(_key, _value, obs_spec=None, input_spec=input_spec[key])
else:
raise KeyError(f"key '{_key}' is unknown.")
else:
if obs_spec is not None and "next_" + key in obs_spec.keys():
assert (
obs_spec["next_" + key].dtype is value.dtype
), f"{obs_spec['next_' + key].dtype} vs {value.dtype} for {key}"
elif input_spec is not None and key in input_spec.keys():
assert (
input_spec[key].dtype is value.dtype
), f"{input_spec[key].dtype} vs {value.dtype} for {key}"
else:
assert key in {"done", "reward"}, (key, obs_spec, input_spec)
# Decorator to retry upon certain Exceptions.
def retry(ExceptionToCheck, tries=3, delay=3, skip_after_retries=False):
    """Build a decorator that re-runs a callable when it raises ``ExceptionToCheck``.

    Args:
        ExceptionToCheck: exception class (or tuple of classes) that triggers
            a new attempt. Any other exception propagates immediately.
        tries: total number of attempts, the first call included.
        delay: number of seconds slept between two attempts.
        skip_after_retries: if ``True``, ``pytest.skip`` is called once every
            attempt has failed instead of re-raising the last exception.

    Returns:
        A decorator. The decorated callable returns the result of the first
        successful attempt.

    Raises:
        ExceptionToCheck: from the decorated callable, when the last attempt
            fails and ``skip_after_retries`` is ``False``.
    """

    def deco_retry(f):
        @wraps(f)
        def f_retry(*args, **kwargs):
            remaining = tries
            # Every attempt but the last one reports the failure and waits.
            while remaining > 1:
                try:
                    return f(*args, **kwargs)
                except ExceptionToCheck as e:
                    # Plain interpolation keeps fractional delays readable
                    # ("%d" would print a 0.5 s delay as "0").
                    print(f"{e}, Retrying in {delay} seconds...")
                    time.sleep(delay)
                    remaining -= 1
            # Last attempt: a failure is final.
            try:
                return f(*args, **kwargs)
            except ExceptionToCheck as e:
                if skip_after_retries:
                    # pytest.skip raises by itself; no explicit ``raise`` needed.
                    pytest.skip(f"Skipping after {tries} consecutive {str(e)}")
                raise

        return f_retry  # true decorator

    return deco_retry