# Provenance: __init__.py from a fork of pytorch/rl (89 lines, 88 loc, 2.09 KB).
# Copyright (c) Meta Platforms, Inc. and affiliates.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.
from .postprocs import MultiStep
from .replay_buffers import (
Flat2TED,
FlatStorageCheckpointer,
H5Combine,
H5Split,
H5StorageCheckpointer,
ImmutableDatasetWriter,
LazyMemmapStorage,
LazyTensorStorage,
ListStorage,
ListStorageCheckpointer,
Nested2TED,
NestedStorageCheckpointer,
PrioritizedReplayBuffer,
PrioritizedSampler,
PrioritizedSliceSampler,
RandomSampler,
RemoteTensorDictReplayBuffer,
ReplayBuffer,
ReplayBufferEnsemble,
RoundRobinWriter,
SamplerEnsemble,
SamplerWithoutReplacement,
SliceSampler,
SliceSamplerWithoutReplacement,
Storage,
StorageCheckpointerBase,
StorageEnsemble,
StorageEnsembleCheckpointer,
TED2Flat,
TED2Nested,
TensorDictMaxValueWriter,
TensorDictPrioritizedReplayBuffer,
TensorDictReplayBuffer,
TensorDictRoundRobinWriter,
TensorStorage,
TensorStorageCheckpointer,
Writer,
WriterEnsemble,
)
from .rlhf import (
AdaptiveKLController,
ConstantKLController,
create_infinite_iterator,
get_dataloader,
PairwiseDataset,
PromptData,
PromptTensorDictTokenizer,
RewardData,
RolloutFromModel,
TensorDictTokenizer,
TokenizedDatasetLoader,
)
from .tensor_specs import (
Binary,
BinaryDiscreteTensorSpec,
Bounded,
BoundedTensorSpec,
Categorical,
Composite,
CompositeSpec,
DEVICE_TYPING,
DiscreteTensorSpec,
LazyStackedCompositeSpec,
LazyStackedTensorSpec,
MultiCategorical,
MultiDiscreteTensorSpec,
MultiOneHot,
MultiOneHotDiscreteTensorSpec,
NonTensor,
NonTensorSpec,
OneHot,
OneHotDiscreteTensorSpec,
Stacked,
StackedComposite,
TensorSpec,
Unbounded,
UnboundedContinuous,
UnboundedContinuousTensorSpec,
UnboundedDiscrete,
UnboundedDiscreteTensorSpec,
)
from .utils import check_no_exclusive_keys, consolidate_spec, contains_lazy_spec