trlX
docs
Contents:
Data Elements
RL Models
Orchestrators
Configs
Pipelines
Examples
trlX
»
Index
Edit on GitHub
Index
A
|
B
|
C
|
E
|
F
|
G
|
I
|
L
|
M
|
O
|
P
|
S
|
T
A
AccelerateILQLModel (class in trlx.model.accelerate_ilql_model)
AcceleratePPOModel (class in trlx.model.accelerate_ppo_model)
AccelerateRLBatchElement (class in trlx.data.accelerate_base_datatypes)
AccelerateRLElement (class in trlx.data.accelerate_base_datatypes)
AccelerateRLModel (class in trlx.model.accelerate_base_model)
act() (trlx.model.BaseRLModel method)
add_eval_pipeline() (trlx.model.accelerate_base_model.AccelerateRLModel method)
B
BasePipeline (class in trlx.pipeline)
BaseRLModel (class in trlx.model)
BaseRolloutStore (class in trlx.pipeline)
C
CausalLMWithValueHeads (class in trlx.model.nn.ilql_models)
create_loader() (trlx.pipeline.BasePipeline method)
create_loader() (trlx.pipeline.BaseRolloutStore method)
create_loader() (trlx.pipeline.offline_pipeline.ILQLRolloutStorage method)
create_loader() (trlx.pipeline.offline_pipeline.PromptPipeline method)
create_loader() (trlx.pipeline.ppo_pipeline.PPORolloutStorage method)
E
evaluate() (trlx.model.accelerate_base_model.AccelerateRLModel method)
F
forward() (trlx.model.nn.ilql_models.CausalLMWithValueHeads method)
forward() (trlx.model.nn.ppo_models.GPTHeadWithValueModel method)
forward() (trlx.model.nn.ppo_models.GPTHydraHeadWithValueModel method)
forward() (trlx.model.nn.ppo_models.ModelBranch method)
G
generate() (trlx.model.accelerate_base_model.AccelerateRLModel method)
generate() (trlx.model.nn.ilql_models.CausalLMWithValueHeads method)
get_arch() (trlx.model.accelerate_base_model.AccelerateRLModel method)
get_arch() (trlx.model.accelerate_ilql_model.AccelerateILQLModel method)
get_arch() (trlx.model.accelerate_ppo_model.AcceleratePPOModel method)
get_components() (trlx.model.accelerate_base_model.AccelerateRLModel method)
get_components() (trlx.model.BaseRLModel method)
GPTHeadWithValueModel (class in trlx.model.nn.ppo_models)
GPTHydraHeadWithValueModel (class in trlx.model.nn.ppo_models)
I
ILQLBatch (class in trlx.data.ilql_types)
ILQLConfig (class in trlx.data.method_configs)
ILQLElement (class in trlx.data.ilql_types)
ILQLRolloutStorage (class in trlx.pipeline.offline_pipeline)
intervals() (trlx.model.BaseRLModel method)
L
learn() (trlx.model.accelerate_base_model.AccelerateRLModel method)
learn() (trlx.model.BaseRLModel method)
load() (trlx.model.BaseRLModel method)
load_yaml() (trlx.data.configs.TRLConfig class method)
loss() (trlx.model.accelerate_base_model.AccelerateRLModel method)
loss() (trlx.model.accelerate_ilql_model.AccelerateILQLModel method)
loss() (trlx.model.accelerate_ppo_model.AcceleratePPOModel method)
M
make_experience() (trlx.orchestrator.offline_orchestrator.OfflineOrchestrator method)
make_experience() (trlx.orchestrator.Orchestrator method)
make_experience() (trlx.orchestrator.ppo_orchestrator.PPOOrchestrator method)
MethodConfig (class in trlx.data.method_configs)
ModelBranch (class in trlx.model.nn.ppo_models)
ModelConfig (class in trlx.data.configs)
O
OfflineOrchestrator (class in trlx.orchestrator.offline_orchestrator)
Orchestrator (class in trlx.orchestrator)
P
post_backward_callback() (trlx.model.accelerate_base_model.AccelerateRLModel method)
post_backward_callback() (trlx.model.accelerate_ilql_model.AccelerateILQLModel method)
post_backward_callback() (trlx.model.accelerate_ppo_model.AcceleratePPOModel method)
post_epoch_callback() (trlx.model.accelerate_base_model.AccelerateRLModel method)
post_epoch_callback() (trlx.model.accelerate_ppo_model.AcceleratePPOModel method)
PPOConfig (class in trlx.data.method_configs)
PPOOrchestrator (class in trlx.orchestrator.ppo_orchestrator)
PPORLBatch (class in trlx.data.ppo_types)
PPORLElement (class in trlx.data.ppo_types)
PPORolloutStorage (class in trlx.pipeline.ppo_pipeline)
PromptBatch (class in trlx.data.accelerate_base_datatypes)
PromptElement (class in trlx.data.accelerate_base_datatypes)
PromptPipeline (class in trlx.pipeline.offline_pipeline)
push() (trlx.pipeline.BaseRolloutStore method)
push() (trlx.pipeline.ppo_pipeline.PPORolloutStorage method)
S
sample() (trlx.model.BaseRLModel method)
save() (trlx.model.accelerate_base_model.AccelerateRLModel method)
save() (trlx.model.BaseRLModel method)
score() (trlx.orchestrator.ppo_orchestrator.PPOOrchestrator method)
T
to_dict() (trlx.data.configs.TRLConfig method)
tokenize() (trlx.model.accelerate_base_model.AccelerateRLModel method)
tokenize() (trlx.model.accelerate_ilql_model.AccelerateILQLModel method)
TrainConfig (class in trlx.data.configs)
TRLConfig (class in trlx.data.configs)
Read the Docs
v: docs
Versions
latest
stable
docs
Downloads
On Read the Docs
Project Home
Builds