Index Symbols | A | B | C | D | E | F | G | I | L | M | P | R | S | T Symbols [Trajectory] A AccelerateILQLTrainer (class in trlx.trainer.accelerate_ilql_trainer) AcceleratePPOTrainer (class in trlx.trainer.accelerate_ppo_trainer) AccelerateRLBatchElement (class in trlx.data.accelerate_base_datatypes) AccelerateRLElement (class in trlx.data.accelerate_base_datatypes) AccelerateRLTrainer (class in trlx.trainer.accelerate_base_trainer) Action add_eval_pipeline() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) (trlx.trainer.BaseRLTrainer method) add_prompt_pipeline() (trlx.trainer.accelerate_ppo_trainer.AcceleratePPOTrainer method) Agent B BasePipeline (class in trlx.pipeline) BaseRLTrainer (class in trlx.trainer) BaseRolloutStore (class in trlx.pipeline) C CPU create_loader() (trlx.pipeline.BasePipeline method) (trlx.pipeline.BaseRolloutStore method) (trlx.pipeline.offline_pipeline.ILQLRolloutStorage method) (trlx.pipeline.offline_pipeline.PromptPipeline method) (trlx.pipeline.ppo_pipeline.PPORolloutStorage method) D decode() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) Device E Environment evaluate() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) evolve() (trlx.data.configs.TRLConfig method) F from_dict() (trlx.data.configs.TRLConfig class method) G generate() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) generate_eval() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) get_arch() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) (trlx.trainer.accelerate_ilql_trainer.AccelerateILQLTrainer method) (trlx.trainer.accelerate_ppo_trainer.AcceleratePPOTrainer method) GPU I ILQLBatch (class in trlx.data.ilql_types) ILQLElement (class in trlx.data.ilql_types) ILQLRolloutStorage (class in trlx.pipeline.offline_pipeline) L learn() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) (trlx.trainer.BaseRLTrainer method) load() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) (trlx.trainer.BaseRLTrainer method) load_yaml() (trlx.data.configs.TRLConfig class method) loss() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) (trlx.trainer.accelerate_ilql_trainer.AccelerateILQLTrainer method) (trlx.trainer.accelerate_ppo_trainer.AcceleratePPOTrainer method) M make_experience() (trlx.trainer.accelerate_ilql_trainer.AccelerateILQLTrainer method) (trlx.trainer.accelerate_ppo_trainer.AcceleratePPOTrainer method) make_experience_seq2seq() (trlx.trainer.accelerate_ilql_trainer.AccelerateILQLTrainer method) MethodConfig (class in trlx.data.method_configs) ModelConfig (class in trlx.data.configs) P Policy Policy Gradient post_backward_callback() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) (trlx.trainer.accelerate_ilql_trainer.AccelerateILQLTrainer method) (trlx.trainer.accelerate_ppo_trainer.AcceleratePPOTrainer method) post_epoch_callback() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) (trlx.trainer.accelerate_ppo_trainer.AcceleratePPOTrainer method) PPO PPORLBatch (class in trlx.data.ppo_types) PPORLElement (class in trlx.data.ppo_types) PPORolloutStorage (class in trlx.pipeline.ppo_pipeline) PromptBatch (class in trlx.data.accelerate_base_datatypes) PromptElement (class in trlx.data.accelerate_base_datatypes) PromptPipeline (class in trlx.pipeline.offline_pipeline) push() (trlx.pipeline.BaseRolloutStore method) (trlx.pipeline.ppo_pipeline.PPORolloutStorage method) R Reinforcement Learning Reward Rollout S sample() (trlx.trainer.BaseRLTrainer method) save() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) (trlx.trainer.BaseRLTrainer method) save_pretrained() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) setup_model() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) setup_optimizer() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) setup_scheduler() (trlx.trainer.accelerate_base_trainer.AccelerateRLTrainer method) State Steps T to_dict() (trlx.data.configs.TRLConfig method) TrainConfig (class in trlx.data.configs) TRLConfig (class in trlx.data.configs)