# trinity.common package
## Subpackages
- trinity.common.models package
- trinity.common.rewards package
- Submodules
- trinity.common.rewards.accuracy_reward module
- trinity.common.rewards.agents_reward module
- trinity.common.rewards.countdown_reward module
- trinity.common.rewards.dapo_reward module
- trinity.common.rewards.format_reward module
- trinity.common.rewards.human_reward module
- trinity.common.rewards.math_reward module
- trinity.common.rewards.reward_fn module
- trinity.common.rewards.tool_reward module
- trinity.common.rewards.utils module
- Module contents
- Submodules
- trinity.common.workflows package
- Subpackages
- Submodules
- trinity.common.workflows.agentscope_workflow module
- trinity.common.workflows.customized_math_workflows module
- trinity.common.workflows.customized_toolcall_workflows module
- trinity.common.workflows.eval_workflow module
- trinity.common.workflows.math_rm_workflow module
- trinity.common.workflows.math_ruler_workflow module
- trinity.common.workflows.math_trainable_ruler_workflow module
- trinity.common.workflows.rubric_judge_workflow module
- trinity.common.workflows.simple_mm_workflow module
- trinity.common.workflows.step_wise_workflow module
- trinity.common.workflows.workflow module
- Module contents
  - Task
  - Workflow
  - AsyncSimpleWorkflow
  - SimpleWorkflow
  - AsyncMathWorkflow
  - MathWorkflow
  - WebShopWorkflow
  - AlfworldWorkflow
  - StepWiseAlfworldWorkflow
  - RAFTAlfworldWorkflow
    - RAFTAlfworldWorkflow.can_reset
    - RAFTAlfworldWorkflow.can_repeat
    - RAFTAlfworldWorkflow.is_async
    - RAFTAlfworldWorkflow.__init__()
    - RAFTAlfworldWorkflow.reset()
    - RAFTAlfworldWorkflow.create_environment()
    - RAFTAlfworldWorkflow.run_single_rollout()
    - RAFTAlfworldWorkflow.eval_alfworld()
    - RAFTAlfworldWorkflow.run_async()
    - RAFTAlfworldWorkflow.set_repeat_times()
  - RAFTReflectAlfworldWorkflow
  - SciWorldWorkflow
  - AsyncMathBoxedWorkflow
  - MathBoxedWorkflow
  - AsyncMathRMWorkflow
  - MathRMWorkflow
  - ToolCallWorkflow
  - AsyncMathEvalWorkflow
  - MathEvalWorkflow
  - AgentScopeV0ReactMathWorkflow
  - AgentScopeReactMathWorkflow
  - AgentScopeV1ReactSearchWorkflow
  - AgentScopeReActWorkflow
  - EmailSearchWorkflow
  - AsyncMathRULERWorkflow
  - MathRULERWorkflow
  - MathTrainableRULERWorkflow
  - AsyncSimpleMMWorkflow
  - SimpleMMWorkflow
  - RubricJudgeWorkflow
  - AgentScopeWorkflowAdapter
## Submodules
- trinity.common.config module
  - set_if_none()
  - FormatConfig
    - FormatConfig.prompt_type
    - FormatConfig.prompt_key
    - FormatConfig.response_key
    - FormatConfig.system_prompt_key
    - FormatConfig.system_prompt
    - FormatConfig.messages_key
    - FormatConfig.tools_key
    - FormatConfig.image_key
    - FormatConfig.video_key
    - FormatConfig.reply_prefix
    - FormatConfig.workflow_key
    - FormatConfig.reward_fn_key
    - FormatConfig.chosen_key
    - FormatConfig.rejected_key
    - FormatConfig.enable_concatenated_multi_turn
    - FormatConfig.chat_template
    - FormatConfig.__init__()
  - GenerationConfig
  - OptimizerConfig
  - LoRAConfig
  - TaskSelectorConfig
  - ReplayBufferConfig
  - StorageConfig
    - StorageConfig.name
    - StorageConfig.storage_type
    - StorageConfig.path
    - StorageConfig.repeat_times
    - StorageConfig.index
    - StorageConfig.split
    - StorageConfig.subset_name
    - StorageConfig.format
    - StorageConfig.capacity
    - StorageConfig.max_read_timeout
    - StorageConfig.replay_buffer
    - StorageConfig.max_retry_times
    - StorageConfig.max_retry_interval
    - StorageConfig.default_workflow_type
    - StorageConfig.default_reward_fn_type
    - StorageConfig.rollout_args
    - StorageConfig.workflow_args
    - StorageConfig.reward_fn_args
    - StorageConfig.task_selector
    - StorageConfig.enable_progress_bar
    - StorageConfig.ray_namespace
    - StorageConfig.wrap_in_ray
    - StorageConfig.schema_type
    - StorageConfig.total_epochs
    - StorageConfig.total_steps
    - StorageConfig.batch_size
    - StorageConfig.tokenizer_path
    - StorageConfig.is_eval
    - StorageConfig.__init__()
  - TasksetConfig
    - TasksetConfig.name
    - TasksetConfig.storage_type
    - TasksetConfig.path
    - TasksetConfig.default_workflow_type
    - TasksetConfig.default_reward_fn_type
    - TasksetConfig.rollout_args
    - TasksetConfig.workflow_args
    - TasksetConfig.reward_fn_args
    - TasksetConfig.task_selector
    - TasksetConfig.split
    - TasksetConfig.subset_name
    - TasksetConfig.format
    - TasksetConfig.max_retry_times
    - TasksetConfig.max_retry_interval
    - TasksetConfig.enable_progress_bar
    - TasksetConfig.index
    - TasksetConfig.repeat_times
    - TasksetConfig.is_eval
    - TasksetConfig.batch_size
    - TasksetConfig.total_epochs
    - TasksetConfig.total_steps
    - TasksetConfig.to_storage_config()
    - TasksetConfig.__init__()
  - ExperienceBufferConfig
    - ExperienceBufferConfig.name
    - ExperienceBufferConfig.storage_type
    - ExperienceBufferConfig.path
    - ExperienceBufferConfig.capacity
    - ExperienceBufferConfig.max_read_timeout
    - ExperienceBufferConfig.replay_buffer
    - ExperienceBufferConfig.max_retry_times
    - ExperienceBufferConfig.max_retry_interval
    - ExperienceBufferConfig.split
    - ExperienceBufferConfig.subset_name
    - ExperienceBufferConfig.format
    - ExperienceBufferConfig.enable_progress_bar
    - ExperienceBufferConfig.schema_type
    - ExperienceBufferConfig.index
    - ExperienceBufferConfig.batch_size
    - ExperienceBufferConfig.tokenizer_path
    - ExperienceBufferConfig.total_epochs
    - ExperienceBufferConfig.total_steps
    - ExperienceBufferConfig.to_storage_config()
    - ExperienceBufferConfig.__init__()
  - OperatorConfig
  - ExperiencePipelineConfig
  - TaskPipelineConfig
  - DataProcessorConfig
  - ModelConfig
    - ModelConfig.model_path
    - ModelConfig.critic_model_path
    - ModelConfig.custom_chat_template
    - ModelConfig.temperature
    - ModelConfig.top_p
    - ModelConfig.top_k
    - ModelConfig.logprobs
    - ModelConfig.max_model_len
    - ModelConfig.max_prompt_tokens
    - ModelConfig.max_response_tokens
    - ModelConfig.min_response_tokens
    - ModelConfig.lora_configs
    - ModelConfig.fully_sharded_loras
    - ModelConfig.max_cpu_loras
    - ModelConfig.__init__()
  - InferenceModelConfig
    - InferenceModelConfig.model_path
    - InferenceModelConfig.engine_type
    - InferenceModelConfig.engine_num
    - InferenceModelConfig.tensor_parallel_size
    - InferenceModelConfig.use_v1
    - InferenceModelConfig.enforce_eager
    - InferenceModelConfig.enable_prefix_caching
    - InferenceModelConfig.enable_chunked_prefill
    - InferenceModelConfig.gpu_memory_utilization
    - InferenceModelConfig.dtype
    - InferenceModelConfig.seed
    - InferenceModelConfig.temperature
    - InferenceModelConfig.top_p
    - InferenceModelConfig.top_k
    - InferenceModelConfig.logprobs
    - InferenceModelConfig.max_model_len
    - InferenceModelConfig.max_prompt_tokens
    - InferenceModelConfig.max_response_tokens
    - InferenceModelConfig.min_response_tokens
    - InferenceModelConfig.ignore_eos
    - InferenceModelConfig.chat_template
    - InferenceModelConfig.enable_thinking
    - InferenceModelConfig.enable_history
    - InferenceModelConfig.enable_openai_api
    - InferenceModelConfig.enable_auto_tool_choice
    - InferenceModelConfig.tool_call_parser
    - InferenceModelConfig.reasoning_parser
    - InferenceModelConfig.bundle_indices
    - InferenceModelConfig.enable_lora
    - InferenceModelConfig.lora_modules
    - InferenceModelConfig.lora_kwargs
    - InferenceModelConfig.__init__()
  - AlgorithmConfig
    - AlgorithmConfig.algorithm_type
    - AlgorithmConfig.repeat_times
    - AlgorithmConfig.optimizer
    - AlgorithmConfig.sample_strategy
    - AlgorithmConfig.sample_strategy_args
    - AlgorithmConfig.advantage_fn
    - AlgorithmConfig.advantage_fn_args
    - AlgorithmConfig.kl_penalty_fn
    - AlgorithmConfig.kl_penalty_fn_args
    - AlgorithmConfig.policy_loss_fn
    - AlgorithmConfig.policy_loss_fn_args
    - AlgorithmConfig.kl_loss_fn
    - AlgorithmConfig.kl_loss_fn_args
    - AlgorithmConfig.entropy_loss_fn
    - AlgorithmConfig.entropy_loss_fn_args
    - AlgorithmConfig.__init__()
  - ClusterConfig
  - ExplorerInput
  - TrainerInput
  - BufferConfig
  - ExplorerConfig
    - ExplorerConfig.name
    - ExplorerConfig.runner_per_model
    - ExplorerConfig.max_timeout
    - ExplorerConfig.max_retry_times
    - ExplorerConfig.env_vars
    - ExplorerConfig.max_repeat_times_per_runner
    - ExplorerConfig.runner_num
    - ExplorerConfig.rollout_model
    - ExplorerConfig.auxiliary_models
    - ExplorerConfig.eval_interval
    - ExplorerConfig.eval_on_startup
    - ExplorerConfig.bench_on_latest_checkpoint
    - ExplorerConfig.api_port
    - ExplorerConfig.listen_address
    - ExplorerConfig.service_status_check_interval
    - ExplorerConfig.min_running_model_num
    - ExplorerConfig.__init__()
  - TrainerConfig
    - TrainerConfig.name
    - TrainerConfig.trainer_type
    - TrainerConfig.save_interval
    - TrainerConfig.enable_preview
    - TrainerConfig.total_steps
    - TrainerConfig.grad_clip
    - TrainerConfig.use_dynamic_bsz
    - TrainerConfig.max_token_len_per_gpu
    - TrainerConfig.ulysses_sequence_parallel_size
    - TrainerConfig.fix_actor_microbatch_loss_scale
    - TrainerConfig.save_strategy
    - TrainerConfig.trainer_config
    - TrainerConfig.trainer_config_path
    - TrainerConfig.__init__()
  - MonitorConfig
  - SynchronizerConfig
  - DataJuicerServiceConfig
  - ServiceConfig
  - LogConfig
  - StageConfig
  - Config
    - Config.mode
    - Config.project
    - Config.group
    - Config.name
    - Config.checkpoint_root_dir
    - Config.checkpoint_job_dir
    - Config.ray_namespace
    - Config.continue_from_checkpoint
    - Config.algorithm
    - Config.data_processor
    - Config.model
    - Config.cluster
    - Config.buffer
    - Config.explorer
    - Config.trainer
    - Config.monitor
    - Config.synchronizer
    - Config.service
    - Config.log
    - Config.stages
    - Config.save()
    - Config.check_and_update()
    - Config.flatten()
    - Config.get_envs()
    - Config.__init__()
  - load_config()
- trinity.common.constants module
- trinity.common.experience module
  - EID
  - CustomField
  - Experience
    - Experience.__init__()
    - Experience.eid
    - Experience.reward
    - Experience.advantages
    - Experience.returns
    - Experience.info
    - Experience.metrics
    - Experience.prompt_length
    - Experience.response_text
    - Experience.prompt_text
    - Experience.messages
    - Experience.tools
    - Experience.chosen_messages
    - Experience.rejected_messages
    - Experience.multi_modal_inputs
    - Experience.tokens
    - Experience.logprobs
    - Experience.action_mask
    - Experience.chosen
    - Experience.rejected
    - Experience.serialize()
    - Experience.deserialize()
    - Experience.to_dict()
    - Experience.gather()
  - split_dpo_experience_to_single_turn()
  - Experiences
    - Experiences.__init__()
    - Experiences.eids
    - Experiences.tokens
    - Experiences.rewards
    - Experiences.advantages
    - Experiences.returns
    - Experiences.attention_masks
    - Experiences.action_masks
    - Experiences.prompt_length
    - Experiences.logprobs
    - Experiences.multi_modal_inputs
    - Experiences.custom_fields
    - Experiences.batch_size
    - Experiences.gather_experiences()
  - empty_experiences()
  - gather_token_ids()
  - gather_action_masks()
  - gather_attention_masks()
  - gather_logprobs()
  - gather_advantages()
  - gather_returns()
  - gather_multi_modal_inputs()
  - group_by()
  - to_hf_datasets()
  - from_hf_datasets()
- trinity.common.verl_config module
  - Data
  - FusedKernelOptions
  - ActorModel
    - ActorModel.path
    - ActorModel.external_lib
    - ActorModel.override_config
    - ActorModel.enable_gradient_checkpointing
    - ActorModel.use_remove_padding
    - ActorModel.use_fused_kernels
    - ActorModel.fused_kernel_options
    - ActorModel.custom_chat_template
    - ActorModel.enable_activation_offload
    - ActorModel.use_shm
    - ActorModel.lora_rank
    - ActorModel.lora_alpha
    - ActorModel.target_modules
    - ActorModel.__init__()
  - Optim
    - Optim.lr
    - Optim.lr_warmup_steps
    - Optim.lr_warmup_steps_ratio
    - Optim.min_lr_ratio
    - Optim.warmup_style
    - Optim.total_training_steps
    - Optim.betas
    - Optim.optimizer
    - Optim.clip_grad
    - Optim.lr_warmup_init
    - Optim.lr_decay_steps
    - Optim.lr_decay_style
    - Optim.min_lr
    - Optim.weight_decay
    - Optim.weight_decay_incr_style
    - Optim.lr_wsd_decay_style
    - Optim.lr_wsd_decay_steps
    - Optim.use_checkpoint_opt_param_scheduler
    - Optim.__init__()
  - WrapPolicy
  - FSDPConfig
  - Checkpoint
  - OverrideTransformerConfig
  - MegatronConfig
    - MegatronConfig.param_offload
    - MegatronConfig.grad_offload
    - MegatronConfig.optimizer_offload
    - MegatronConfig.tensor_model_parallel_size
    - MegatronConfig.expert_model_parallel_size
    - MegatronConfig.expert_tensor_parallel_size
    - MegatronConfig.pipeline_model_parallel_size
    - MegatronConfig.virtual_pipeline_model_parallel_size
    - MegatronConfig.context_parallel_size
    - MegatronConfig.sequence_parallel
    - MegatronConfig.use_distributed_optimizer
    - MegatronConfig.use_dist_checkpointing
    - MegatronConfig.dist_checkpointing_path
    - MegatronConfig.seed
    - MegatronConfig.override_ddp_config
    - MegatronConfig.override_transformer_config
    - MegatronConfig.use_mbridge
    - MegatronConfig.__init__()
  - ProfileConfig
  - Actor
    - Actor.strategy
    - Actor.ppo_mini_batch_size
    - Actor.ppo_micro_batch_size
    - Actor.ppo_micro_batch_size_per_gpu
    - Actor.use_dynamic_bsz
    - Actor.ppo_max_token_len_per_gpu
    - Actor.fix_actor_microbatch_loss_scale
    - Actor.grad_clip
    - Actor.ppo_epochs
    - Actor.shuffle
    - Actor.ulysses_sequence_parallel_size
    - Actor.entropy_from_logits_with_chunking
    - Actor.entropy_checkpointing
    - Actor.checkpoint
    - Actor.optim
    - Actor.fsdp_config
    - Actor.megatron
    - Actor.profile
    - Actor.data_loader_seed
    - Actor.load_weight
    - Actor.loss_agg_mode
    - Actor.clip_ratio
    - Actor.clip_ratio_low
    - Actor.clip_ratio_high
    - Actor.entropy_coeff
    - Actor.use_kl_loss
    - Actor.kl_loss_coef
    - Actor.kl_loss_type
    - Actor.__init__()
  - Ref
    - Ref.fsdp_config
    - Ref.log_prob_micro_batch_size
    - Ref.log_prob_micro_batch_size_per_gpu
    - Ref.log_prob_use_dynamic_bsz
    - Ref.log_prob_max_token_len_per_gpu
    - Ref.ulysses_sequence_parallel_size
    - Ref.entropy_from_logits_with_chunking
    - Ref.entropy_checkpointing
    - Ref.checkpoint
    - Ref.megatron
    - Ref.profile
    - Ref.load_weight
    - Ref.__init__()
  - Rollout
  - ActorRolloutRef
  - CriticModel
  - Critic
    - Critic.strategy
    - Critic.optim
    - Critic.model
    - Critic.ppo_mini_batch_size
    - Critic.ppo_micro_batch_size
    - Critic.ppo_micro_batch_size_per_gpu
    - Critic.forward_micro_batch_size
    - Critic.forward_micro_batch_size_per_gpu
    - Critic.use_dynamic_bsz
    - Critic.ppo_max_token_len_per_gpu
    - Critic.forward_max_token_len_per_gpu
    - Critic.ulysses_sequence_parallel_size
    - Critic.ppo_epochs
    - Critic.shuffle
    - Critic.grad_clip
    - Critic.cliprange_value
    - Critic.checkpoint
    - Critic.rollout_n
    - Critic.loss_agg_mode
    - Critic.megatron
    - Critic.profile
    - Critic.data_loader_seed
    - Critic.load_weight
    - Critic.ray_namespace
    - Critic.__init__()
  - RewardModel
  - CustomRewardFunction
  - KL_Ctrl
  - Algorithm
  - Trainer
    - Trainer.balance_batch
    - Trainer.total_epochs
    - Trainer.total_training_steps
    - Trainer.project_name
    - Trainer.group_name
    - Trainer.experiment_name
    - Trainer.logger
    - Trainer.val_generations_to_log_to_wandb
    - Trainer.nnodes
    - Trainer.n_gpus_per_node
    - Trainer.save_freq
    - Trainer.resume_mode
    - Trainer.resume_from_path
    - Trainer.test_freq
    - Trainer.critic_warmup
    - Trainer.default_hdfs_dir
    - Trainer.remove_previous_ckpt_in_save
    - Trainer.del_local_ckpt_after_load
    - Trainer.default_local_dir
    - Trainer.val_before_train
    - Trainer.training_rollout_mode
    - Trainer.enable_exp_buffer
    - Trainer.sync_freq
    - Trainer.max_actor_ckpt_to_keep
    - Trainer.max_critic_ckpt_to_keep
    - Trainer.device
    - Trainer.__init__()
  - veRLConfig
  - load_config()