lightrft.strategy
- lightrft.strategy.config
  - StrategyConfig
    - StrategyConfig.actor_learning_rate
    - StrategyConfig.adam_betas
    - StrategyConfig.adam_offload
    - StrategyConfig.advantage_clip
    - StrategyConfig.advantage_estimator
    - StrategyConfig.advantages_norm
    - StrategyConfig.bf16
    - StrategyConfig.critic_learning_rate
    - StrategyConfig.critic_pretrain
    - StrategyConfig.dynamic_sampling
    - StrategyConfig.enable_engine_sleep
    - StrategyConfig.engine_tp_size
    - StrategyConfig.engine_type
    - StrategyConfig.extra_args
    - StrategyConfig.from_args()
    - StrategyConfig.fsdp
    - StrategyConfig.fsdp_cpu_offload
    - StrategyConfig.fused_linear_logprob
    - StrategyConfig.grad_accum_dtype
    - StrategyConfig.kl_estimator
    - StrategyConfig.l2
    - StrategyConfig.local_rank
    - StrategyConfig.lr_warmup_ratio
    - StrategyConfig.max_norm
    - StrategyConfig.micro_rollout_batch_size
    - StrategyConfig.micro_train_batch_size
    - StrategyConfig.mixed_mm_data
    - StrategyConfig.n_samples_per_prompt
    - StrategyConfig.overlap_comm
    - StrategyConfig.overlong_buffer
    - StrategyConfig.overlong_buffer_len
    - StrategyConfig.overlong_buffer_penalty_factor
    - StrategyConfig.plot_every
    - StrategyConfig.pretrain_data
    - StrategyConfig.print_config_summary()
    - StrategyConfig.remote_rm_url
    - StrategyConfig.reward_clip
    - StrategyConfig.reward_running_norm
    - StrategyConfig.reward_running_norm_minus_mean
    - StrategyConfig.seed
    - StrategyConfig.sp_size
    - StrategyConfig.train_batch_size
    - StrategyConfig.use_kl_loss
    - StrategyConfig.use_mp_opt
    - StrategyConfig.use_tensorboard
    - StrategyConfig.zero_stage
    - StrategyConfig.zpg
- lightrft.strategy.deepspeed
- lightrft.strategy.fake_strategy
  - FakeStrategy
    - FakeStrategy.all_gather()
    - FakeStrategy.all_reduce()
    - FakeStrategy.backward()
    - FakeStrategy.create_optimizer()
    - FakeStrategy.engine_generate_local()
    - FakeStrategy.gather_and_generate()
    - FakeStrategy.get_rank()
    - FakeStrategy.init_model_context()
    - FakeStrategy.is_rank_0()
    - FakeStrategy.load_ckpt()
    - FakeStrategy.maybe_load_optimizer()
    - FakeStrategy.maybe_offload_optimizer()
    - FakeStrategy.maybe_sleep_inference_engine()
    - FakeStrategy.optimizer_step()
    - FakeStrategy.prepare()
    - FakeStrategy.save_ckpt()
    - FakeStrategy.setup_distributed()
    - FakeStrategy.setup_inference_engine()
    - FakeStrategy.update_engine_weights()
    - FakeStrategy.wakeup_inference_engine()
  - get_fake_strategy()
- lightrft.strategy.fsdp
- lightrft.strategy.sglang_utils
- lightrft.strategy.strategy
- lightrft.strategy.strategy_base
- lightrft.strategy.utils
- lightrft.strategy.vllm_utils