LICENSE
README.md
setup.py
chatlearn/__init__.py
chatlearn/entrypoint.py
chatlearn/hooks.py
chatlearn/offline_ckpt_converter.py
chatlearn/algorithm/__init__.py
chatlearn/algorithm/base_algo.py
chatlearn/algorithm/grpo.py
chatlearn/checkpoint/__init__.py
chatlearn/checkpoint/checkpoint_manager.py
chatlearn/configs/__init__.py
chatlearn/configs/fsdp_config.py
chatlearn/configs/megatron_config.py
chatlearn/configs/policy_config.py
chatlearn/configs/runtime_config.py
chatlearn/configs/base/__init__.py
chatlearn/configs/base/base_config.py
chatlearn/configs/base/base_model_config.py
chatlearn/configs/base/common.py
chatlearn/data/__init__.py
chatlearn/data/data.py
chatlearn/data/prompt_dataset.py
chatlearn/data/sampler.py
chatlearn/launcher/__init__.py
chatlearn/launcher/dlc_utils.py
chatlearn/launcher/initialize.py
chatlearn/models/__init__.py
chatlearn/models/base_module.py
chatlearn/models/fsdp_module.py
chatlearn/models/megatron_module.py
chatlearn/models/sglang_module.py
chatlearn/models/torch_module.py
chatlearn/models/vllm_module.py
chatlearn/models/megatron/__init__.py
chatlearn/models/megatron/memory_manager/__init__.py
chatlearn/models/megatron/memory_manager/inference.py
chatlearn/models/megatron/memory_manager/trainer.py
chatlearn/models/reward/__init__.py
chatlearn/models/reward/rule_reward.py
chatlearn/models/vllm/__init__.py
chatlearn/models/vllm/hooks/__init__.py
chatlearn/models/vllm/hooks/vllm_0_8_5/__init__.py
chatlearn/models/vllm/hooks/vllm_0_8_5/async_llm_engine.py
chatlearn/models/vllm/hooks/vllm_0_8_5/llm.py
chatlearn/models/vllm/hooks/vllm_0_8_5/llm_engine.py
chatlearn/models/vllm/hooks/vllm_0_8_5/logits_processor.py
chatlearn/models/vllm/hooks/vllm_0_8_5/ray_distributed_executor.py
chatlearn/models/vllm/hooks/vllm_0_8_5/worker_base.py
chatlearn/runtime/__init__.py
chatlearn/runtime/decorator.py
chatlearn/runtime/dist_actor.py
chatlearn/runtime/engine.py
chatlearn/runtime/environment.py
chatlearn/runtime/evaluator.py
chatlearn/runtime/executor.py
chatlearn/runtime/model_flow.py
chatlearn/runtime/trainer.py
chatlearn/runtime/utils.py
chatlearn/schedule/__init__.py
chatlearn/schedule/metric_manager.py
chatlearn/schedule/model_manager.py
chatlearn/schedule/port_manager.py
chatlearn/schedule/resource_manager.py
chatlearn/synchronizer/__init__.py
chatlearn/synchronizer/base_parameter_sync.py
chatlearn/synchronizer/comm.py
chatlearn/synchronizer/parameter_sync.py
chatlearn/synchronizer/parameter_sync_fsdp.py
chatlearn/synchronizer/structs.py
chatlearn/synchronizer/mappers/__init__.py
chatlearn/synchronizer/mappers/mapper.py
chatlearn/synchronizer/mappers/mapping_helpers.py
chatlearn/synchronizer/planners/__init__.py
chatlearn/synchronizer/planners/base_planner.py
chatlearn/synchronizer/planners/shard_planner.py
chatlearn/synchronizer/planners/tensor_planner.py
chatlearn/utils/__init__.py
chatlearn/utils/arguments.py
chatlearn/utils/communication_op.py
chatlearn/utils/constant.py
chatlearn/utils/error_monitor.py
chatlearn/utils/flat_tensors.py
chatlearn/utils/future.py
chatlearn/utils/global_vars.py
chatlearn/utils/log_monitor.py
chatlearn/utils/logger.py
chatlearn/utils/megatron_utils.py
chatlearn/utils/parse_utils.py
chatlearn/utils/timer.py
chatlearn/utils/utils.py
chatlearn/utils/version.py
chatlearn/utils/vllm_utils.py
chatlearn/utils/mappings/__init__.py
chatlearn/utils/mappings/huggingface_helpers.py
chatlearn/utils/mappings/megatron_helpers.py
chatlearn/utils/mappings/sharded_tensor_info.py
chatlearn/utils/mappings/vllm_helpers.py
chatlearn/utils/rule_reward_score/__init__.py
chatlearn/utils/rule_reward_score/math.py
examples/__init__.py
pai_chatlearn.egg-info/PKG-INFO
pai_chatlearn.egg-info/SOURCES.txt
pai_chatlearn.egg-info/dependency_links.txt
pai_chatlearn.egg-info/top_level.txt
tests/__init__.py
tests/test_main.py
tests/utils.py
tests/parameter_sync/__init__.py
tests/parameter_sync/test_mapper_helpers.py
tests/rlhf/__init__.py
tests/rlhf/test_ckpt.py
tests/rlhf/test_data.py
tests/rlhf/test_grpo.py
tests/rlhf/test_indivisible_batchsz.py
tests/rlhf/test_model_flow.py
tests/rlhf/test_placement.py
tests/rlhf/test_placement_colocate.py
tests/rlhf/test_relay_buffer.py
tests/rlhf/test_rlhf_custom.py
tests/rlhf/test_rlhf_placement_colocate.py
tests/rlhf/test_rlhf_replica.py