LICENSE
MANIFEST.in
README.md
pyproject.toml
requirements.txt
setup.py
src/setuptools_axolotl_dynamic_dependencies.py
src/axolotl/__init__.py
src/axolotl/convert.py
src/axolotl/datasets.py
src/axolotl/evaluate.py
src/axolotl/logging_config.py
src/axolotl/processing_strategies.py
src/axolotl/prompt_tokenizers.py
src/axolotl/prompters.py
src/axolotl/train.py
src/axolotl.egg-info/PKG-INFO
src/axolotl.egg-info/SOURCES.txt
src/axolotl.egg-info/dependency_links.txt
src/axolotl.egg-info/entry_points.txt
src/axolotl.egg-info/requires.txt
src/axolotl.egg-info/top_level.txt
src/axolotl/cli/__init__.py
src/axolotl/cli/args.py
src/axolotl/cli/art.py
src/axolotl/cli/checks.py
src/axolotl/cli/config.py
src/axolotl/cli/delinearize_llama4.py
src/axolotl/cli/evaluate.py
src/axolotl/cli/inference.py
src/axolotl/cli/main.py
src/axolotl/cli/merge_lora.py
src/axolotl/cli/merge_sharded_fsdp_weights.py
src/axolotl/cli/preprocess.py
src/axolotl/cli/quantize.py
src/axolotl/cli/train.py
src/axolotl/cli/vllm_serve.py
src/axolotl/cli/cloud/__init__.py
src/axolotl/cli/cloud/base.py
src/axolotl/cli/cloud/modal_.py
src/axolotl/cli/utils/__init__.py
src/axolotl/cli/utils/args.py
src/axolotl/cli/utils/fetch.py
src/axolotl/cli/utils/load.py
src/axolotl/cli/utils/sweeps.py
src/axolotl/cli/utils/train.py
src/axolotl/common/__init__.py
src/axolotl/common/architectures.py
src/axolotl/common/const.py
src/axolotl/common/datasets.py
src/axolotl/core/__init__.py
src/axolotl/core/training_args.py
src/axolotl/core/training_args_base.py
src/axolotl/core/attention/__init__.py
src/axolotl/core/attention/flex_block_mask.py
src/axolotl/core/builders/__init__.py
src/axolotl/core/builders/base.py
src/axolotl/core/builders/causal.py
src/axolotl/core/builders/rl.py
src/axolotl/core/chat/__init__.py
src/axolotl/core/chat/messages.py
src/axolotl/core/chat/format/__init__.py
src/axolotl/core/chat/format/chatml.py
src/axolotl/core/chat/format/llama3x.py
src/axolotl/core/chat/format/shared.py
src/axolotl/core/datasets/__init__.py
src/axolotl/core/datasets/chat.py
src/axolotl/core/datasets/transforms/__init__.py
src/axolotl/core/datasets/transforms/chat_builder.py
src/axolotl/core/trainers/__init__.py
src/axolotl/core/trainers/base.py
src/axolotl/core/trainers/mamba.py
src/axolotl/core/trainers/trl.py
src/axolotl/core/trainers/utils.py
src/axolotl/core/trainers/dpo/__init__.py
src/axolotl/core/trainers/dpo/args.py
src/axolotl/core/trainers/dpo/trainer.py
src/axolotl/core/trainers/grpo/__init__.py
src/axolotl/core/trainers/grpo/args.py
src/axolotl/core/trainers/grpo/sampler.py
src/axolotl/core/trainers/grpo/trainer.py
src/axolotl/core/trainers/mixins/__init__.py
src/axolotl/core/trainers/mixins/activation_checkpointing.py
src/axolotl/core/trainers/mixins/checkpoints.py
src/axolotl/core/trainers/mixins/distributed_parallel.py
src/axolotl/core/trainers/mixins/optimizer.py
src/axolotl/core/trainers/mixins/packing.py
src/axolotl/core/trainers/mixins/rng_state_loader.py
src/axolotl/core/trainers/mixins/scheduler.py
src/axolotl/integrations/__init__.py
src/axolotl/integrations/base.py
src/axolotl/integrations/config.py
src/axolotl/integrations/cut_cross_entropy/__init__.py
src/axolotl/integrations/cut_cross_entropy/args.py
src/axolotl/integrations/densemixer/__init__.py
src/axolotl/integrations/densemixer/args.py
src/axolotl/integrations/densemixer/plugin.py
src/axolotl/integrations/grokfast/__init__.py
src/axolotl/integrations/grokfast/args.py
src/axolotl/integrations/grokfast/optimizer.py
src/axolotl/integrations/kd/__init__.py
src/axolotl/integrations/kd/args.py
src/axolotl/integrations/kd/callbacks.py
src/axolotl/integrations/kd/chat_template.py
src/axolotl/integrations/kd/collator.py
src/axolotl/integrations/kd/collator_online_teacher.py
src/axolotl/integrations/kd/trainer.py
src/axolotl/integrations/kd/utils.py
src/axolotl/integrations/kd/kernels/__init__.py
src/axolotl/integrations/kd/kernels/liger.py
src/axolotl/integrations/kd/kernels/models.py
src/axolotl/integrations/kd/topk_logprob/__init__.py
src/axolotl/integrations/kd/topk_logprob/forward_kl.py
src/axolotl/integrations/liger/__init__.py
src/axolotl/integrations/liger/args.py
src/axolotl/integrations/liger/plugin.py
src/axolotl/integrations/liger/utils.py
src/axolotl/integrations/liger/models/__init__.py
src/axolotl/integrations/liger/models/base.py
src/axolotl/integrations/liger/models/deepseekv2.py
src/axolotl/integrations/liger/models/jamba.py
src/axolotl/integrations/liger/models/llama4.py
src/axolotl/integrations/liger/models/qwen3.py
src/axolotl/integrations/liger/models/qwen3_moe.py
src/axolotl/integrations/llm_compressor/__init__.py
src/axolotl/integrations/llm_compressor/args.py
src/axolotl/integrations/llm_compressor/plugin.py
src/axolotl/integrations/llm_compressor/utils.py
src/axolotl/integrations/lm_eval/__init__.py
src/axolotl/integrations/lm_eval/args.py
src/axolotl/integrations/lm_eval/cli.py
src/axolotl/integrations/spectrum/__init__.py
src/axolotl/integrations/spectrum/args.py
src/axolotl/kernels/__init__.py
src/axolotl/kernels/geglu.py
src/axolotl/kernels/lora.py
src/axolotl/kernels/quantize.py
src/axolotl/kernels/swiglu.py
src/axolotl/kernels/utils.py
src/axolotl/loaders/__init__.py
src/axolotl/loaders/adapter.py
src/axolotl/loaders/constants.py
src/axolotl/loaders/model.py
src/axolotl/loaders/patch_manager.py
src/axolotl/loaders/processor.py
src/axolotl/loaders/tokenizer.py
src/axolotl/loaders/utils.py
src/axolotl/loaders/adapters/__init__.py
src/axolotl/models/__init__.py
src/axolotl/models/mamba/__init__.py
src/axolotl/models/mamba/configuration_mamba.py
src/axolotl/models/mamba/modeling_mamba.py
src/axolotl/monkeypatch/__init__.py
src/axolotl/monkeypatch/btlm_attn_hijack_flash.py
src/axolotl/monkeypatch/fsdp2_qlora.py
src/axolotl/monkeypatch/llama_attn_hijack_flash.py
src/axolotl/monkeypatch/llama_attn_hijack_xformers.py
src/axolotl/monkeypatch/llama_expand_mask.py
src/axolotl/monkeypatch/llama_patch_multipack.py
src/axolotl/monkeypatch/lora_kernels.py
src/axolotl/monkeypatch/mistral_attn_hijack_flash.py
src/axolotl/monkeypatch/multipack.py
src/axolotl/monkeypatch/relora.py
src/axolotl/monkeypatch/stablelm_attn_hijack_flash.py
src/axolotl/monkeypatch/trainer_accelerator_args.py
src/axolotl/monkeypatch/trainer_fsdp_optim.py
src/axolotl/monkeypatch/transformers_fa_utils.py
src/axolotl/monkeypatch/unsloth_.py
src/axolotl/monkeypatch/utils.py
src/axolotl/monkeypatch/accelerate/__init__.py
src/axolotl/monkeypatch/accelerate/fsdp2.py
src/axolotl/monkeypatch/accelerate/parallelism_config.py
src/axolotl/monkeypatch/attention/__init__.py
src/axolotl/monkeypatch/attention/flex_attn.py
src/axolotl/monkeypatch/attention/xformers.py
src/axolotl/monkeypatch/data/__init__.py
src/axolotl/monkeypatch/data/batch_dataset_fetcher.py
src/axolotl/monkeypatch/gradient_checkpointing/__init__.py
src/axolotl/monkeypatch/gradient_checkpointing/offload_cpu.py
src/axolotl/monkeypatch/gradient_checkpointing/offload_disk.py
src/axolotl/monkeypatch/loss/__init__.py
src/axolotl/monkeypatch/loss/chunked.py
src/axolotl/monkeypatch/mixtral/__init__.py
src/axolotl/monkeypatch/models/__init__.py
src/axolotl/monkeypatch/models/llama4/__init__.py
src/axolotl/monkeypatch/models/llama4/modeling.py
src/axolotl/monkeypatch/models/voxtral/__init__.py
src/axolotl/monkeypatch/models/voxtral/modeling.py
src/axolotl/monkeypatch/peft/__init__.py
src/axolotl/monkeypatch/peft/utils.py
src/axolotl/monkeypatch/ring_attn/__init__.py
src/axolotl/monkeypatch/ring_attn/patch.py
src/axolotl/monkeypatch/ring_attn/adapters/__init__.py
src/axolotl/monkeypatch/ring_attn/adapters/batch.py
src/axolotl/monkeypatch/tiled_mlp/__init__.py
src/axolotl/monkeypatch/tiled_mlp/base.py
src/axolotl/monkeypatch/tiled_mlp/patch.py
src/axolotl/monkeypatch/trainer/__init__.py
src/axolotl/monkeypatch/trainer/lr.py
src/axolotl/monkeypatch/trainer/trl.py
src/axolotl/monkeypatch/transformers/__init__.py
src/axolotl/monkeypatch/transformers/modeling_flash_attention_utils.py
src/axolotl/monkeypatch/transformers/trainer_loss_calc.py
src/axolotl/monkeypatch/xformers_/__init__.py
src/axolotl/prompt_strategies/__init__.py
src/axolotl/prompt_strategies/alpaca_chat.py
src/axolotl/prompt_strategies/alpaca_instruct.py
src/axolotl/prompt_strategies/alpaca_w_system.py
src/axolotl/prompt_strategies/base.py
src/axolotl/prompt_strategies/chat_template.py
src/axolotl/prompt_strategies/completion.py
src/axolotl/prompt_strategies/context_qa.py
src/axolotl/prompt_strategies/creative_acr.py
src/axolotl/prompt_strategies/input_output.py
src/axolotl/prompt_strategies/jinja_template_analyzer.py
src/axolotl/prompt_strategies/llama2_chat.py
src/axolotl/prompt_strategies/metharme.py
src/axolotl/prompt_strategies/orcamini.py
src/axolotl/prompt_strategies/pretrain.py
src/axolotl/prompt_strategies/pygmalion.py
src/axolotl/prompt_strategies/stepwise_supervised.py
src/axolotl/prompt_strategies/user_defined.py
src/axolotl/prompt_strategies/bradley_terry/__init__.py
src/axolotl/prompt_strategies/bradley_terry/chat_template.py
src/axolotl/prompt_strategies/bradley_terry/llama3.py
src/axolotl/prompt_strategies/dpo/__init__.py
src/axolotl/prompt_strategies/dpo/chat_template.py
src/axolotl/prompt_strategies/dpo/chatml.py
src/axolotl/prompt_strategies/dpo/llama3.py
src/axolotl/prompt_strategies/dpo/passthrough.py
src/axolotl/prompt_strategies/dpo/user_defined.py
src/axolotl/prompt_strategies/dpo/zephyr.py
src/axolotl/prompt_strategies/kto/__init__.py
src/axolotl/prompt_strategies/kto/chatml.py
src/axolotl/prompt_strategies/kto/llama3.py
src/axolotl/prompt_strategies/kto/user_defined.py
src/axolotl/prompt_strategies/messages/__init__.py
src/axolotl/prompt_strategies/messages/chat.py
src/axolotl/prompt_strategies/orpo/__init__.py
src/axolotl/prompt_strategies/orpo/chat_template.py
src/axolotl/utils/__init__.py
src/axolotl/utils/bench.py
src/axolotl/utils/comet_.py
src/axolotl/utils/datasets.py
src/axolotl/utils/dict.py
src/axolotl/utils/distributed.py
src/axolotl/utils/environment.py
src/axolotl/utils/freeze.py
src/axolotl/utils/import_helper.py
src/axolotl/utils/logging.py
src/axolotl/utils/lora.py
src/axolotl/utils/mlflow_.py
src/axolotl/utils/model_shard_quant.py
src/axolotl/utils/quantization.py
src/axolotl/utils/schedulers.py
src/axolotl/utils/tokenization.py
src/axolotl/utils/trainer.py
src/axolotl/utils/wandb_.py
src/axolotl/utils/callbacks/__init__.py
src/axolotl/utils/callbacks/comet_.py
src/axolotl/utils/callbacks/lisa.py
src/axolotl/utils/callbacks/mlflow_.py
src/axolotl/utils/callbacks/models.py
src/axolotl/utils/callbacks/perplexity.py
src/axolotl/utils/callbacks/profiler.py
src/axolotl/utils/callbacks/qat.py
src/axolotl/utils/chat_templates/__init__.py
src/axolotl/utils/chat_templates/base.py
src/axolotl/utils/chat_templates/templates/alpaca.jinja
src/axolotl/utils/chat_templates/templates/aya.jinja
src/axolotl/utils/chat_templates/templates/chatml.jinja
src/axolotl/utils/chat_templates/templates/cohere.jinja
src/axolotl/utils/chat_templates/templates/command_a.jinja
src/axolotl/utils/chat_templates/templates/command_a_rag.jinja
src/axolotl/utils/chat_templates/templates/command_a_tool_use.jinja
src/axolotl/utils/chat_templates/templates/deepseek_v2.jinja
src/axolotl/utils/chat_templates/templates/deepseek_v3.jinja
src/axolotl/utils/chat_templates/templates/exaone.jinja
src/axolotl/utils/chat_templates/templates/falcon_h1.jinja
src/axolotl/utils/chat_templates/templates/gemma.jinja
src/axolotl/utils/chat_templates/templates/gemma3.jinja
src/axolotl/utils/chat_templates/templates/gemma3n.jinja
src/axolotl/utils/chat_templates/templates/jamba.jinja
src/axolotl/utils/chat_templates/templates/llama3.jinja
src/axolotl/utils/chat_templates/templates/llama3_2_vision.jinja
src/axolotl/utils/chat_templates/templates/llama4.jinja
src/axolotl/utils/chat_templates/templates/llava.jinja
src/axolotl/utils/chat_templates/templates/metharme.jinja
src/axolotl/utils/chat_templates/templates/mistral_v1.jinja
src/axolotl/utils/chat_templates/templates/mistral_v2v3.jinja
src/axolotl/utils/chat_templates/templates/mistral_v3_tekken.jinja
src/axolotl/utils/chat_templates/templates/mistral_v7_tekken.jinja
src/axolotl/utils/chat_templates/templates/phi_3.jinja
src/axolotl/utils/chat_templates/templates/phi_35.jinja
src/axolotl/utils/chat_templates/templates/phi_4.jinja
src/axolotl/utils/chat_templates/templates/pixtral.jinja
src/axolotl/utils/chat_templates/templates/qwen2_vl.jinja
src/axolotl/utils/chat_templates/templates/qwen3.jinja
src/axolotl/utils/chat_templates/templates/qwen_25.jinja
src/axolotl/utils/collators/__init__.py
src/axolotl/utils/collators/batching.py
src/axolotl/utils/collators/core.py
src/axolotl/utils/collators/mamba.py
src/axolotl/utils/collators/mm_chat.py
src/axolotl/utils/config/__init__.py
src/axolotl/utils/config/models/__init__.py
src/axolotl/utils/ctx_managers/__init__.py
src/axolotl/utils/ctx_managers/sequence_parallel.py
src/axolotl/utils/data/__init__.py
src/axolotl/utils/data/lock.py
src/axolotl/utils/data/pretraining.py
src/axolotl/utils/data/rl.py
src/axolotl/utils/data/sft.py
src/axolotl/utils/data/shared.py
src/axolotl/utils/data/utils.py
src/axolotl/utils/data/wrappers.py
src/axolotl/utils/mistral/__init__.py
src/axolotl/utils/mistral/mistral_tokenizer.py
src/axolotl/utils/optimizers/__init__.py
src/axolotl/utils/optimizers/adopt.py
src/axolotl/utils/samplers/__init__.py
src/axolotl/utils/samplers/multipack.py
src/axolotl/utils/samplers/utils.py
src/axolotl/utils/schemas/__init__.py
src/axolotl/utils/schemas/config.py
src/axolotl/utils/schemas/datasets.py
src/axolotl/utils/schemas/deprecated.py
src/axolotl/utils/schemas/enums.py
src/axolotl/utils/schemas/integrations.py
src/axolotl/utils/schemas/model.py
src/axolotl/utils/schemas/multimodal.py
src/axolotl/utils/schemas/peft.py
src/axolotl/utils/schemas/quantization.py
src/axolotl/utils/schemas/training.py
src/axolotl/utils/schemas/trl.py
src/axolotl/utils/schemas/utils.py
src/axolotl/utils/schemas/validation.py
src/axolotl/utils/schemas/vllm.py
src/axolotl/utils/schemas/internal/__init__.py