LICENSE
MANIFEST.in
README.md
pyproject.toml
optimum/commands/env.py
optimum/commands/export/neuron.py
optimum/commands/export/neuronx.py
optimum/commands/neuron/base.py
optimum/commands/neuron/cache.py
optimum/commands/neuron/subcommands.py
optimum/commands/register/register_export.py
optimum/commands/register/register_neuron.py
optimum/exporters/neuron/__init__.py
optimum/exporters/neuron/__main__.py
optimum/exporters/neuron/base.py
optimum/exporters/neuron/config.py
optimum/exporters/neuron/convert.py
optimum/exporters/neuron/model_configs.py
optimum/exporters/neuron/model_wrappers.py
optimum/exporters/neuron/utils.py
optimum/neuron/__init__.py
optimum/neuron/configuration_utils.py
optimum/neuron/hf_argparser.py
optimum/neuron/modeling.py
optimum/neuron/modeling_base.py
optimum/neuron/modeling_decoder.py
optimum/neuron/modeling_diffusion.py
optimum/neuron/modeling_seq2seq.py
optimum/neuron/modeling_traced.py
optimum/neuron/trainers.py
optimum/neuron/training_args.py
optimum/neuron/version.py
optimum/neuron/accelerate/__init__.py
optimum/neuron/accelerate/accelerator.py
optimum/neuron/accelerate/optimizer.py
optimum/neuron/accelerate/scheduler.py
optimum/neuron/accelerate/state.py
optimum/neuron/accelerate/utils/__init__.py
optimum/neuron/accelerate/utils/dataclasses.py
optimum/neuron/accelerate/utils/misc.py
optimum/neuron/accelerate/utils/operations.py
optimum/neuron/cache/__init__.py
optimum/neuron/cache/hub_cache.py
optimum/neuron/cache/optimum_neuron_cc_wrapper.py
optimum/neuron/cache/traced.py
optimum/neuron/cache/training.py
optimum/neuron/cache/entries/cache_entry.py
optimum/neuron/cache/entries/multi_model.py
optimum/neuron/cache/entries/single_model.py
optimum/neuron/generation/__init__.py
optimum/neuron/generation/logits_process.py
optimum/neuron/generation/token_selector.py
optimum/neuron/generation/utils.py
optimum/neuron/models/__init__.py
optimum/neuron/models/auto_model.py
optimum/neuron/models/neuron_config.py
optimum/neuron/models/inference/auto_models.py
optimum/neuron/models/inference/backend/__init__.py
optimum/neuron/models/inference/backend/cache.py
optimum/neuron/models/inference/backend/config.py
optimum/neuron/models/inference/backend/model_wrapper.py
optimum/neuron/models/inference/backend/pretrained_model.py
optimum/neuron/models/inference/backend/modules/autobucketing.py
optimum/neuron/models/inference/backend/modules/checkpoint.py
optimum/neuron/models/inference/backend/modules/custom_calls.py
optimum/neuron/models/inference/backend/modules/moe.py
optimum/neuron/models/inference/backend/modules/attention/__init__.py
optimum/neuron/models/inference/backend/modules/attention/attention_base.py
optimum/neuron/models/inference/backend/modules/attention/gqa.py
optimum/neuron/models/inference/backend/modules/attention/utils.py
optimum/neuron/models/inference/backend/modules/decoder/__init__.py
optimum/neuron/models/inference/backend/modules/decoder/decoder_wrapper.py
optimum/neuron/models/inference/backend/modules/decoder/modeling_decoder.py
optimum/neuron/models/inference/backend/modules/flashdecode/README.md
optimum/neuron/models/inference/backend/modules/flashdecode/utils.py
optimum/neuron/models/inference/backend/modules/generation/__init__.py
optimum/neuron/models/inference/backend/modules/generation/generation_utils.py
optimum/neuron/models/inference/backend/modules/generation/sampling.py
optimum/neuron/models/inference/backend/modules/kvcache/kv_cache_manager.py
optimum/neuron/models/inference/backend/modules/kvcache/utils.py
optimum/neuron/models/inference/backend/utils/__init__.py
optimum/neuron/models/inference/backend/utils/distributed.py
optimum/neuron/models/inference/backend/utils/random.py
optimum/neuron/models/inference/bert/__init__.py
optimum/neuron/models/inference/bert/modeling_bert.py
optimum/neuron/models/inference/clip/__init__.py
optimum/neuron/models/inference/clip/modeling_clip.py
optimum/neuron/models/inference/flux/modeling_flux.py
optimum/neuron/models/inference/flux/modules/activations.py
optimum/neuron/models/inference/flux/modules/embeddings.py
optimum/neuron/models/inference/flux/modules/normalization.py
optimum/neuron/models/inference/granite/modeling_granite.py
optimum/neuron/models/inference/llama/modeling_llama.py
optimum/neuron/models/inference/mixtral/modeling_mixtral.py
optimum/neuron/models/inference/phi3/modeling_phi3.py
optimum/neuron/models/inference/qwen2/modeling_qwen2.py
optimum/neuron/models/inference/qwen3/modeling_qwen3.py
optimum/neuron/models/inference/t5/modeling_t5.py
optimum/neuron/models/inference/whisper/__init__.py
optimum/neuron/models/inference/whisper/modeling_whisper.py
optimum/neuron/models/inference/yolos/__init__.py
optimum/neuron/models/inference/yolos/modeling_yolos.py
optimum/neuron/models/training/__init__.py
optimum/neuron/models/training/auto_models.py
optimum/neuron/models/training/checkpointing.py
optimum/neuron/models/training/config.py
optimum/neuron/models/training/loss_utils.py
optimum/neuron/models/training/modeling_auto.py
optimum/neuron/models/training/modeling_utils.py
optimum/neuron/models/training/pipeline_utils.py
optimum/neuron/models/training/transformations_utils.py
optimum/neuron/models/training/granite/__init__.py
optimum/neuron/models/training/granite/modeling_granite.py
optimum/neuron/models/training/llama/modeling_llama.py
optimum/neuron/models/training/qwen3/__init__.py
optimum/neuron/models/training/qwen3/modeling_qwen3.py
optimum/neuron/peft/__init__.py
optimum/neuron/peft/mapping.py
optimum/neuron/peft/mapping_func.py
optimum/neuron/peft/peft_model.py
optimum/neuron/peft/tuners/__init__.py
optimum/neuron/peft/tuners/lora/__init__.py
optimum/neuron/peft/tuners/lora/layer.py
optimum/neuron/peft/tuners/lora/model.py
optimum/neuron/peft/utils/__init__.py
optimum/neuron/peft/utils/save_and_load.py
optimum/neuron/pipelines/__init__.py
optimum/neuron/pipelines/diffusers/__init__.py
optimum/neuron/pipelines/diffusers/pipeline_controlnet.py
optimum/neuron/pipelines/diffusers/pipeline_controlnet_sd_xl.py
optimum/neuron/pipelines/diffusers/pipeline_utils.py
optimum/neuron/pipelines/transformers/__init__.py
optimum/neuron/pipelines/transformers/base.py
optimum/neuron/pipelines/transformers/sentence_transformers.py
optimum/neuron/utils/__init__.py
optimum/neuron/utils/argument_utils.py
optimum/neuron/utils/cache_utils.py
optimum/neuron/utils/constant.py
optimum/neuron/utils/deprecate_utils.py
optimum/neuron/utils/doc.py
optimum/neuron/utils/import_utils.py
optimum/neuron/utils/input_generators.py
optimum/neuron/utils/misc.py
optimum/neuron/utils/model_utils.py
optimum/neuron/utils/neuron_cc_wrapper
optimum/neuron/utils/neuron_parallel_compile.py
optimum/neuron/utils/optimization_utils.py
optimum/neuron/utils/patching.py
optimum/neuron/utils/require_utils.py
optimum/neuron/utils/runner.py
optimum/neuron/utils/system.py
optimum/neuron/utils/testing_utils.py
optimum/neuron/utils/torch_xla_and_neuronx_initialization.py
optimum/neuron/utils/training_utils.py
optimum/neuron/utils/trl_utils.py
optimum/neuron/utils/version_utils.py
optimum/neuron/vllm/__init__.py
optimum/neuron/vllm/model_loader.py
optimum/neuron/vllm/platform.py
optimum/neuron/vllm/plugin.py
optimum/neuron/vllm/runner.py
optimum/neuron/vllm/worker.py
optimum_neuron.egg-info/PKG-INFO
optimum_neuron.egg-info/SOURCES.txt
optimum_neuron.egg-info/dependency_links.txt
optimum_neuron.egg-info/entry_points.txt
optimum_neuron.egg-info/requires.txt
optimum_neuron.egg-info/top_level.txt
tests/test_distributed_utils.py