LICENSE
MANIFEST.in
README.md
pyproject.toml
setup.cfg
setup.py
megatron/core/__init__.py
megatron/core/enums.py
megatron/core/inference_params.py
megatron/core/jit.py
megatron/core/model_parallel_config.py
megatron/core/package_info.py
megatron/core/packed_seq_params.py
megatron/core/parallel_state.py
megatron/core/requirements.txt
megatron/core/timers.py
megatron/core/utils.py
megatron/core/datasets/__init__.py
megatron/core/datasets/bert_dataset.py
megatron/core/datasets/blended_dataset.py
megatron/core/datasets/blended_megatron_dataset_builder.py
megatron/core/datasets/blended_megatron_dataset_config.py
megatron/core/datasets/gpt_dataset.py
megatron/core/datasets/helpers.cpp
megatron/core/datasets/indexed_dataset.py
megatron/core/datasets/masked_dataset.py
megatron/core/datasets/megatron_dataset.py
megatron/core/datasets/megatron_tokenizer.py
megatron/core/datasets/multimodal_dataset.py
megatron/core/datasets/t5_dataset.py
megatron/core/datasets/utils.py
megatron/core/datasets/retro/__init__.py
megatron/core/datasets/retro/external_libs.py
megatron/core/datasets/retro/utils.py
megatron/core/datasets/retro/config/__init__.py
megatron/core/datasets/retro/config/bert_embedders.py
megatron/core/datasets/retro/config/config.py
megatron/core/datasets/retro/config/gpt_chunk_datasets.py
megatron/core/datasets/retro/config/tokenizers.py
megatron/core/datasets/retro/db/__init__.py
megatron/core/datasets/retro/db/build.py
megatron/core/datasets/retro/db/dataset.py
megatron/core/datasets/retro/db/utils.py
megatron/core/datasets/retro/index/__init__.py
megatron/core/datasets/retro/index/build.py
megatron/core/datasets/retro/index/factory.py
megatron/core/datasets/retro/index/index.py
megatron/core/datasets/retro/index/utils.py
megatron/core/datasets/retro/index/validate.py
megatron/core/datasets/retro/index/indexes/__init__.py
megatron/core/datasets/retro/index/indexes/faiss_base.py
megatron/core/datasets/retro/index/indexes/faiss_par_add.py
megatron/core/datasets/retro/query/__init__.py
megatron/core/datasets/retro/query/gpt_chunk_dataset.py
megatron/core/datasets/retro/query/multi_split_gpt_dataset.py
megatron/core/datasets/retro/query/query.py
megatron/core/datasets/retro/query/retro_dataset.py
megatron/core/datasets/retro/query/utils.py
megatron/core/dist_checkpointing/__init__.py
megatron/core/dist_checkpointing/core.py
megatron/core/dist_checkpointing/dict_utils.py
megatron/core/dist_checkpointing/mapping.py
megatron/core/dist_checkpointing/optimizer.py
megatron/core/dist_checkpointing/serialization.py
megatron/core/dist_checkpointing/utils.py
megatron/core/dist_checkpointing/strategies/__init__.py
megatron/core/dist_checkpointing/strategies/base.py
megatron/core/dist_checkpointing/strategies/filesystem_async.py
megatron/core/dist_checkpointing/strategies/state_dict_saver.py
megatron/core/dist_checkpointing/strategies/tensorstore.py
megatron/core/dist_checkpointing/strategies/torch.py
megatron/core/dist_checkpointing/strategies/two_stage.py
megatron/core/dist_checkpointing/strategies/zarr.py
megatron/core/distributed/__init__.py
megatron/core/distributed/distributed_data_parallel.py
megatron/core/distributed/finalize_model_grads.py
megatron/core/distributed/param_and_grad_buffer.py
megatron/core/fusions/__init__.py
megatron/core/fusions/fused_bias_dropout.py
megatron/core/fusions/fused_bias_geglu.py
megatron/core/fusions/fused_bias_gelu.py
megatron/core/fusions/fused_bias_swiglu.py
megatron/core/fusions/fused_layer_norm.py
megatron/core/fusions/fused_softmax.py
megatron/core/inference/__init__.py
megatron/core/inference/gpt/__init__.py
megatron/core/inference/gpt/model_specs.py
megatron/core/inference/gpt/state_dict_hooks.py
megatron/core/models/__init__.py
megatron/core/models/T5/__init__.py
megatron/core/models/T5/t5_model.py
megatron/core/models/T5/t5_spec.py
megatron/core/models/bert/__init__.py
megatron/core/models/bert/bert_layer_specs.py
megatron/core/models/bert/bert_lm_head.py
megatron/core/models/bert/bert_model.py
megatron/core/models/bert/pooler.py
megatron/core/models/common/__init__.py
megatron/core/models/common/embeddings/__init__.py
megatron/core/models/common/embeddings/language_model_embedding.py
megatron/core/models/common/embeddings/rotary_pos_embedding.py
megatron/core/models/common/language_module/__init__.py
megatron/core/models/common/language_module/language_module.py
megatron/core/models/common/vision_module/__init__.py
megatron/core/models/common/vision_module/vision_module.py
megatron/core/models/gpt/__init__.py
megatron/core/models/gpt/gpt_layer_specs.py
megatron/core/models/gpt/gpt_model.py
megatron/core/models/multimodal/__init__.py
megatron/core/models/multimodal/llava_model.py
megatron/core/models/retro/__init__.py
megatron/core/models/retro/base_attention.py
megatron/core/models/retro/config.py
megatron/core/models/retro/decoder_attention.py
megatron/core/models/retro/decoder_spec.py
megatron/core/models/retro/encoder_attention.py
megatron/core/models/retro/encoder_spec.py
megatron/core/models/retro/model.py
megatron/core/models/retro/utils.py
megatron/core/models/vision/__init__.py
megatron/core/models/vision/clip_vit_model.py
megatron/core/models/vision/multimodal_projector.py
megatron/core/optimizer/__init__.py
megatron/core/optimizer/clip_grads.py
megatron/core/optimizer/distrib_optimizer.py
megatron/core/optimizer/grad_scaler.py
megatron/core/optimizer/optimizer.py
megatron/core/optimizer/optimizer_config.py
megatron/core/pipeline_parallel/__init__.py
megatron/core/pipeline_parallel/p2p_communication.py
megatron/core/pipeline_parallel/schedules.py
megatron/core/tensor_parallel/__init__.py
megatron/core/tensor_parallel/cross_entropy.py
megatron/core/tensor_parallel/data.py
megatron/core/tensor_parallel/layers.py
megatron/core/tensor_parallel/mappings.py
megatron/core/tensor_parallel/random.py
megatron/core/tensor_parallel/utils.py
megatron/core/transformer/__init__.py
megatron/core/transformer/attention.py
megatron/core/transformer/dot_product_attention.py
megatron/core/transformer/enums.py
megatron/core/transformer/identity_op.py
megatron/core/transformer/mlp.py
megatron/core/transformer/module.py
megatron/core/transformer/spec_utils.py
megatron/core/transformer/transformer_block.py
megatron/core/transformer/transformer_config.py
megatron/core/transformer/transformer_layer.py
megatron/core/transformer/utils.py
megatron/core/transformer/custom_layers/__init__.py
megatron/core/transformer/custom_layers/transformer_engine.py
megatron/core/transformer/moe/__init__.py
megatron/core/transformer/moe/experts.py
megatron/core/transformer/moe/grouped_gemm_util.py
megatron/core/transformer/moe/moe_layer.py
megatron/core/transformer/moe/moe_utils.py
megatron/core/transformer/moe/router.py
megatron/core/transformer/moe/token_dispatcher.py
megatron_core.egg-info/PKG-INFO
megatron_core.egg-info/SOURCES.txt
megatron_core.egg-info/dependency_links.txt
megatron_core.egg-info/top_level.txt