megatron-core

View on PyPI | Reverse Dependencies (2)

0.9.0 megatron_core-0.9.0-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl
megatron_core-0.9.0-cp310-cp310-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl

Wheel Details

Project: megatron-core
Version: 0.9.0
Filename: megatron_core-0.9.0-cp311-cp311-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl
Download: [link]
Size: 1608958
MD5: 88fbaaa28dd341803bf1cb0c2fb48d32
SHA256: b2c73c9e6fa58c93f3b1833ffd32bc08dc29b5d28fda7375c5a5e3a8aaeb3db8
Uploaded: 2024-10-24 10:42:08 +0000

dist-info

METADATA

Metadata-Version: 2.1
Name: megatron_core
Version: 0.9.0
Summary: Megatron Core - a library for efficient and scalable training of transformer based models
Author: NVIDIA
Author-Email: nemo-toolkit[at]nvidia.com
Maintainer: NVIDIA
Maintainer-Email: nemo-toolkit[at]nvidia.com
Home-Page: https://github.com/NVIDIA/Megatron-LM/megatron/core
Download-Url: https://github.com/NVIDIA/Megatron-LM/releases
License: BSD-3
Keywords: deep learning,machine learning,gpu,NLP,NLU,language,transformer,nvidia,pytorch,torch
Classifier: Development Status :: 5 - Production/Stable
Classifier: Intended Audience :: Developers
Classifier: Intended Audience :: Science/Research
Classifier: Intended Audience :: Information Technology
Classifier: Topic :: Scientific/Engineering
Classifier: Topic :: Scientific/Engineering :: Mathematics
Classifier: Topic :: Scientific/Engineering :: Image Recognition
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
Classifier: Topic :: Software Development :: Libraries
Classifier: Topic :: Software Development :: Libraries :: Python Modules
Classifier: Topic :: Utilities
Classifier: License :: OSI Approved :: BSD License
Classifier: Programming Language :: Python :: 3
Classifier: Programming Language :: Python :: 3.8
Classifier: Programming Language :: Python :: 3.9
Classifier: Environment :: Console
Classifier: Natural Language :: English
Classifier: Operating System :: OS Independent
Description-Content-Type: text/markdown
License-File: LICENSE
[Description omitted; length: 2096 characters]

WHEEL

Wheel-Version: 1.0
Generator: setuptools (75.2.0)
Root-Is-Purelib: false
Tag: cp311-cp311-manylinux_2_24_x86_64
Tag: cp311-cp311-manylinux_2_28_x86_64

RECORD

Path Digest Size
megatron/core/optimizer_param_scheduler.py sha256=-PvioN4fSJ_f90ycQKdWQCZ2YvvlPzaSYrVV2GlXOdc 11410
megatron/core/packed_seq_params.py sha256=g6PiGyJVwsxP_x8jlovetWnJy0hgk4NKvxR8_JcrWbc 421
megatron/core/parallel_state.py sha256=4B0GjX_CIDTSf0rHeQntgPCbart3TmpNtP4jv1jYLZM 66502
megatron/core/config_logger.py sha256=DXgQhA0gSXwi98QXQsfNeCckoT8PMfMmlv2AWTgkjKs 3446
megatron/core/__init__.py sha256=JTHUjHpjfIjRebYW49yGYZTL3fEm9qLo27lNV-ZkqNM 905
megatron/core/package_info.py sha256=H8gP-PVCE6GZHnacTnZMvwt6g9ZmfMH_M7mQpHuoTwQ 994
megatron/core/utils.py sha256=_az2LGGEw9KbdW9_KdSR0-9T2AUnEWt06ptCelWTewI 49060
megatron/core/jit.py sha256=eve_fNxWf_sI_n0OcfRWB4dkeXrfyr-DxnsQFqwk6rE 362
megatron/core/timers.py sha256=tAc5rIyyKGVvGPxT6xyBOUJQ-kuuZJWp7_b3ZTFi8sc 14960
megatron/core/enums.py sha256=OIc-mEyKwE-d3iYoSkhAN4ch3mIrFui9cgaLrMW6j8o 205
megatron/core/inference_params.py sha256=v6FOGDJzEb4IjfcsVuakHmkMeu0kjRyWSIT_CiMUgqA 1601
megatron/core/model_parallel_config.py sha256=M-wxFmHD5LzU4rrMe3SqJOc8WLGSrSxkn1_PBFj7Gd8 13915
megatron/core/requirements.txt sha256=dNfbHaSDwcqPAHqG937D_zI4ORSupsxCb-qK3EVKDuI 16
megatron/core/README.md sha256=pq0pdMfbLIqupJ8TNH6rNa2uO7HFoLsOKtTJAjOPjDA 2096
megatron/core/num_microbatches_calculator.py sha256=5fanLEPDzQ3prrE_7E6mGVPsUCRV5f7cuajRo5XC-94 18748
megatron/core/fusions/fused_bias_dropout.py sha256=wlMrWpQehmP3N4M9pDTd_KrkztprCfoxD6CiiikX_24 2895
megatron/core/fusions/fused_layer_norm.py sha256=5gFtgiAcIPxSf5Ns_9aHv-MiiGYK4CrCwNPRwYG2WwA 5687
megatron/core/fusions/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/fusions/fused_softmax.py sha256=Hicykgpfoaf7dU2WSw1Z7dRp7q4T83ClOeNMTqg91yw 7623
megatron/core/fusions/fused_bias_geglu.py sha256=6JmbmIno-yESd4mf2DfCvvouIvnrx1772Q2NJABQSOY 2361
megatron/core/fusions/fused_bias_gelu.py sha256=RsbZdwWHScFPX_I-smDXjj4Wv2BGgbP_Cb3XI3wriqM 1544
megatron/core/fusions/fused_bias_swiglu.py sha256=8zqeEnXUkBOpKKt4fR9p9hqGXvGllaMo38Dc55bDvLY 2676
megatron/core/fusions/fused_cross_entropy.py sha256=Y5CtT3FARxSrXUYDzF0Vth9wuU82CORexHfuXlByCZA 4922
megatron/core/datasets/indexed_dataset.py sha256=rVD_o6UpbKZhFNE3Z6gHRiGdnzKZI04l90DzVhlS1S4 30341
megatron/core/datasets/blended_megatron_dataset_builder.py sha256=II3B-avMGCLkyEW4scKDQsdp7NsA-UrezdJMr6tatpo 22764
megatron/core/datasets/helpers.cpp sha256=KKM2v_374A0Ysmzf2MtofpwjwBhD2H6eNFH-y2bW1GE 29557
megatron/core/datasets/blended_megatron_dataset_config.py sha256=kBfW-zggz_kec16gp7_IW7ok8ZfiEQCl1JVR9STU6hc 7259
megatron/core/datasets/t5_dataset.py sha256=HG_dEvJFAvNqZzavULoU32f6mzMg-W3d37AJjSnpLZs 8256
megatron/core/datasets/masked_dataset.py sha256=wqKatuyvhqluIkfeZy5BNAwkX3wms7LOrXnHg6C3sA4 17006
megatron/core/datasets/megatron_dataset.py sha256=ft7s9cw-x9nEtvnjwwkKkN6fjVtMguISSaoku0TscsU 4974
megatron/core/datasets/bert_dataset.py sha256=g2AGIVkXWXsBpi1eINxt0mjj8GOZVORbUXkX_u845xo 7108
megatron/core/datasets/multimodal_dataset.py sha256=lRpC4GOlCElrDTOeE4sVhE5WARhfzWmYvr6FuXBR_Os 1907
megatron/core/datasets/megatron_tokenizer.py sha256=Jt5dD0KdfIO97qtVe6CgnKmfMBFbzhNLmYaynvi09QE 3839
megatron/core/datasets/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/datasets/helpers.cpython-311-x86_64-linux-gnu.so sha256=CnFjtWTeRh-SQ36Qw0vY45o0KSmeYemUZTTqu08hMMU 4351736
megatron/core/datasets/gpt_dataset.py sha256=D2Fsa92S0rw0sseMHhBAI3PAVoZDKYagEAt0x5AhDqA 28565
megatron/core/datasets/utils.py sha256=Yp28I9bICWNghUhwL5zZ7MTFQSBraNKgGCJ29g7DkaI 2723
megatron/core/datasets/blended_dataset.py sha256=N2kBArSO5QXsz4Y-XpBkU5aS752eGAMr6jy7dQ_xnBA 8042
megatron/core/datasets/utils_s3.py sha256=mV-o5-A9TLomVz2QTlLPPR7_pTFEBRi-oYOe-Xrl1AQ 5224
megatron/core/datasets/retro/__init__.py sha256=qRMVBbNTh1tNiF3dboxFUPbwrt52EX0U0rxuhEYjUts 251
megatron/core/datasets/retro/utils.py sha256=MEgioRidXAtclkSa8yoR-dzYuPIC2XY_qga8BY4klgY 12328
megatron/core/datasets/retro/external_libs.py sha256=gvzZaGQ3s-Y4OIsXlfw-xDE2GCAFPOgPp_U0sIj0ggk 491
megatron/core/datasets/retro/query/gpt_chunk_dataset.py sha256=uqErXLrpGie4V-NLvfbYayBlLCVehcUmZO8AY4MYOCA 3816
megatron/core/datasets/retro/query/query.py sha256=MfJm4v_fA4MJDs2bbvfz1rM_Kx2BrG6bQCM60MlXl2U 14313
megatron/core/datasets/retro/query/__init__.py sha256=k_Cvc2yxTe93EhbgoQAhhk7CNTjCzLm8sws66Jj55n4 64
megatron/core/datasets/retro/query/utils.py sha256=CcQklrl2ZwTDOXiYmSpDi_vCLO61vc1VjvK5IRfvSGw 1111
megatron/core/datasets/retro/query/retro_dataset.py sha256=rFDmREle7pUq7EbTY8LBFq5VE3PFXqa8JSoMFN3ch6k 9300
megatron/core/datasets/retro/query/multi_split_gpt_dataset.py sha256=7LG94UYT6OTgMgY0F2bk0_S9KQWsWj_mgHE8kSB8dsc 4198
megatron/core/datasets/retro/index/index.py sha256=4QAOYnerl_TUKZ0nLVH2zQhgPZXmLH75603oON9d_8k 4943
megatron/core/datasets/retro/index/__init__.py sha256=hm55AK1FGTWvuaNriGg1WgV0-T0F9NAygBRR61TThPM 317
megatron/core/datasets/retro/index/factory.py sha256=J5BclHsqQLwz24g_ClAiHlPX3G9yS0GMtv30nXh-dr0 1375
megatron/core/datasets/retro/index/validate.py sha256=yuHAQN3zM_wZW7-eI9Nv9KCMpRlzTNIup5r8WZrAoSI 6071
megatron/core/datasets/retro/index/utils.py sha256=3mKYb4Lk5V8GlYFA01tdjKO5xMoCU3-5JNnA5hfoQUw 3964
megatron/core/datasets/retro/index/build.py sha256=Aeuqkv-TBGdgzJuZR0ukPjh-cB6d27XES7rJ09xB5Zw 9249
megatron/core/datasets/retro/index/indexes/faiss_base.py sha256=mCJ88s0bNXyQHfyWYvQkgLrAmHA-adrAr162pyd3Ud0 4987
megatron/core/datasets/retro/index/indexes/faiss_par_add.py sha256=fa1T_PYNRhw7dBtOliRCmKAxa-oga688cRrloOQ6TB4 7551
megatron/core/datasets/retro/index/indexes/__init__.py sha256=YftO_ZxhxOzW61fD2Ga2-Ebx7UtyVrr7dWHDt4PoH4Q 285
megatron/core/datasets/retro/db/__init__.py sha256=WdGDuNtiJ5_-H27yxJyDfGxdgECk0k3E_OiHVuFK44M 182
megatron/core/datasets/retro/db/utils.py sha256=Kc3UQojOTS4kqol722q3m9v2lMs_UoIM7WEY_hVYxDk 12740
megatron/core/datasets/retro/db/dataset.py sha256=uloEiS07M8vX8O2ikchyiX9Ed7zDO747WbfHwXFrWq0 3569
megatron/core/datasets/retro/db/build.py sha256=wYmRkDAlcu3cP6U9VN6btnMp6j3jEDZOnNV6AYNoDMo 23738
megatron/core/datasets/retro/config/config.py sha256=Gr2UTnVwN7qD6jnwdh46Aslw6ZBIJuKLWDPI9IG7ghg 9117
megatron/core/datasets/retro/config/tokenizers.py sha256=H8SprrOWcSCXOA1vLdgBMt1umbAYgr4MgQUCb3foFpQ 385
megatron/core/datasets/retro/config/__init__.py sha256=IffC2zcSCB_YEVBoJKTmucCl8Agq_xYkgOv3WIxDmAk 634
megatron/core/datasets/retro/config/gpt_chunk_datasets.py sha256=UuwnMf0VQBobCgAHyVudbrrosE61FQByIaJB3sxto2k 417
megatron/core/datasets/retro/config/bert_embedders.py sha256=QdLlK05x-oPoUlxXk60v1N42hc6LYOk7kBoFmLzxoCE 1327
megatron/core/optimizer/optimizer.py sha256=IlkZkqWLaJGOs8y7XobFNS3ffgbhLKE6S9Dd3Kmvn8Q 41443
megatron/core/optimizer/clip_grads.py sha256=SWwhGGhyfunASpxjN6NqcPBJ1Tnax-1G7DdzPEztC_o 6847
megatron/core/optimizer/__init__.py sha256=VxWx1TwCnwLX9Q_6vLzV3wyXd0e0dcC1hJIBh5oftoY 17352
megatron/core/optimizer/distrib_optimizer.py sha256=sKIM6C94G-Rh7ApyTLGL1MrYkm-9k6oJKhQKxjXcFN8 88131
megatron/core/optimizer/grad_scaler.py sha256=wvNBlVyDM71uJVT8x8NPdOd2sLG9TOS8tTrdmlSgV4I 5161
megatron/core/optimizer/optimizer_config.py sha256=F0jQrEFs5XwMQcCbNEyLotDmZhwk_jG3bZl5MqSIxyk 4041
megatron/core/extensions/transformer_engine.py sha256=-kAGnccpTO-U85Cvl64OcgEpPRMeF2hKX8xKkU-Z_HI 39023
megatron/core/extensions/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/inference/__init__.py sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI 63
megatron/core/inference/scheduler.py sha256=xGMK0Jm7U3kPFtwFD_Ctpx7sXs3VPZ-ZKzx4teQqtVM 5056
megatron/core/inference/inference_request.py sha256=lKKi_1FBItZLmlZ6AXIfIqzl2HMp-_ElwoN_nE2t960 739
megatron/core/inference/utils.py sha256=vmPJSvR9BfsK_765P0jks7dF4WBXs8_y0j8dNLkeDZk 427
megatron/core/inference/communication_utils.py sha256=uF88r7Nqhkmuyh8mhrm1zZL2w6H1x0FCtdNYlkrT-kc 1787
megatron/core/inference/common_inference_params.py sha256=w9MknNQjHTGu5B3fKYyjLZyk_Jt72TEHT0BqG4Acew0 1139
megatron/core/inference/model_inference_wrappers/inference_wrapper_config.py sha256=dff7Zt8MexhbR0KwJNEVk2glOZFXX4dKmCmxPBQRCBU 1527
megatron/core/inference/model_inference_wrappers/abstract_model_inference_wrapper.py sha256=nXirWtpE0HrZ-QG1pz4_gu-rxhHaZbmcqUUP11WvJuI 10649
megatron/core/inference/model_inference_wrappers/__init__.py sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI 63
megatron/core/inference/model_inference_wrappers/gpt/__init__.py sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI 63
megatron/core/inference/model_inference_wrappers/gpt/gpt_inference_wrapper.py sha256=vECFVElbSa_QFFlworrGt8Lu-qJ2UV_VyWF4xRqVHHw 3638
megatron/core/inference/engines/abstract_engine.py sha256=NzmE2s4mlNFGI3MwbVM_-H9EoPAd9olzvaior2oq8fM 521
megatron/core/inference/engines/__init__.py sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI 63
megatron/core/inference/engines/mcore_engine.py sha256=5RDjJKoPm4xjA07f82bbzxncSNQg4wwQfQLWHQBt5QQ 4059
megatron/core/inference/ammo_support/__init__.py sha256=KV8WsGuGugoVAf-PpIoFMlqrr8D5r4InTnrAK2aqEt4 300
megatron/core/inference/ammo_support/gpt/state_dict_hooks.py sha256=D7qIpflYCnGfcB8BbC_AsIMelJ-V114LXHFAAm53jKY 231
megatron/core/inference/ammo_support/gpt/model_specs.py sha256=y7i0CR-QcDt8EBhyu_ZZCweoh9EZ0WhyqeiX0DZXB3E 160
megatron/core/inference/text_generation_controllers/__init__.py sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI 63
megatron/core/inference/text_generation_controllers/simple_text_generation_controller.py sha256=pWEMBdr1H2jG1b5AZ_QJMhT-VZWgNiuS3RyGnEE9zdE 17675
megatron/core/inference/modelopt_support/__init__.py sha256=Dj52aVe2p55UV9c5lCjD0op6sQvn46SBFi4LBODHBI4 584
megatron/core/inference/modelopt_support/gpt/state_dict_hooks.py sha256=jOechATpv6xOlb9swq8DxiA3jvyIRMUXMTp3jqfpZ58 5549
megatron/core/inference/modelopt_support/gpt/__init__.py sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI 63
megatron/core/inference/modelopt_support/gpt/model_specs.py sha256=AwLdV0tGx_Z1pVe_t6Ht68yLbxaGVY-liAaxAigtAR4 2588
megatron/core/tensor_parallel/__init__.py sha256=mE3W1UiVgbkZ1dAmyUanArOwllfw1cxgJ4i5i3jcsRI 2600
megatron/core/tensor_parallel/cross_entropy.py sha256=WY8ogQYZggl0sgGlKyW0ZUM3Af_n4wDaWLx7K85TgD4 9067
megatron/core/tensor_parallel/data.py sha256=B1eYjFFuElvlmZFy8AAGE0Q0b6AjIIXQl4toYFLseSk 3365
megatron/core/tensor_parallel/utils.py sha256=FYCQzKmRpJVavdJNd-gr-BTjxZNZaonZSX93MNiRbJ8 4105
megatron/core/tensor_parallel/mappings.py sha256=mwF2jbQZShoBV45j8fYrDXVk8NfxwLPEoUBZqJFheI0 21168
megatron/core/tensor_parallel/random.py sha256=YocKplkHrb2jno1EaiE5CSHGZWxGLER2fjfyLesByn0 11738
megatron/core/tensor_parallel/layers.py sha256=hJcNgZ-cWw5HNkNVzEbR2iHBGPOht4ZEdKnSM76rIUA 46226
megatron/core/transformer/dot_product_attention.py sha256=Oc7Epk8hPRwDkAXNSUw-GQ8kq7GjI5MeCDTD8fTK86c 7903
megatron/core/transformer/module.py sha256=UK-YaNBOsMYDoDo0HcHEICOs_NUlzdiJ7WM0cL8tgnE 7096
megatron/core/transformer/spec_utils.py sha256=cq2u5dNgZnJIH8WO019qFnfbSSNpR1O8Z9bMA5hCY5E 4057
megatron/core/transformer/mlp.py sha256=-8S2IjkT4OXg0D9FPyL4YSHs_fwsBco13FB5PJ3-l_8 10126
megatron/core/transformer/__init__.py sha256=XpcTTt2xON-6IFG6h4uipx3c0U5HvJkuZmwnOh1frJY 274
megatron/core/transformer/torch_layer_norm.py sha256=aebSLqgCUFPQF4oiGyb51Nz54pHzEYJD_exP09XeNCI 1477
megatron/core/transformer/cuda_graphs.py sha256=O0Uim7f63ES_ufuCvE5WtdjY_f-Fr8O26BfPOcAyExI 12827
megatron/core/transformer/utils.py sha256=dUCethYv_7ekoB884x3_vmIKuYY6T4nm9uEqo2uWe9E 6943
megatron/core/transformer/identity_op.py sha256=w35Qyy0lmN-huMJhQF-Cq29R9gTIfkklKi4TKsWEm1c 713
megatron/core/transformer/attention.py sha256=2VjlgyLLCl7UoAd_RVxGx5aGQ9SL_oM0z_-KP6nOg8o 21537
megatron/core/transformer/enums.py sha256=9JtRWcLSNZjw-HnhGKLTeNyaXpagefN4aue2pICicBo 533
megatron/core/transformer/transformer_block.py sha256=MRN9mC45Z5KS06rU_vgoLuNX1PmPCYYGO5VGZuoyaUs 24376
megatron/core/transformer/transformer_layer.py sha256=lYlIMsBzh5Aw28bT7LawHuF8yMD6FfAQMoIBZ_i8UMQ 16060
megatron/core/transformer/transformer_config.py sha256=nvevgeXEM3iZMjeb7uOfb8oJ_-u4jh7OIdPSirxt0Qo 21845
megatron/core/transformer/moe/upcycling_utils.py sha256=5JS28SJvF1TS3WjwGhrWrEwKz8cSkTo2bDB97E7LH6I 8588
megatron/core/transformer/moe/legacy_a2a_token_dispatcher.py sha256=6NZUQG2txs2udl6AKbckQfnAmKIvNZBmKQNqt9nK7EA 14232
megatron/core/transformer/moe/grouped_gemm_util.py sha256=GYzirbRITTUzRUmOgsP9UVAFSsL0UV_DeCu8LpzIwG4 591
megatron/core/transformer/moe/router.py sha256=LnSPO5khsRn6MzW9Fa8C7I16LlLmM1b6U50rLoKPHu4 11325
megatron/core/transformer/moe/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/transformer/moe/moe_layer.py sha256=9fOKHeAC60QXrpoboiDvz9d-KAOsarUD0DoK9r1_TMI 5446
megatron/core/transformer/moe/experts.py sha256=KYWwcrme1-q8KiSoEiA20a7SVomg6APiGrcUVBERB3k 25611
megatron/core/transformer/moe/moe_utils.py sha256=V1L3hPOaac50TaIZD2xKVePlVSPiXjXtFDiFYzYEQQs 23504
megatron/core/transformer/moe/token_dispatcher.py sha256=nCZmOjXxYOi4jmEvXK9I92zJxw2geklazPhR6DUv0Wc 27572
megatron/core/transformer/custom_layers/transformer_engine.py sha256=QiuumLn4vXdPwX7QqAGJwg_CwFku6DQ7ZYcMnWAOSB0 402
megatron/core/transformer/custom_layers/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/ssm/mamba_mixer.py sha256=eEngsZOeK5X5IV2gn9e-7PUWQbtpokvY6S1ay1B61Eo 27707
megatron/core/ssm/mamba_layer.py sha256=7cvnlwnWfT9XoWZ4fp5ZZFEK_cjhsvvyTV6xon7OceE 2843
megatron/core/ssm/mamba_block.py sha256=wRo4LDACMJ1DwgycgCpmmHycSqNk0sFQqYZcEnkOlb4 13929
megatron/core/ssm/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/ssm/triton_cache_manager.py sha256=tBnvVoaasrYpF2e-xF8ELYOl1ldwpkvwhAvK3gFzmsA 1598
megatron/core/ssm/mamba_hybrid_layer_allocation.py sha256=PwfjUnFcLmQQBcONy6hL16j-ooYKgpGwiJY0e7-OrLA 7136
megatron/core/models/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/multimodal/llava_model.py sha256=9J1aYP6IcUnCqwNhhLC9UK4pumSauPL4cJw8KnFtYtQ 26457
megatron/core/models/multimodal/__init__.py sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI 63
megatron/core/models/multimodal/llava_spec.py sha256=AYDn1cNWDDxC95KD2YwIaduHv0uTy8fCxmKppoO66Zo 3443
megatron/core/models/retro/encoder_attention.py sha256=-78pUkEfSkpfGGIANTYPxGOVurybSpidmv8p96t9UOg 8028
megatron/core/models/retro/config.py sha256=8vrOypZs46yk4io5omiSH6wWsUbLTYFo9VJ2NicrMus 3084
megatron/core/models/retro/__init__.py sha256=wBWEz9cWtITwx_zWX9NXZQMnVXp6ADm6cR9bXfU-56w 371
megatron/core/models/retro/decoder_attention.py sha256=-gs_1mUgR42XPcTSj9wffHloeOAjFONOVxbxbIkpP5o 11420
megatron/core/models/retro/base_attention.py sha256=0qn1cwvJLi2uGC87npnCFzj5pfZLSg2CNIbLytD0HFU 1596
megatron/core/models/retro/utils.py sha256=yhI3b4VcURObUqw1_Iw_HIJ-ENMBQG2qjubYVa0PANo 749
megatron/core/models/retro/model.py sha256=MQa_OeLqNg3rqGUCxY19NMvcT7S0qZ0fZWHTb4oHe_A 3760
megatron/core/models/retro/decoder_spec.py sha256=axTr9NC3wfKnAYpTaWZKmXibF1sw9TpEmR-lQUtIi5g 6695
megatron/core/models/retro/encoder_spec.py sha256=Vj-4CURBlOXs217f8tzP9MaC0rI8DFSjezOW5cns57E 6249
megatron/core/models/T5/t5_spec.py sha256=_oXkG9L86EzOOuIMIywptLhI7LDiF02pfKlDtWphqyU 9065
megatron/core/models/T5/t5_model.py sha256=N0tL3px7Imvz1J6w3NrASOGxexyKwt_2W7jenJjw47Q 16138
megatron/core/models/T5/__init__.py sha256=PidBNqxDgX7sIVX0wm9lX6AHDpBNJV51Q_vHl3Cs8a4 93
megatron/core/models/vision/vit_layer_specs.py sha256=nMe89KuRfyHx7CZrbudwiH-0A1G20wFq7y5Gof3fh-U 3514
megatron/core/models/vision/clip_vit_model.py sha256=EcmSxebpyamDnWIWgKD1Maq67gAltRtKJM0T5HjNsqU 6277
megatron/core/models/vision/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/vision/multimodal_projector.py sha256=LhkwtIyIjWvzNQfmHWrwnn0z-vcS0P7gZ6XWguEQYnA 2631
megatron/core/models/mamba/mamba_layer_specs.py sha256=mb_H0BWYi9Pt4jwHGRxImzy4Xsdbjdj3b8ds_kVrq94 2815
megatron/core/models/mamba/__init__.py sha256=cCEAU0SMUgMgV7W6PbyEiP1UvAN-l0V6HcV7kGnHy9g 99
megatron/core/models/mamba/mamba_model.py sha256=5ByebL_4DRKQspyiS8zgpU1TaQZZzsGPX_zLWRwU3p0 10198
megatron/core/models/gpt/gpt_layer_specs.py sha256=a3woPO_MnVK199ifWJnWUiUkR9AEebLNbRlOwNptWK4 6663
megatron/core/models/gpt/__init__.py sha256=Vs2iy0MeLf3CISnsQiam9V964paf77a0GiXgoAEVZvw 95
megatron/core/models/gpt/gpt_model.py sha256=8n2sw3eSYejmt5J0f3niGDC6PaYJBwZ0xH59l5YPAI8 12161
megatron/core/models/common/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/common/embeddings/rotary_pos_embedding.py sha256=S-91zAdKhndXMnrpIN8mhFoqFhcWYSqHVU38h1bxvCQ 9425
megatron/core/models/common/embeddings/language_model_embedding.py sha256=BFmfe8IjRFRVfYI3UaexNKi-smR1F9YDpeFHC9XD8WQ 5731
megatron/core/models/common/embeddings/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/common/language_module/language_module.py sha256=k1IekDw27glal8WESBpKILLZjlVJO2pPouuQQxeEp4Q 9251
megatron/core/models/common/language_module/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/common/vision_module/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/common/vision_module/vision_module.py sha256=SUwBfItrNKZdEHtw_NCCRgF0PBsaBX_lqTAnPpC4zCE 635
megatron/core/models/bert/bert_model.py sha256=809DO6dcWAeooNurruFQFJpGlWKm39on4Oejq0_4AeE 15931
megatron/core/models/bert/pooler.py sha256=-QAoY3T-SMDUz4p4uZ-FveF01bPB2cw9WwVtAR_8-kM 1886
megatron/core/models/bert/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/bert/bert_lm_head.py sha256=QQpqm0YmvZgkJoZZbPvnbMkHnJDljmFLjoqFyM2AnVk 1723
megatron/core/models/bert/bert_layer_specs.py sha256=zoHf-F28XAqQBmts1ue0MNwYyVzab-nTI1goDqWiewA 3455
megatron/core/distributed/finalize_model_grads.py sha256=qeb58K0FgarwfBifoXQfIGtN_QOqXgJUsA4Bc0xWw7U 6900
megatron/core/distributed/distributed_data_parallel_config.py sha256=WV1bmMgE75qaMS3Fgq9bCmPRW3vAEJJ7qYeapUqY7GY 1728
megatron/core/distributed/distributed_data_parallel.py sha256=enbmHZ-OkOqmwn69v0YQ5Sq4U9FRhP1zb9CoxPf-S1w 22018
megatron/core/distributed/__init__.py sha256=-cN5nE1vEvnbW_2YDa36y_mhzuS3Wb8tW1FRRrDZOYg 525
megatron/core/distributed/param_and_grad_buffer.py sha256=-iSeffbaOxUJjXP46h_1V2vuocAVBZizolJ5b2Gs_qI 33780
megatron/core/pipeline_parallel/__init__.py sha256=W84Ic3_NAV9s_YXvgKaYcv2-uUd0T8e9ZPalT0PA1wM 112
megatron/core/pipeline_parallel/p2p_communication.py sha256=IRXgmmWlmHbt9bsyX7cjfsZ4kpqMLlbB_JdA3LG8pfU 22274
megatron/core/pipeline_parallel/schedules.py sha256=5ZqcVtME9LJzlkRmWD0dStcGBOTTqBS6DuKdsfoXXv0 64946
megatron/core/dist_checkpointing/optimizer.py sha256=X-rrX0qKrTr5buFq6xYJuaXSYTC-tidUTON1nbZfenw 5483
megatron/core/dist_checkpointing/mapping.py sha256=G5jlP-bEgf23OLgwhCZI2_HMrdeqRJzcwBOtm7vtIk4 28454
megatron/core/dist_checkpointing/dict_utils.py sha256=GjZ0esYOH7gkOHYKk6pe1BsNhSF-ADmdrWqB3_Wp8z0 9006
megatron/core/dist_checkpointing/exchange_utils.py sha256=wyIdJ_nfuGKwOe9TitR7zpV37JngN5CdSanF1fU0PGE 22733
megatron/core/dist_checkpointing/__init__.py sha256=KTsvwvVpJVEZW2gQLxGFZgjNUXJJcamMKr_o-P0wjnA 336
megatron/core/dist_checkpointing/core.py sha256=X-xJIGAuv8SQhvQIyuJl6wL07u_fwSh_TPiRnhQ8i3A 2182
megatron/core/dist_checkpointing/state_dict_transformation.py sha256=H5BV8fmrH9nUhckzJTded8Ugkg_xZA84yx9k3kcUDUc 10477
megatron/core/dist_checkpointing/serialization.py sha256=-3jebM0QkSaVUH_h8dEzT7N3yof2bfrp16Qv5aThKss 17306
megatron/core/dist_checkpointing/utils.py sha256=2ApsjlpcOfjPnFlMkqpglua-OltcMo6cuoUPcsrqTWc 7876
megatron/core/dist_checkpointing/validation.py sha256=h2NlH-0Vmlh1VjJ6lZA9egEO0lmk74i_HT2rq7N-Uho 22112
megatron/core/dist_checkpointing/strategies/common.py sha256=Q2kluMk0JVfs35z_wgBfCiNSi8tQ1NF_Agd20FdM2uM 6173
megatron/core/dist_checkpointing/strategies/async_utils.py sha256=XXK0mzmexnz1786UUUFRKFBW9kN6Oq7D011PHCPGm2w 8409
megatron/core/dist_checkpointing/strategies/state_dict_saver.py sha256=UycrUTqeBuWLIBOSAO6rzevLUKbUG42qXuIqJP9Q7Oo 6938
megatron/core/dist_checkpointing/strategies/fully_parallel.py sha256=y-uVTroG0ElVU8S2PE2djDEiuXPJb0G2lzQozSAUHh8 18944
megatron/core/dist_checkpointing/strategies/base.py sha256=McYIrlPN_0-yrIGVtoIoo81mZOlpA_cWK99qpA7DCDo 8178
megatron/core/dist_checkpointing/strategies/__init__.py sha256=jUZuiVe1Flxld2HmcduP475MtoqIIUef8yrdg_DouyU 316
megatron/core/dist_checkpointing/strategies/tensorstore.py sha256=OT4q3y82i1gEu8LpnWEoikN8NNZev4O43XEGLMAi-lE 4765
megatron/core/dist_checkpointing/strategies/two_stage.py sha256=1ZRUYf-yzJQWvXac99pu98_mLzuwkhmhttKbH-Dkhng 10160
megatron/core/dist_checkpointing/strategies/torch.py sha256=S1csE_s0cxkEmxF_a_hHGuJ5x7Je6kk7pJquuKdQTuc 35363
megatron/core/dist_checkpointing/strategies/filesystem_async.py sha256=UjlwigclM8EmjrMrNPAQjS0fA0R4Z2vym6-SD_hyq-U 14637
megatron/core/dist_checkpointing/strategies/resharding.py sha256=HuUl-6FY52E3IgaBPGj0aD1cgjR73hKWd18ORC8hMd4 13090
megatron/core/dist_checkpointing/strategies/zarr.py sha256=hquh4apuhgeXx13oT7k06FOHreK-RSTDWmnXS-X6p2c 11492
megatron_core-0.9.0.dist-info/top_level.txt sha256=OEOs4V4xHotpQFOUHkfPkLmqcuKfSffSlV17EmZVBjg 9
megatron_core-0.9.0.dist-info/LICENSE sha256=S9UMoyZlNvYp9CHuKhuT2Or5L7idfS9Y_t_pAtaMaOg 14692
megatron_core-0.9.0.dist-info/WHEEL sha256=UCJN9pzXq2OrEh3slrcZ0BR8J6AybiEimpKIcvW2yn0 152
megatron_core-0.9.0.dist-info/RECORD
megatron_core-0.9.0.dist-info/METADATA sha256=FwoKOFr2Ag7KgPjnGBCByuy__X0wjP6RfC3lQGL_JIE 3588

top_level.txt

megatron