Path |
Digest |
Size |
megatron/core/optimizer_param_scheduler.py |
sha256=-PvioN4fSJ_f90ycQKdWQCZ2YvvlPzaSYrVV2GlXOdc
|
11410 |
megatron/core/packed_seq_params.py |
sha256=g6PiGyJVwsxP_x8jlovetWnJy0hgk4NKvxR8_JcrWbc
|
421 |
megatron/core/parallel_state.py |
sha256=4B0GjX_CIDTSf0rHeQntgPCbart3TmpNtP4jv1jYLZM
|
66502 |
megatron/core/config_logger.py |
sha256=DXgQhA0gSXwi98QXQsfNeCckoT8PMfMmlv2AWTgkjKs
|
3446 |
megatron/core/__init__.py |
sha256=JTHUjHpjfIjRebYW49yGYZTL3fEm9qLo27lNV-ZkqNM
|
905 |
megatron/core/package_info.py |
sha256=H8gP-PVCE6GZHnacTnZMvwt6g9ZmfMH_M7mQpHuoTwQ
|
994 |
megatron/core/utils.py |
sha256=_az2LGGEw9KbdW9_KdSR0-9T2AUnEWt06ptCelWTewI
|
49060 |
megatron/core/jit.py |
sha256=eve_fNxWf_sI_n0OcfRWB4dkeXrfyr-DxnsQFqwk6rE
|
362 |
megatron/core/timers.py |
sha256=tAc5rIyyKGVvGPxT6xyBOUJQ-kuuZJWp7_b3ZTFi8sc
|
14960 |
megatron/core/enums.py |
sha256=OIc-mEyKwE-d3iYoSkhAN4ch3mIrFui9cgaLrMW6j8o
|
205 |
megatron/core/inference_params.py |
sha256=v6FOGDJzEb4IjfcsVuakHmkMeu0kjRyWSIT_CiMUgqA
|
1601 |
megatron/core/model_parallel_config.py |
sha256=M-wxFmHD5LzU4rrMe3SqJOc8WLGSrSxkn1_PBFj7Gd8
|
13915 |
megatron/core/requirements.txt |
sha256=dNfbHaSDwcqPAHqG937D_zI4ORSupsxCb-qK3EVKDuI
|
16 |
megatron/core/README.md |
sha256=pq0pdMfbLIqupJ8TNH6rNa2uO7HFoLsOKtTJAjOPjDA
|
2096 |
megatron/core/num_microbatches_calculator.py |
sha256=5fanLEPDzQ3prrE_7E6mGVPsUCRV5f7cuajRo5XC-94
|
18748 |
megatron/core/fusions/fused_bias_dropout.py |
sha256=wlMrWpQehmP3N4M9pDTd_KrkztprCfoxD6CiiikX_24
|
2895 |
megatron/core/fusions/fused_layer_norm.py |
sha256=5gFtgiAcIPxSf5Ns_9aHv-MiiGYK4CrCwNPRwYG2WwA
|
5687 |
megatron/core/fusions/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/fusions/fused_softmax.py |
sha256=Hicykgpfoaf7dU2WSw1Z7dRp7q4T83ClOeNMTqg91yw
|
7623 |
megatron/core/fusions/fused_bias_geglu.py |
sha256=6JmbmIno-yESd4mf2DfCvvouIvnrx1772Q2NJABQSOY
|
2361 |
megatron/core/fusions/fused_bias_gelu.py |
sha256=RsbZdwWHScFPX_I-smDXjj4Wv2BGgbP_Cb3XI3wriqM
|
1544 |
megatron/core/fusions/fused_bias_swiglu.py |
sha256=8zqeEnXUkBOpKKt4fR9p9hqGXvGllaMo38Dc55bDvLY
|
2676 |
megatron/core/fusions/fused_cross_entropy.py |
sha256=Y5CtT3FARxSrXUYDzF0Vth9wuU82CORexHfuXlByCZA
|
4922 |
megatron/core/datasets/indexed_dataset.py |
sha256=rVD_o6UpbKZhFNE3Z6gHRiGdnzKZI04l90DzVhlS1S4
|
30341 |
megatron/core/datasets/blended_megatron_dataset_builder.py |
sha256=II3B-avMGCLkyEW4scKDQsdp7NsA-UrezdJMr6tatpo
|
22764 |
megatron/core/datasets/helpers.cpp |
sha256=KKM2v_374A0Ysmzf2MtofpwjwBhD2H6eNFH-y2bW1GE
|
29557 |
megatron/core/datasets/blended_megatron_dataset_config.py |
sha256=kBfW-zggz_kec16gp7_IW7ok8ZfiEQCl1JVR9STU6hc
|
7259 |
megatron/core/datasets/t5_dataset.py |
sha256=HG_dEvJFAvNqZzavULoU32f6mzMg-W3d37AJjSnpLZs
|
8256 |
megatron/core/datasets/masked_dataset.py |
sha256=wqKatuyvhqluIkfeZy5BNAwkX3wms7LOrXnHg6C3sA4
|
17006 |
megatron/core/datasets/megatron_dataset.py |
sha256=ft7s9cw-x9nEtvnjwwkKkN6fjVtMguISSaoku0TscsU
|
4974 |
megatron/core/datasets/bert_dataset.py |
sha256=g2AGIVkXWXsBpi1eINxt0mjj8GOZVORbUXkX_u845xo
|
7108 |
megatron/core/datasets/multimodal_dataset.py |
sha256=lRpC4GOlCElrDTOeE4sVhE5WARhfzWmYvr6FuXBR_Os
|
1907 |
megatron/core/datasets/megatron_tokenizer.py |
sha256=Jt5dD0KdfIO97qtVe6CgnKmfMBFbzhNLmYaynvi09QE
|
3839 |
megatron/core/datasets/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/datasets/helpers.cpython-311-x86_64-linux-gnu.so |
sha256=CnFjtWTeRh-SQ36Qw0vY45o0KSmeYemUZTTqu08hMMU
|
4351736 |
megatron/core/datasets/gpt_dataset.py |
sha256=D2Fsa92S0rw0sseMHhBAI3PAVoZDKYagEAt0x5AhDqA
|
28565 |
megatron/core/datasets/utils.py |
sha256=Yp28I9bICWNghUhwL5zZ7MTFQSBraNKgGCJ29g7DkaI
|
2723 |
megatron/core/datasets/blended_dataset.py |
sha256=N2kBArSO5QXsz4Y-XpBkU5aS752eGAMr6jy7dQ_xnBA
|
8042 |
megatron/core/datasets/utils_s3.py |
sha256=mV-o5-A9TLomVz2QTlLPPR7_pTFEBRi-oYOe-Xrl1AQ
|
5224 |
megatron/core/datasets/retro/__init__.py |
sha256=qRMVBbNTh1tNiF3dboxFUPbwrt52EX0U0rxuhEYjUts
|
251 |
megatron/core/datasets/retro/utils.py |
sha256=MEgioRidXAtclkSa8yoR-dzYuPIC2XY_qga8BY4klgY
|
12328 |
megatron/core/datasets/retro/external_libs.py |
sha256=gvzZaGQ3s-Y4OIsXlfw-xDE2GCAFPOgPp_U0sIj0ggk
|
491 |
megatron/core/datasets/retro/query/gpt_chunk_dataset.py |
sha256=uqErXLrpGie4V-NLvfbYayBlLCVehcUmZO8AY4MYOCA
|
3816 |
megatron/core/datasets/retro/query/query.py |
sha256=MfJm4v_fA4MJDs2bbvfz1rM_Kx2BrG6bQCM60MlXl2U
|
14313 |
megatron/core/datasets/retro/query/__init__.py |
sha256=k_Cvc2yxTe93EhbgoQAhhk7CNTjCzLm8sws66Jj55n4
|
64 |
megatron/core/datasets/retro/query/utils.py |
sha256=CcQklrl2ZwTDOXiYmSpDi_vCLO61vc1VjvK5IRfvSGw
|
1111 |
megatron/core/datasets/retro/query/retro_dataset.py |
sha256=rFDmREle7pUq7EbTY8LBFq5VE3PFXqa8JSoMFN3ch6k
|
9300 |
megatron/core/datasets/retro/query/multi_split_gpt_dataset.py |
sha256=7LG94UYT6OTgMgY0F2bk0_S9KQWsWj_mgHE8kSB8dsc
|
4198 |
megatron/core/datasets/retro/index/index.py |
sha256=4QAOYnerl_TUKZ0nLVH2zQhgPZXmLH75603oON9d_8k
|
4943 |
megatron/core/datasets/retro/index/__init__.py |
sha256=hm55AK1FGTWvuaNriGg1WgV0-T0F9NAygBRR61TThPM
|
317 |
megatron/core/datasets/retro/index/factory.py |
sha256=J5BclHsqQLwz24g_ClAiHlPX3G9yS0GMtv30nXh-dr0
|
1375 |
megatron/core/datasets/retro/index/validate.py |
sha256=yuHAQN3zM_wZW7-eI9Nv9KCMpRlzTNIup5r8WZrAoSI
|
6071 |
megatron/core/datasets/retro/index/utils.py |
sha256=3mKYb4Lk5V8GlYFA01tdjKO5xMoCU3-5JNnA5hfoQUw
|
3964 |
megatron/core/datasets/retro/index/build.py |
sha256=Aeuqkv-TBGdgzJuZR0ukPjh-cB6d27XES7rJ09xB5Zw
|
9249 |
megatron/core/datasets/retro/index/indexes/faiss_base.py |
sha256=mCJ88s0bNXyQHfyWYvQkgLrAmHA-adrAr162pyd3Ud0
|
4987 |
megatron/core/datasets/retro/index/indexes/faiss_par_add.py |
sha256=fa1T_PYNRhw7dBtOliRCmKAxa-oga688cRrloOQ6TB4
|
7551 |
megatron/core/datasets/retro/index/indexes/__init__.py |
sha256=YftO_ZxhxOzW61fD2Ga2-Ebx7UtyVrr7dWHDt4PoH4Q
|
285 |
megatron/core/datasets/retro/db/__init__.py |
sha256=WdGDuNtiJ5_-H27yxJyDfGxdgECk0k3E_OiHVuFK44M
|
182 |
megatron/core/datasets/retro/db/utils.py |
sha256=Kc3UQojOTS4kqol722q3m9v2lMs_UoIM7WEY_hVYxDk
|
12740 |
megatron/core/datasets/retro/db/dataset.py |
sha256=uloEiS07M8vX8O2ikchyiX9Ed7zDO747WbfHwXFrWq0
|
3569 |
megatron/core/datasets/retro/db/build.py |
sha256=wYmRkDAlcu3cP6U9VN6btnMp6j3jEDZOnNV6AYNoDMo
|
23738 |
megatron/core/datasets/retro/config/config.py |
sha256=Gr2UTnVwN7qD6jnwdh46Aslw6ZBIJuKLWDPI9IG7ghg
|
9117 |
megatron/core/datasets/retro/config/tokenizers.py |
sha256=H8SprrOWcSCXOA1vLdgBMt1umbAYgr4MgQUCb3foFpQ
|
385 |
megatron/core/datasets/retro/config/__init__.py |
sha256=IffC2zcSCB_YEVBoJKTmucCl8Agq_xYkgOv3WIxDmAk
|
634 |
megatron/core/datasets/retro/config/gpt_chunk_datasets.py |
sha256=UuwnMf0VQBobCgAHyVudbrrosE61FQByIaJB3sxto2k
|
417 |
megatron/core/datasets/retro/config/bert_embedders.py |
sha256=QdLlK05x-oPoUlxXk60v1N42hc6LYOk7kBoFmLzxoCE
|
1327 |
megatron/core/optimizer/optimizer.py |
sha256=IlkZkqWLaJGOs8y7XobFNS3ffgbhLKE6S9Dd3Kmvn8Q
|
41443 |
megatron/core/optimizer/clip_grads.py |
sha256=SWwhGGhyfunASpxjN6NqcPBJ1Tnax-1G7DdzPEztC_o
|
6847 |
megatron/core/optimizer/__init__.py |
sha256=VxWx1TwCnwLX9Q_6vLzV3wyXd0e0dcC1hJIBh5oftoY
|
17352 |
megatron/core/optimizer/distrib_optimizer.py |
sha256=sKIM6C94G-Rh7ApyTLGL1MrYkm-9k6oJKhQKxjXcFN8
|
88131 |
megatron/core/optimizer/grad_scaler.py |
sha256=wvNBlVyDM71uJVT8x8NPdOd2sLG9TOS8tTrdmlSgV4I
|
5161 |
megatron/core/optimizer/optimizer_config.py |
sha256=F0jQrEFs5XwMQcCbNEyLotDmZhwk_jG3bZl5MqSIxyk
|
4041 |
megatron/core/extensions/transformer_engine.py |
sha256=-kAGnccpTO-U85Cvl64OcgEpPRMeF2hKX8xKkU-Z_HI
|
39023 |
megatron/core/extensions/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/inference/__init__.py |
sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI
|
63 |
megatron/core/inference/scheduler.py |
sha256=xGMK0Jm7U3kPFtwFD_Ctpx7sXs3VPZ-ZKzx4teQqtVM
|
5056 |
megatron/core/inference/inference_request.py |
sha256=lKKi_1FBItZLmlZ6AXIfIqzl2HMp-_ElwoN_nE2t960
|
739 |
megatron/core/inference/utils.py |
sha256=vmPJSvR9BfsK_765P0jks7dF4WBXs8_y0j8dNLkeDZk
|
427 |
megatron/core/inference/communication_utils.py |
sha256=uF88r7Nqhkmuyh8mhrm1zZL2w6H1x0FCtdNYlkrT-kc
|
1787 |
megatron/core/inference/common_inference_params.py |
sha256=w9MknNQjHTGu5B3fKYyjLZyk_Jt72TEHT0BqG4Acew0
|
1139 |
megatron/core/inference/model_inference_wrappers/inference_wrapper_config.py |
sha256=dff7Zt8MexhbR0KwJNEVk2glOZFXX4dKmCmxPBQRCBU
|
1527 |
megatron/core/inference/model_inference_wrappers/abstract_model_inference_wrapper.py |
sha256=nXirWtpE0HrZ-QG1pz4_gu-rxhHaZbmcqUUP11WvJuI
|
10649 |
megatron/core/inference/model_inference_wrappers/__init__.py |
sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI
|
63 |
megatron/core/inference/model_inference_wrappers/gpt/__init__.py |
sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI
|
63 |
megatron/core/inference/model_inference_wrappers/gpt/gpt_inference_wrapper.py |
sha256=vECFVElbSa_QFFlworrGt8Lu-qJ2UV_VyWF4xRqVHHw
|
3638 |
megatron/core/inference/engines/abstract_engine.py |
sha256=NzmE2s4mlNFGI3MwbVM_-H9EoPAd9olzvaior2oq8fM
|
521 |
megatron/core/inference/engines/__init__.py |
sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI
|
63 |
megatron/core/inference/engines/mcore_engine.py |
sha256=5RDjJKoPm4xjA07f82bbzxncSNQg4wwQfQLWHQBt5QQ
|
4059 |
megatron/core/inference/ammo_support/__init__.py |
sha256=KV8WsGuGugoVAf-PpIoFMlqrr8D5r4InTnrAK2aqEt4
|
300 |
megatron/core/inference/ammo_support/gpt/state_dict_hooks.py |
sha256=D7qIpflYCnGfcB8BbC_AsIMelJ-V114LXHFAAm53jKY
|
231 |
megatron/core/inference/ammo_support/gpt/model_specs.py |
sha256=y7i0CR-QcDt8EBhyu_ZZCweoh9EZ0WhyqeiX0DZXB3E
|
160 |
megatron/core/inference/text_generation_controllers/__init__.py |
sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI
|
63 |
megatron/core/inference/text_generation_controllers/simple_text_generation_controller.py |
sha256=pWEMBdr1H2jG1b5AZ_QJMhT-VZWgNiuS3RyGnEE9zdE
|
17675 |
megatron/core/inference/modelopt_support/__init__.py |
sha256=Dj52aVe2p55UV9c5lCjD0op6sQvn46SBFi4LBODHBI4
|
584 |
megatron/core/inference/modelopt_support/gpt/state_dict_hooks.py |
sha256=jOechATpv6xOlb9swq8DxiA3jvyIRMUXMTp3jqfpZ58
|
5549 |
megatron/core/inference/modelopt_support/gpt/__init__.py |
sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI
|
63 |
megatron/core/inference/modelopt_support/gpt/model_specs.py |
sha256=AwLdV0tGx_Z1pVe_t6Ht68yLbxaGVY-liAaxAigtAR4
|
2588 |
megatron/core/tensor_parallel/__init__.py |
sha256=mE3W1UiVgbkZ1dAmyUanArOwllfw1cxgJ4i5i3jcsRI
|
2600 |
megatron/core/tensor_parallel/cross_entropy.py |
sha256=WY8ogQYZggl0sgGlKyW0ZUM3Af_n4wDaWLx7K85TgD4
|
9067 |
megatron/core/tensor_parallel/data.py |
sha256=B1eYjFFuElvlmZFy8AAGE0Q0b6AjIIXQl4toYFLseSk
|
3365 |
megatron/core/tensor_parallel/utils.py |
sha256=FYCQzKmRpJVavdJNd-gr-BTjxZNZaonZSX93MNiRbJ8
|
4105 |
megatron/core/tensor_parallel/mappings.py |
sha256=mwF2jbQZShoBV45j8fYrDXVk8NfxwLPEoUBZqJFheI0
|
21168 |
megatron/core/tensor_parallel/random.py |
sha256=YocKplkHrb2jno1EaiE5CSHGZWxGLER2fjfyLesByn0
|
11738 |
megatron/core/tensor_parallel/layers.py |
sha256=hJcNgZ-cWw5HNkNVzEbR2iHBGPOht4ZEdKnSM76rIUA
|
46226 |
megatron/core/transformer/dot_product_attention.py |
sha256=Oc7Epk8hPRwDkAXNSUw-GQ8kq7GjI5MeCDTD8fTK86c
|
7903 |
megatron/core/transformer/module.py |
sha256=UK-YaNBOsMYDoDo0HcHEICOs_NUlzdiJ7WM0cL8tgnE
|
7096 |
megatron/core/transformer/spec_utils.py |
sha256=cq2u5dNgZnJIH8WO019qFnfbSSNpR1O8Z9bMA5hCY5E
|
4057 |
megatron/core/transformer/mlp.py |
sha256=-8S2IjkT4OXg0D9FPyL4YSHs_fwsBco13FB5PJ3-l_8
|
10126 |
megatron/core/transformer/__init__.py |
sha256=XpcTTt2xON-6IFG6h4uipx3c0U5HvJkuZmwnOh1frJY
|
274 |
megatron/core/transformer/torch_layer_norm.py |
sha256=aebSLqgCUFPQF4oiGyb51Nz54pHzEYJD_exP09XeNCI
|
1477 |
megatron/core/transformer/cuda_graphs.py |
sha256=O0Uim7f63ES_ufuCvE5WtdjY_f-Fr8O26BfPOcAyExI
|
12827 |
megatron/core/transformer/utils.py |
sha256=dUCethYv_7ekoB884x3_vmIKuYY6T4nm9uEqo2uWe9E
|
6943 |
megatron/core/transformer/identity_op.py |
sha256=w35Qyy0lmN-huMJhQF-Cq29R9gTIfkklKi4TKsWEm1c
|
713 |
megatron/core/transformer/attention.py |
sha256=2VjlgyLLCl7UoAd_RVxGx5aGQ9SL_oM0z_-KP6nOg8o
|
21537 |
megatron/core/transformer/enums.py |
sha256=9JtRWcLSNZjw-HnhGKLTeNyaXpagefN4aue2pICicBo
|
533 |
megatron/core/transformer/transformer_block.py |
sha256=MRN9mC45Z5KS06rU_vgoLuNX1PmPCYYGO5VGZuoyaUs
|
24376 |
megatron/core/transformer/transformer_layer.py |
sha256=lYlIMsBzh5Aw28bT7LawHuF8yMD6FfAQMoIBZ_i8UMQ
|
16060 |
megatron/core/transformer/transformer_config.py |
sha256=nvevgeXEM3iZMjeb7uOfb8oJ_-u4jh7OIdPSirxt0Qo
|
21845 |
megatron/core/transformer/moe/upcycling_utils.py |
sha256=5JS28SJvF1TS3WjwGhrWrEwKz8cSkTo2bDB97E7LH6I
|
8588 |
megatron/core/transformer/moe/legacy_a2a_token_dispatcher.py |
sha256=6NZUQG2txs2udl6AKbckQfnAmKIvNZBmKQNqt9nK7EA
|
14232 |
megatron/core/transformer/moe/grouped_gemm_util.py |
sha256=GYzirbRITTUzRUmOgsP9UVAFSsL0UV_DeCu8LpzIwG4
|
591 |
megatron/core/transformer/moe/router.py |
sha256=LnSPO5khsRn6MzW9Fa8C7I16LlLmM1b6U50rLoKPHu4
|
11325 |
megatron/core/transformer/moe/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/transformer/moe/moe_layer.py |
sha256=9fOKHeAC60QXrpoboiDvz9d-KAOsarUD0DoK9r1_TMI
|
5446 |
megatron/core/transformer/moe/experts.py |
sha256=KYWwcrme1-q8KiSoEiA20a7SVomg6APiGrcUVBERB3k
|
25611 |
megatron/core/transformer/moe/moe_utils.py |
sha256=V1L3hPOaac50TaIZD2xKVePlVSPiXjXtFDiFYzYEQQs
|
23504 |
megatron/core/transformer/moe/token_dispatcher.py |
sha256=nCZmOjXxYOi4jmEvXK9I92zJxw2geklazPhR6DUv0Wc
|
27572 |
megatron/core/transformer/custom_layers/transformer_engine.py |
sha256=QiuumLn4vXdPwX7QqAGJwg_CwFku6DQ7ZYcMnWAOSB0
|
402 |
megatron/core/transformer/custom_layers/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/ssm/mamba_mixer.py |
sha256=eEngsZOeK5X5IV2gn9e-7PUWQbtpokvY6S1ay1B61Eo
|
27707 |
megatron/core/ssm/mamba_layer.py |
sha256=7cvnlwnWfT9XoWZ4fp5ZZFEK_cjhsvvyTV6xon7OceE
|
2843 |
megatron/core/ssm/mamba_block.py |
sha256=wRo4LDACMJ1DwgycgCpmmHycSqNk0sFQqYZcEnkOlb4
|
13929 |
megatron/core/ssm/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/ssm/triton_cache_manager.py |
sha256=tBnvVoaasrYpF2e-xF8ELYOl1ldwpkvwhAvK3gFzmsA
|
1598 |
megatron/core/ssm/mamba_hybrid_layer_allocation.py |
sha256=PwfjUnFcLmQQBcONy6hL16j-ooYKgpGwiJY0e7-OrLA
|
7136 |
megatron/core/models/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/multimodal/llava_model.py |
sha256=9J1aYP6IcUnCqwNhhLC9UK4pumSauPL4cJw8KnFtYtQ
|
26457 |
megatron/core/models/multimodal/__init__.py |
sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI
|
63 |
megatron/core/models/multimodal/llava_spec.py |
sha256=AYDn1cNWDDxC95KD2YwIaduHv0uTy8fCxmKppoO66Zo
|
3443 |
megatron/core/models/retro/encoder_attention.py |
sha256=-78pUkEfSkpfGGIANTYPxGOVurybSpidmv8p96t9UOg
|
8028 |
megatron/core/models/retro/config.py |
sha256=8vrOypZs46yk4io5omiSH6wWsUbLTYFo9VJ2NicrMus
|
3084 |
megatron/core/models/retro/__init__.py |
sha256=wBWEz9cWtITwx_zWX9NXZQMnVXp6ADm6cR9bXfU-56w
|
371 |
megatron/core/models/retro/decoder_attention.py |
sha256=-gs_1mUgR42XPcTSj9wffHloeOAjFONOVxbxbIkpP5o
|
11420 |
megatron/core/models/retro/base_attention.py |
sha256=0qn1cwvJLi2uGC87npnCFzj5pfZLSg2CNIbLytD0HFU
|
1596 |
megatron/core/models/retro/utils.py |
sha256=yhI3b4VcURObUqw1_Iw_HIJ-ENMBQG2qjubYVa0PANo
|
749 |
megatron/core/models/retro/model.py |
sha256=MQa_OeLqNg3rqGUCxY19NMvcT7S0qZ0fZWHTb4oHe_A
|
3760 |
megatron/core/models/retro/decoder_spec.py |
sha256=axTr9NC3wfKnAYpTaWZKmXibF1sw9TpEmR-lQUtIi5g
|
6695 |
megatron/core/models/retro/encoder_spec.py |
sha256=Vj-4CURBlOXs217f8tzP9MaC0rI8DFSjezOW5cns57E
|
6249 |
megatron/core/models/T5/t5_spec.py |
sha256=_oXkG9L86EzOOuIMIywptLhI7LDiF02pfKlDtWphqyU
|
9065 |
megatron/core/models/T5/t5_model.py |
sha256=N0tL3px7Imvz1J6w3NrASOGxexyKwt_2W7jenJjw47Q
|
16138 |
megatron/core/models/T5/__init__.py |
sha256=PidBNqxDgX7sIVX0wm9lX6AHDpBNJV51Q_vHl3Cs8a4
|
93 |
megatron/core/models/vision/vit_layer_specs.py |
sha256=nMe89KuRfyHx7CZrbudwiH-0A1G20wFq7y5Gof3fh-U
|
3514 |
megatron/core/models/vision/clip_vit_model.py |
sha256=EcmSxebpyamDnWIWgKD1Maq67gAltRtKJM0T5HjNsqU
|
6277 |
megatron/core/models/vision/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/vision/multimodal_projector.py |
sha256=LhkwtIyIjWvzNQfmHWrwnn0z-vcS0P7gZ6XWguEQYnA
|
2631 |
megatron/core/models/mamba/mamba_layer_specs.py |
sha256=mb_H0BWYi9Pt4jwHGRxImzy4Xsdbjdj3b8ds_kVrq94
|
2815 |
megatron/core/models/mamba/__init__.py |
sha256=cCEAU0SMUgMgV7W6PbyEiP1UvAN-l0V6HcV7kGnHy9g
|
99 |
megatron/core/models/mamba/mamba_model.py |
sha256=5ByebL_4DRKQspyiS8zgpU1TaQZZzsGPX_zLWRwU3p0
|
10198 |
megatron/core/models/gpt/gpt_layer_specs.py |
sha256=a3woPO_MnVK199ifWJnWUiUkR9AEebLNbRlOwNptWK4
|
6663 |
megatron/core/models/gpt/__init__.py |
sha256=Vs2iy0MeLf3CISnsQiam9V964paf77a0GiXgoAEVZvw
|
95 |
megatron/core/models/gpt/gpt_model.py |
sha256=8n2sw3eSYejmt5J0f3niGDC6PaYJBwZ0xH59l5YPAI8
|
12161 |
megatron/core/models/common/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/common/embeddings/rotary_pos_embedding.py |
sha256=S-91zAdKhndXMnrpIN8mhFoqFhcWYSqHVU38h1bxvCQ
|
9425 |
megatron/core/models/common/embeddings/language_model_embedding.py |
sha256=BFmfe8IjRFRVfYI3UaexNKi-smR1F9YDpeFHC9XD8WQ
|
5731 |
megatron/core/models/common/embeddings/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/common/language_module/language_module.py |
sha256=k1IekDw27glal8WESBpKILLZjlVJO2pPouuQQxeEp4Q
|
9251 |
megatron/core/models/common/language_module/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/common/vision_module/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/common/vision_module/vision_module.py |
sha256=SUwBfItrNKZdEHtw_NCCRgF0PBsaBX_lqTAnPpC4zCE
|
635 |
megatron/core/models/bert/bert_model.py |
sha256=809DO6dcWAeooNurruFQFJpGlWKm39on4Oejq0_4AeE
|
15931 |
megatron/core/models/bert/pooler.py |
sha256=-QAoY3T-SMDUz4p4uZ-FveF01bPB2cw9WwVtAR_8-kM
|
1886 |
megatron/core/models/bert/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/bert/bert_lm_head.py |
sha256=QQpqm0YmvZgkJoZZbPvnbMkHnJDljmFLjoqFyM2AnVk
|
1723 |
megatron/core/models/bert/bert_layer_specs.py |
sha256=zoHf-F28XAqQBmts1ue0MNwYyVzab-nTI1goDqWiewA
|
3455 |
megatron/core/distributed/finalize_model_grads.py |
sha256=qeb58K0FgarwfBifoXQfIGtN_QOqXgJUsA4Bc0xWw7U
|
6900 |
megatron/core/distributed/distributed_data_parallel_config.py |
sha256=WV1bmMgE75qaMS3Fgq9bCmPRW3vAEJJ7qYeapUqY7GY
|
1728 |
megatron/core/distributed/distributed_data_parallel.py |
sha256=enbmHZ-OkOqmwn69v0YQ5Sq4U9FRhP1zb9CoxPf-S1w
|
22018 |
megatron/core/distributed/__init__.py |
sha256=-cN5nE1vEvnbW_2YDa36y_mhzuS3Wb8tW1FRRrDZOYg
|
525 |
megatron/core/distributed/param_and_grad_buffer.py |
sha256=-iSeffbaOxUJjXP46h_1V2vuocAVBZizolJ5b2Gs_qI
|
33780 |
megatron/core/pipeline_parallel/__init__.py |
sha256=W84Ic3_NAV9s_YXvgKaYcv2-uUd0T8e9ZPalT0PA1wM
|
112 |
megatron/core/pipeline_parallel/p2p_communication.py |
sha256=IRXgmmWlmHbt9bsyX7cjfsZ4kpqMLlbB_JdA3LG8pfU
|
22274 |
megatron/core/pipeline_parallel/schedules.py |
sha256=5ZqcVtME9LJzlkRmWD0dStcGBOTTqBS6DuKdsfoXXv0
|
64946 |
megatron/core/dist_checkpointing/optimizer.py |
sha256=X-rrX0qKrTr5buFq6xYJuaXSYTC-tidUTON1nbZfenw
|
5483 |
megatron/core/dist_checkpointing/mapping.py |
sha256=G5jlP-bEgf23OLgwhCZI2_HMrdeqRJzcwBOtm7vtIk4
|
28454 |
megatron/core/dist_checkpointing/dict_utils.py |
sha256=GjZ0esYOH7gkOHYKk6pe1BsNhSF-ADmdrWqB3_Wp8z0
|
9006 |
megatron/core/dist_checkpointing/exchange_utils.py |
sha256=wyIdJ_nfuGKwOe9TitR7zpV37JngN5CdSanF1fU0PGE
|
22733 |
megatron/core/dist_checkpointing/__init__.py |
sha256=KTsvwvVpJVEZW2gQLxGFZgjNUXJJcamMKr_o-P0wjnA
|
336 |
megatron/core/dist_checkpointing/core.py |
sha256=X-xJIGAuv8SQhvQIyuJl6wL07u_fwSh_TPiRnhQ8i3A
|
2182 |
megatron/core/dist_checkpointing/state_dict_transformation.py |
sha256=H5BV8fmrH9nUhckzJTded8Ugkg_xZA84yx9k3kcUDUc
|
10477 |
megatron/core/dist_checkpointing/serialization.py |
sha256=-3jebM0QkSaVUH_h8dEzT7N3yof2bfrp16Qv5aThKss
|
17306 |
megatron/core/dist_checkpointing/utils.py |
sha256=2ApsjlpcOfjPnFlMkqpglua-OltcMo6cuoUPcsrqTWc
|
7876 |
megatron/core/dist_checkpointing/validation.py |
sha256=h2NlH-0Vmlh1VjJ6lZA9egEO0lmk74i_HT2rq7N-Uho
|
22112 |
megatron/core/dist_checkpointing/strategies/common.py |
sha256=Q2kluMk0JVfs35z_wgBfCiNSi8tQ1NF_Agd20FdM2uM
|
6173 |
megatron/core/dist_checkpointing/strategies/async_utils.py |
sha256=XXK0mzmexnz1786UUUFRKFBW9kN6Oq7D011PHCPGm2w
|
8409 |
megatron/core/dist_checkpointing/strategies/state_dict_saver.py |
sha256=UycrUTqeBuWLIBOSAO6rzevLUKbUG42qXuIqJP9Q7Oo
|
6938 |
megatron/core/dist_checkpointing/strategies/fully_parallel.py |
sha256=y-uVTroG0ElVU8S2PE2djDEiuXPJb0G2lzQozSAUHh8
|
18944 |
megatron/core/dist_checkpointing/strategies/base.py |
sha256=McYIrlPN_0-yrIGVtoIoo81mZOlpA_cWK99qpA7DCDo
|
8178 |
megatron/core/dist_checkpointing/strategies/__init__.py |
sha256=jUZuiVe1Flxld2HmcduP475MtoqIIUef8yrdg_DouyU
|
316 |
megatron/core/dist_checkpointing/strategies/tensorstore.py |
sha256=OT4q3y82i1gEu8LpnWEoikN8NNZev4O43XEGLMAi-lE
|
4765 |
megatron/core/dist_checkpointing/strategies/two_stage.py |
sha256=1ZRUYf-yzJQWvXac99pu98_mLzuwkhmhttKbH-Dkhng
|
10160 |
megatron/core/dist_checkpointing/strategies/torch.py |
sha256=S1csE_s0cxkEmxF_a_hHGuJ5x7Je6kk7pJquuKdQTuc
|
35363 |
megatron/core/dist_checkpointing/strategies/filesystem_async.py |
sha256=UjlwigclM8EmjrMrNPAQjS0fA0R4Z2vym6-SD_hyq-U
|
14637 |
megatron/core/dist_checkpointing/strategies/resharding.py |
sha256=HuUl-6FY52E3IgaBPGj0aD1cgjR73hKWd18ORC8hMd4
|
13090 |
megatron/core/dist_checkpointing/strategies/zarr.py |
sha256=hquh4apuhgeXx13oT7k06FOHreK-RSTDWmnXS-X6p2c
|
11492 |
megatron_core-0.9.0.dist-info/top_level.txt |
sha256=OEOs4V4xHotpQFOUHkfPkLmqcuKfSffSlV17EmZVBjg
|
9 |
megatron_core-0.9.0.dist-info/LICENSE |
sha256=S9UMoyZlNvYp9CHuKhuT2Or5L7idfS9Y_t_pAtaMaOg
|
14692 |
megatron_core-0.9.0.dist-info/WHEEL |
sha256=UCJN9pzXq2OrEh3slrcZ0BR8J6AybiEimpKIcvW2yn0
|
152 |
megatron_core-0.9.0.dist-info/RECORD |
— |
— |
megatron_core-0.9.0.dist-info/METADATA |
sha256=FwoKOFr2Ag7KgPjnGBCByuy__X0wjP6RfC3lQGL_JIE
|
3588 |