megatron-core

View on PyPI | Reverse Dependencies (3)

0.6.0 megatron_core-0.6.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
megatron_core-0.6.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl

Wheel Details

Project: megatron-core
Version: 0.6.0
Filename: megatron_core-0.6.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
Download: [link]
Size: 1371679
MD5: a1841e8f65f1b643ec6989c62d7906de
SHA256: 8e98d3b29284275d5f0eebc8fea3aafbe87cf6de6f6dc317f79e84eee4fbffd3
Uploaded: 2024-04-19 23:50:13 +0000

dist-info

METADATA

Metadata-Version: 2.1
Name: megatron_core
Version: 0.6.0
Summary: Megatron Core - a library for efficient and scalable training of transformer based models
Author: NVIDIA
Author-Email: nemo-toolkit[at]nvidia.com
Maintainer: NVIDIA
Maintainer-Email: nemo-toolkit[at]nvidia.com
Home-Page: https://github.com/NVIDIA/Megatron-LM/megatron/core
Download-Url: https://github.com/NVIDIA/Megatron-LM/releases
License: BSD-3
Keywords: deep learning,machine learning,gpu,NLP,NLU,language,transformer,nvidia,pytorch,torch
Classifier: Development Status :: 5 - Production/Stable
Classifier: Intended Audience :: Developers
Classifier: Intended Audience :: Science/Research
Classifier: Intended Audience :: Information Technology
Classifier: Topic :: Scientific/Engineering
Classifier: Topic :: Scientific/Engineering :: Mathematics
Classifier: Topic :: Scientific/Engineering :: Image Recognition
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
Classifier: Topic :: Software Development :: Libraries
Classifier: Topic :: Software Development :: Libraries :: Python Modules
Classifier: Topic :: Utilities
Classifier: License :: OSI Approved :: BSD License
Classifier: Programming Language :: Python :: 3
Classifier: Programming Language :: Python :: 3.8
Classifier: Programming Language :: Python :: 3.9
Classifier: Environment :: Console
Classifier: Natural Language :: English
Classifier: Operating System :: OS Independent
Description-Content-Type: text/markdown
License-File: LICENSE
[Description omitted; length: 92 characters]

WHEEL

Wheel-Version: 1.0
Generator: bdist_wheel (0.43.0)
Root-Is-Purelib: false
Tag: cp311-cp311-manylinux_2_17_x86_64
Tag: cp311-cp311-manylinux2014_x86_64

RECORD

Path Digest Size
megatron/core/requirements.txt sha256=N79Rv7pGmalAzjE0lCKySlvFWisXnteux0RZqa6NV7c 5
megatron/core/utils.py sha256=fKd6wQWYVKN49I051LjAKHthbDOpf5Y3ZiAEPTK9OwE 11810
megatron/core/package_info.py sha256=NIZcPzkVvewdWsyePDIUDoFF1p31dLRD-z87o_uqHN8 994
megatron/core/parallel_state.py sha256=B1a9ilsnvrjuT3KGa1_6z5JM_FHj3LVnJXJV96VWOYI 44946
megatron/core/jit.py sha256=eve_fNxWf_sI_n0OcfRWB4dkeXrfyr-DxnsQFqwk6rE 362
megatron/core/packed_seq_params.py sha256=9UCfT8-YrgLb-rfxxdikxSxWymAzPDChma5tPyDoIYY 358
megatron/core/__init__.py sha256=9IxLMwIkZYFhrOLn24_6olzO3PxryY3msBA1tnLuzQU 571
megatron/core/inference_params.py sha256=FaCRNoD5Z-9DDHRwGckHhext0q_DfiFc9ZTFDQupVdc 1241
megatron/core/enums.py sha256=OIc-mEyKwE-d3iYoSkhAN4ch3mIrFui9cgaLrMW6j8o 205
megatron/core/timers.py sha256=6Ocbn9nFQIQ_G8ZmAuVZwOvKbZ6qtFigMf8MrJC5390 14987
megatron/core/model_parallel_config.py sha256=15EJqaU_tA2a2XikaW6uG74_UiUieIrOpyD2UQrDZ3g 12283
megatron/core/pipeline_parallel/__init__.py sha256=e_qNyIBDy0CW-kzKxLwo1uMkWdCaVXPVy1s0GEH0wb4 49
megatron/core/pipeline_parallel/schedules.py sha256=3Up5_aTL5ReRNyBUqqNoOxBdXdLuyeaDYTe8WCRok0U 55130
megatron/core/pipeline_parallel/p2p_communication.py sha256=i3bUt97ar7h5jJT03h4N8IFsHprrAQz9wI6yhK5VA8M 19593
megatron/core/dist_checkpointing/serialization.py sha256=zLtk56R-A6Gr8tyApflUrKxa_f1z7VdDDFqAc3dxZbE 19949
megatron/core/dist_checkpointing/utils.py sha256=DmNu5ctRxV_fpRephFDiAbqO6NYesTvXffN5KhKVNrY 5668
megatron/core/dist_checkpointing/optimizer.py sha256=PBtv0FkEG8COYI9K1Zf78_pWZfqzDRBoOEIDCmUX3GQ 5423
megatron/core/dist_checkpointing/mapping.py sha256=FV31H5y_-1mq--PLBF4i41vOVlZCsJRrYnfVYdBavnI 13516
megatron/core/dist_checkpointing/__init__.py sha256=w43C479LFnwuTUgM-LHg_wlvCG87xN79XJ98DV_-NDU 310
megatron/core/dist_checkpointing/core.py sha256=9Y1GhAe-J0J2DIicxnTtYLBJFO83nuqPh2tIYTwxcpk 2189
megatron/core/dist_checkpointing/dict_utils.py sha256=QxSomKWQ7VGbSAvrRRtSIrjfvAngEewjgDhUPVStPfQ 8397
megatron/core/dist_checkpointing/strategies/torch.py sha256=3EZHTvkH_uo8934R0fgxnUKZe-hZYRTVTGavcPfIpnM 21080
megatron/core/dist_checkpointing/strategies/tensorstore.py sha256=03TOpEzECuFexLHc2FRgZ0LqfbiLwd3bhbraRZZm8x8 4574
megatron/core/dist_checkpointing/strategies/two_stage.py sha256=sUqQHRRPqquitT9m6kqXlfxNgjty-figRGtuU9ROxOs 10184
megatron/core/dist_checkpointing/strategies/base.py sha256=vffljwyqFrTsjYj608-bqgmTk8OPS5ufQuoeJqDhNvw 4041
megatron/core/dist_checkpointing/strategies/__init__.py sha256=HhfhTHPqqEQW39LaWTPdel9MwKRMbFZNCiILZeGyPHw 116
megatron/core/dist_checkpointing/strategies/zarr.py sha256=Um4YDKo-Tbuync3yt7tr563CDHJrqmcWcLRWsbz2UcE 10873
megatron/core/dist_checkpointing/strategies/state_dict_saver.py sha256=RjoAgfNsoEy76cgnNE_siYqC3oZFDCBYI93G0f1BTWY 5395
megatron/core/dist_checkpointing/strategies/filesystem_async.py sha256=PmFf14SoPZ_DQSWoyiFHEW21Dek99-8rUeNsSl9v2-U 10779
megatron/core/distributed/__init__.py sha256=XKCTnGgnZt4yccdJ35Ez-tGCU9xv_SXfBe4Aa8K1CUI 250
megatron/core/distributed/finalize_model_grads.py sha256=HXlfi4SteRhRoCVvXPxARo2bLMqN3_ap9gPMdCghbX8 5546
megatron/core/distributed/distributed_data_parallel.py sha256=veTvlW7Vontwj7ihART-cOnT_glF39dSA5dSNvf6Gmk 12045
megatron/core/distributed/param_and_grad_buffer.py sha256=Qx6LfH8Flfx-QZelffI-lYbzGk_4a4D3FLISKHJMUlQ 23140
megatron/core/fusions/fused_bias_geglu.py sha256=6JmbmIno-yESd4mf2DfCvvouIvnrx1772Q2NJABQSOY 2361
megatron/core/fusions/fused_bias_dropout.py sha256=p8YvmcNVl7ak6pM3AJMBebZaxt2svaXAZ-MW5OLU1a8 2897
megatron/core/fusions/fused_bias_swiglu.py sha256=s9Cohuph4dfKlTlFnRsHhOxtz69YIMvx5rAe9YtYkmE 2033
megatron/core/fusions/fused_softmax.py sha256=Hicykgpfoaf7dU2WSw1Z7dRp7q4T83ClOeNMTqg91yw 7623
megatron/core/fusions/fused_bias_gelu.py sha256=Tvi022WliITbshUzz50bTAp5F5l-hydHUGdWEUcFf-0 1400
megatron/core/fusions/fused_layer_norm.py sha256=uFsZY3xhhOkro3JGuK5m5S_MoF9nOC1BzSpZ-Ni6xDQ 5548
megatron/core/fusions/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/tensor_parallel/utils.py sha256=NgKfgebwaJsSfvnMoVOg5gPRu_hNzw7eyNbRNl0-SRQ 4030
megatron/core/tensor_parallel/mappings.py sha256=qod6146HOIM_UAXSAgy1So_0bKEsqaXe4yh11cXUkDY 15517
megatron/core/tensor_parallel/random.py sha256=Daxx-QsJ_us1fO67kfusCnfODS_oZ6S3XM-0Q3sWsyo 10265
megatron/core/tensor_parallel/__init__.py sha256=NYklUTAS4r1DCQ11LBmtKtGHHww4QQn873oqkQukWoI 2312
megatron/core/tensor_parallel/layers.py sha256=VZic_plTzd4QmT345Xj6rNms_ApAdRd9Hb9kze5qXnU 40998
megatron/core/tensor_parallel/data.py sha256=iY-Cc0s9uEjIvnBes1l9HfP87_KVDTG-I8y1bZ295u4 3355
megatron/core/tensor_parallel/cross_entropy.py sha256=L0b5MKGN5sW6z4CflnmXkjQl4ZRXVz7_VS5LIex_k0k 6314
megatron/core/datasets/helpers.cpython-311-x86_64-linux-gnu.so sha256=V3tgha5vjdXigij00zEFuD43Gom78QU7JLt4mQVmr_o 4097248
megatron/core/datasets/utils.py sha256=9VSI-jMJBy4M1AnvpWEiVWsDZXf_pZNC2KTTAFpocqI 1641
megatron/core/datasets/blended_dataset.py sha256=k3TbIjpN9toZ2h-fPDMlbtypnpygHGbhE4P1ANgFDLI 7163
megatron/core/datasets/blended_megatron_dataset_config.py sha256=ejnk5UE7uxeulYc2BGrNpDM1v-YUyfa6gzR6ixaegko 5624
megatron/core/datasets/gpt_dataset.py sha256=YHa_uSad2XUVIdMuXfzRwn-Kn_II32t_Z-gnIHPZVuM 25889
megatron/core/datasets/helpers.cpp sha256=E0s4qkHpKErMAx2SocYrIlV59jwZodwiuC90glLSa5o 26731
megatron/core/datasets/megatron_dataset.py sha256=CiTlDwMcqUqHUkGJ7tHB0bp_KJUMdVKcXD934sDP27U 6937
megatron/core/datasets/indexed_dataset.py sha256=uFbhsJXQuWxb2MFh0qr02gBnkVXm-7-iVhjNkBRgLUU 24630
megatron/core/datasets/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/datasets/megatron_tokenizer.py sha256=ShKv9KAayvtZfIRFlfQNxiZBKKCrOJNgXAlu-5xqHKM 3792
megatron/core/datasets/bert_dataset.py sha256=igBtkLpW_rikrkt3uT20NWojvZr_bk6NxopCZeEHdrE 7196
megatron/core/datasets/multimodal_dataset.py sha256=lRpC4GOlCElrDTOeE4sVhE5WARhfzWmYvr6FuXBR_Os 1907
megatron/core/datasets/blended_megatron_dataset_builder.py sha256=VuX64eCX_GTHxO07P9SzzAeP1dLdtppIWvmclAV_QqU 13373
megatron/core/datasets/t5_dataset.py sha256=v0BdzKjooAausMvdtuWpYoYwWkJZczRWw7T6hwNXi54 8298
megatron/core/datasets/masked_dataset.py sha256=Eib8J1kFcmALRXB8aY4slsTPOGlSNgEcmU87Wcu8IHE 16773
megatron/core/datasets/retro/external_libs.py sha256=KKcgrQCfO1Tg-qftxzGM0WZH7X8TN3dqWpwKHc0AT8w 506
megatron/core/datasets/retro/utils.py sha256=Jbr81V6nXlYMaksGUQZvuwwwzOZKeRAmPTQ1NPFHZ8k 12319
megatron/core/datasets/retro/__init__.py sha256=qRMVBbNTh1tNiF3dboxFUPbwrt52EX0U0rxuhEYjUts 251
megatron/core/datasets/retro/query/utils.py sha256=pPTwyY-z4LcTk_JjYVuWoUXdEbaGAZEqlV1nWWc2HBg 1112
megatron/core/datasets/retro/query/multi_split_gpt_dataset.py sha256=4dBCQnlE_AFdG_YeduBmWMXMQGmwONzOF96dLdKdb1g 4167
megatron/core/datasets/retro/query/retro_dataset.py sha256=t6Fo_JtGsSS8oetnBMTJrgHdWnocMpXW_ouV6PmaC3w 9334
megatron/core/datasets/retro/query/query.py sha256=yMIc9BVCzkZ8IZKkRSLlkjs61454CWTh7k9V49k54ZM 14333
megatron/core/datasets/retro/query/__init__.py sha256=k_Cvc2yxTe93EhbgoQAhhk7CNTjCzLm8sws66Jj55n4 64
megatron/core/datasets/retro/query/gpt_chunk_dataset.py sha256=ilflgHX-vG6QLQtQUh_ZMw9jl_8lHN3xz6B6slC_BZc 3800
megatron/core/datasets/retro/index/utils.py sha256=r53plTOcFthQf4xHwfpIW8o4YrYQhLpKiy13klwIcwY 3965
megatron/core/datasets/retro/index/index.py sha256=jW1jf_D5Y03kXeVAok16yIImZawnTgiOHCcDXVr3SrM 4946
megatron/core/datasets/retro/index/factory.py sha256=vnI271LXG6tBKtUkeDKT9XnDa_uHIMDSjhtPrHUL6mM 1376
megatron/core/datasets/retro/index/__init__.py sha256=hm55AK1FGTWvuaNriGg1WgV0-T0F9NAygBRR61TThPM 317
megatron/core/datasets/retro/index/build.py sha256=Cl6q1jRzWpV6USy7V4nXnfzNnyvIsEifHq0TfKeuUiY 9253
megatron/core/datasets/retro/index/validate.py sha256=HluCM0m8U8fIxoDWhUTN7PkZa8fJhmXbPnamAfdebWA 6073
megatron/core/datasets/retro/index/indexes/faiss_par_add.py sha256=gKYMJrOW7lig1iOGWTl7GTcuZ3pV_CWwaALwNeaVzNc 7557
megatron/core/datasets/retro/index/indexes/__init__.py sha256=YftO_ZxhxOzW61fD2Ga2-Ebx7UtyVrr7dWHDt4PoH4Q 285
megatron/core/datasets/retro/index/indexes/faiss_base.py sha256=Mb41GBWtpKdybw-94slb0rZvB9ZRk3ZNe-XaVNSLvAI 4988
megatron/core/datasets/retro/db/utils.py sha256=7QZs6Furqe7W2Xn5oim6vH7oJDszlUHw4_Z4I4nLu9o 12767
megatron/core/datasets/retro/db/dataset.py sha256=IOcRiHbgat8RIrcqmjGs0fRItAaaLAc6zgFNOjBrilQ 3608
megatron/core/datasets/retro/db/__init__.py sha256=WdGDuNtiJ5_-H27yxJyDfGxdgECk0k3E_OiHVuFK44M 182
megatron/core/datasets/retro/db/build.py sha256=BA9C_hwvYFwyNTn3_-7HMKKlXe7cZAJFACK9H8qnH7U 23712
megatron/core/datasets/retro/config/tokenizers.py sha256=H8SprrOWcSCXOA1vLdgBMt1umbAYgr4MgQUCb3foFpQ 385
megatron/core/datasets/retro/config/bert_embedders.py sha256=QdLlK05x-oPoUlxXk60v1N42hc6LYOk7kBoFmLzxoCE 1327
megatron/core/datasets/retro/config/gpt_chunk_datasets.py sha256=UuwnMf0VQBobCgAHyVudbrrosE61FQByIaJB3sxto2k 417
megatron/core/datasets/retro/config/__init__.py sha256=IffC2zcSCB_YEVBoJKTmucCl8Agq_xYkgOv3WIxDmAk 634
megatron/core/datasets/retro/config/config.py sha256=Gr2UTnVwN7qD6jnwdh46Aslw6ZBIJuKLWDPI9IG7ghg 9117
megatron/core/models/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/T5/t5_model.py sha256=MJTwVl7X3aQsBNLV7GKcx76j90_PciKHkjou4HcLhDc 17391
megatron/core/models/T5/t5_spec.py sha256=SM4I3Y6HrwxhPhvITbIITKIH8jJqZpl0dc-GuJX11sM 8521
megatron/core/models/T5/__init__.py sha256=qWLhaTIZdpSDNSNGdW5Ll0kmiQ7Jua6iqr5roko3EOY 30
megatron/core/models/multimodal/llava_model.py sha256=rmmce_K6OTebC4Q1tuWWTdfthgQrPs6_uaa3iJqJazo 5470
megatron/core/models/multimodal/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/bert/bert_lm_head.py sha256=ki5Rd7K5JfUIdLZ-sDTOzSOCt3btbBpYsQYYBCqdMxw 1373
megatron/core/models/bert/bert_model.py sha256=z5QSGnDtfatjA1h17GFZXs5wP7NuKIdvysp84qvlw6o 11571
megatron/core/models/bert/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/bert/pooler.py sha256=Q8ZYHDFEdWwhV1NxCL9UxHPsHkauKiir5CuXB4zdlWc 1823
megatron/core/models/bert/bert_layer_specs.py sha256=zHWdrkSdg9dPk_QStEQRnHd7KM3-HQbxOac3i5ixoXk 3024
megatron/core/models/common/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/common/vision_module/vision_module.py sha256=SUwBfItrNKZdEHtw_NCCRgF0PBsaBX_lqTAnPpC4zCE 635
megatron/core/models/common/vision_module/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/common/language_module/language_module.py sha256=TDHCtcXEw9pvYCVwaCjIsGYPdMqRpsuA9kXuIy6BQI0 8963
megatron/core/models/common/language_module/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/common/embeddings/rotary_pos_embedding.py sha256=QsXFoUcE7QkcWQuckEdp9jZqBfGzfbuF_MYoyfSY3d4 9036
megatron/core/models/common/embeddings/language_model_embedding.py sha256=RgiuVS8ibSUANFyIRbhB8G7L3Hb6xgw1wmrGgP8y9Tc 5357
megatron/core/models/common/embeddings/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/retro/utils.py sha256=yhI3b4VcURObUqw1_Iw_HIJ-ENMBQG2qjubYVa0PANo 749
megatron/core/models/retro/decoder_attention.py sha256=Vqj9B4-XhXufW8aCrjCGSZa-l1lTTVcvxAnblVdak8Q 11441
megatron/core/models/retro/encoder_spec.py sha256=1lQEMoiGt0Xn9yX16cPqtIhhJXVLAmKB0bXvaPW24DI 5890
megatron/core/models/retro/__init__.py sha256=wBWEz9cWtITwx_zWX9NXZQMnVXp6ADm6cR9bXfU-56w 371
megatron/core/models/retro/model.py sha256=ES5DUr8gqkHYWJJWWdsA5s-FSW9aoCE0Ex3so2lmHSY 3762
megatron/core/models/retro/encoder_attention.py sha256=8KhGAMQBEQTa1A49oTC93fSykMMuYp49xydbcShgzmo 8070
megatron/core/models/retro/base_attention.py sha256=zmUMSvFLle9NTbafl7z_7CXkFUlyBtoszZTmw9Qmfl8 1597
megatron/core/models/retro/config.py sha256=teSnaLkRZ5ssI7WMPt8GeKZhHseIQSpIm4CL2VByK4A 3188
megatron/core/models/retro/decoder_spec.py sha256=ZSmJ1NtC8Qb6ZZiOYJDR-zmjKomP6WuMzdDL7Gowg_0 6238
megatron/core/models/gpt/gpt_layer_specs.py sha256=Ly5DeOz1I1hkybvzEqDfZod9oqgWjUW11EERY9oaelE 4561
megatron/core/models/gpt/gpt_model.py sha256=KWHhXAdaT8tYQXqY5fb9McCGQQLcB18jxoZVHZujc5E 11091
megatron/core/models/gpt/__init__.py sha256=Iuxx8BuK1ufLEvpXRr3YWDpLoL3QhesGC94LFy349cU 32
megatron/core/models/vision/multimodal_projector.py sha256=iCrg9YaRlQBksAPFuFvX3Gdsj7h2WX-7Sd3uc5YTonY 2192
megatron/core/models/vision/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/models/vision/clip_vit_model.py sha256=KwGS7fsBmflNujVUwkyJnx57jgUS7UHg4T0WagQbeL8 5447
megatron/core/inference/__init__.py sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI 63
megatron/core/inference/gpt/model_specs.py sha256=z4qx9RqL4qAxEt2PAAT7MzXPZhlReh_Jdv_VVH65XGQ 2258
megatron/core/inference/gpt/__init__.py sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI 63
megatron/core/inference/gpt/state_dict_hooks.py sha256=AYKwsZo450RtfWz-J1SgPGaHXyDrXwdDu3DDWBVjUQs 5545
megatron/core/optimizer/optimizer.py sha256=7DErugGeyPm-ym6haf-8ntrXqC-q0JFbNt9YzAyhLs0 32371
megatron/core/optimizer/distrib_optimizer.py sha256=N6VWFmzB7W13JvNtcMh6BH-j8lzdjLlCeZG-qx1o6Eg 69587
megatron/core/optimizer/__init__.py sha256=DrGGpksfouKJZxOFrND_aHc9v9h6jridGyH5YnWMhE4 13021
megatron/core/optimizer/clip_grads.py sha256=b9zakg_stxy87uKAvULQ0Y3Fu1oXWbvG-r01iu-9eBw 5797
megatron/core/optimizer/grad_scaler.py sha256=wvNBlVyDM71uJVT8x8NPdOd2sLG9TOS8tTrdmlSgV4I 5161
megatron/core/optimizer/optimizer_config.py sha256=03zEzuPjnzEdHxj8D-BfiDZyUcZkN8TkquMDhWryWhU 3453
megatron/core/transformer/module.py sha256=_6_jWf-1aEAfGZJa7PRrVJM2XY_aOmafMzUywvNWv6k 6759
megatron/core/transformer/attention.py sha256=DbqS-l3sW-uT-gmE9o0EWcNl4ffwNo9DcCa6wjHRFVk 22494
megatron/core/transformer/utils.py sha256=YSG_zoTaTew6Y_gQSN6wRWgxRZqLTOLfZvHKLGGEkGs 6949
megatron/core/transformer/transformer_layer.py sha256=oN87rFfw3pBfyEaQzYNn-hf8dQccASrNC-l4Fo-OoFQ 10273
megatron/core/transformer/transformer_config.py sha256=mHkcsFp87-QpzcHWoAjatuwdTKyJhosWeJxA7_GTRTg 17055
megatron/core/transformer/identity_op.py sha256=w35Qyy0lmN-huMJhQF-Cq29R9gTIfkklKi4TKsWEm1c 713
megatron/core/transformer/spec_utils.py sha256=Oecza11kH8i27kbXpiwxSYwPHklebks4lK1vL8IKx8c 4102
megatron/core/transformer/__init__.py sha256=XpcTTt2xON-6IFG6h4uipx3c0U5HvJkuZmwnOh1frJY 274
megatron/core/transformer/dot_product_attention.py sha256=dz_J70cOQTAOtI6xffjCk_FbBBDAWFvEx_h8SvitTow 7980
megatron/core/transformer/enums.py sha256=RFBiMep8Jn66dCN91RkqsCQ4GaWKaT5Jggc1s36_rZY 461
megatron/core/transformer/transformer_block.py sha256=PCiFxtzelDDU4pWpVsS98dlz8h-Z3ee8aBnj6vH1Kwk 17909
megatron/core/transformer/mlp.py sha256=AKnAiZB7F_Bg_W78eVJBwy92B6RiJ2Qh7Ko_X-9YBTQ 7428
megatron/core/transformer/moe/moe_utils.py sha256=F3_NSt60ncJPbGLaab9J9ep5rCs-ow-DVeb04dOQZiY 8976
megatron/core/transformer/moe/token_dispatcher.py sha256=X8yTrkHaEI3VmZomWBvk8NAjm0sgd6JXCMqx9F-4yn8 22073
megatron/core/transformer/moe/experts.py sha256=bJ9fQMebfJA9Gd_kzmTS-mAk5bNw-Gyc80hqAbkUmcQ 10642
megatron/core/transformer/moe/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/transformer/moe/moe_layer.py sha256=GPgTiSKjFvprGNKo-5i7l-UhFt7fqXHRzXu5OVdXzR4 3877
megatron/core/transformer/moe/router.py sha256=55saWInrL5vC9wXpewKWAOe6ryQOo8gJpfFKX72lTHw 9632
megatron/core/transformer/moe/grouped_gemm_util.py sha256=nPraA87A6pUnTj75bqesTuWGvawr9oMGY8V_aZZt44U 494
megatron/core/transformer/custom_layers/__init__.py sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU 0
megatron/core/transformer/custom_layers/transformer_engine.py sha256=8g6_PgKXQQec9ILwccIRsAHNqdf941OLW6KoA0NQjlM 20919
megatron_core-0.6.0.dist-info/LICENSE sha256=YPUqGUE6eK-6bsAAlFQlgAQ_6j_nubkbKOe54M8Bof0 15679
megatron_core-0.6.0.dist-info/METADATA sha256=HAGF6Icug-I-xni0b9MOk0JdQH3Z-87hcEbrm0CwGnc 1584
megatron_core-0.6.0.dist-info/top_level.txt sha256=OEOs4V4xHotpQFOUHkfPkLmqcuKfSffSlV17EmZVBjg 9
megatron_core-0.6.0.dist-info/WHEEL sha256=-7Vwsd-KuPOtdyxdAC8drxF7lN4th9mKINh8g6MaZ9k 152
megatron_core-0.6.0.dist-info/RECORD

top_level.txt

megatron