Path |
Digest |
Size |
megatron/core/requirements.txt |
sha256=N79Rv7pGmalAzjE0lCKySlvFWisXnteux0RZqa6NV7c
|
5 |
megatron/core/utils.py |
sha256=fKd6wQWYVKN49I051LjAKHthbDOpf5Y3ZiAEPTK9OwE
|
11810 |
megatron/core/package_info.py |
sha256=NIZcPzkVvewdWsyePDIUDoFF1p31dLRD-z87o_uqHN8
|
994 |
megatron/core/parallel_state.py |
sha256=B1a9ilsnvrjuT3KGa1_6z5JM_FHj3LVnJXJV96VWOYI
|
44946 |
megatron/core/jit.py |
sha256=eve_fNxWf_sI_n0OcfRWB4dkeXrfyr-DxnsQFqwk6rE
|
362 |
megatron/core/packed_seq_params.py |
sha256=9UCfT8-YrgLb-rfxxdikxSxWymAzPDChma5tPyDoIYY
|
358 |
megatron/core/__init__.py |
sha256=9IxLMwIkZYFhrOLn24_6olzO3PxryY3msBA1tnLuzQU
|
571 |
megatron/core/inference_params.py |
sha256=FaCRNoD5Z-9DDHRwGckHhext0q_DfiFc9ZTFDQupVdc
|
1241 |
megatron/core/enums.py |
sha256=OIc-mEyKwE-d3iYoSkhAN4ch3mIrFui9cgaLrMW6j8o
|
205 |
megatron/core/timers.py |
sha256=6Ocbn9nFQIQ_G8ZmAuVZwOvKbZ6qtFigMf8MrJC5390
|
14987 |
megatron/core/model_parallel_config.py |
sha256=15EJqaU_tA2a2XikaW6uG74_UiUieIrOpyD2UQrDZ3g
|
12283 |
megatron/core/pipeline_parallel/__init__.py |
sha256=e_qNyIBDy0CW-kzKxLwo1uMkWdCaVXPVy1s0GEH0wb4
|
49 |
megatron/core/pipeline_parallel/schedules.py |
sha256=3Up5_aTL5ReRNyBUqqNoOxBdXdLuyeaDYTe8WCRok0U
|
55130 |
megatron/core/pipeline_parallel/p2p_communication.py |
sha256=i3bUt97ar7h5jJT03h4N8IFsHprrAQz9wI6yhK5VA8M
|
19593 |
megatron/core/dist_checkpointing/serialization.py |
sha256=zLtk56R-A6Gr8tyApflUrKxa_f1z7VdDDFqAc3dxZbE
|
19949 |
megatron/core/dist_checkpointing/utils.py |
sha256=DmNu5ctRxV_fpRephFDiAbqO6NYesTvXffN5KhKVNrY
|
5668 |
megatron/core/dist_checkpointing/optimizer.py |
sha256=PBtv0FkEG8COYI9K1Zf78_pWZfqzDRBoOEIDCmUX3GQ
|
5423 |
megatron/core/dist_checkpointing/mapping.py |
sha256=FV31H5y_-1mq--PLBF4i41vOVlZCsJRrYnfVYdBavnI
|
13516 |
megatron/core/dist_checkpointing/__init__.py |
sha256=w43C479LFnwuTUgM-LHg_wlvCG87xN79XJ98DV_-NDU
|
310 |
megatron/core/dist_checkpointing/core.py |
sha256=9Y1GhAe-J0J2DIicxnTtYLBJFO83nuqPh2tIYTwxcpk
|
2189 |
megatron/core/dist_checkpointing/dict_utils.py |
sha256=QxSomKWQ7VGbSAvrRRtSIrjfvAngEewjgDhUPVStPfQ
|
8397 |
megatron/core/dist_checkpointing/strategies/torch.py |
sha256=3EZHTvkH_uo8934R0fgxnUKZe-hZYRTVTGavcPfIpnM
|
21080 |
megatron/core/dist_checkpointing/strategies/tensorstore.py |
sha256=03TOpEzECuFexLHc2FRgZ0LqfbiLwd3bhbraRZZm8x8
|
4574 |
megatron/core/dist_checkpointing/strategies/two_stage.py |
sha256=sUqQHRRPqquitT9m6kqXlfxNgjty-figRGtuU9ROxOs
|
10184 |
megatron/core/dist_checkpointing/strategies/base.py |
sha256=vffljwyqFrTsjYj608-bqgmTk8OPS5ufQuoeJqDhNvw
|
4041 |
megatron/core/dist_checkpointing/strategies/__init__.py |
sha256=HhfhTHPqqEQW39LaWTPdel9MwKRMbFZNCiILZeGyPHw
|
116 |
megatron/core/dist_checkpointing/strategies/zarr.py |
sha256=Um4YDKo-Tbuync3yt7tr563CDHJrqmcWcLRWsbz2UcE
|
10873 |
megatron/core/dist_checkpointing/strategies/state_dict_saver.py |
sha256=RjoAgfNsoEy76cgnNE_siYqC3oZFDCBYI93G0f1BTWY
|
5395 |
megatron/core/dist_checkpointing/strategies/filesystem_async.py |
sha256=PmFf14SoPZ_DQSWoyiFHEW21Dek99-8rUeNsSl9v2-U
|
10779 |
megatron/core/distributed/__init__.py |
sha256=XKCTnGgnZt4yccdJ35Ez-tGCU9xv_SXfBe4Aa8K1CUI
|
250 |
megatron/core/distributed/finalize_model_grads.py |
sha256=HXlfi4SteRhRoCVvXPxARo2bLMqN3_ap9gPMdCghbX8
|
5546 |
megatron/core/distributed/distributed_data_parallel.py |
sha256=veTvlW7Vontwj7ihART-cOnT_glF39dSA5dSNvf6Gmk
|
12045 |
megatron/core/distributed/param_and_grad_buffer.py |
sha256=Qx6LfH8Flfx-QZelffI-lYbzGk_4a4D3FLISKHJMUlQ
|
23140 |
megatron/core/fusions/fused_bias_geglu.py |
sha256=6JmbmIno-yESd4mf2DfCvvouIvnrx1772Q2NJABQSOY
|
2361 |
megatron/core/fusions/fused_bias_dropout.py |
sha256=p8YvmcNVl7ak6pM3AJMBebZaxt2svaXAZ-MW5OLU1a8
|
2897 |
megatron/core/fusions/fused_bias_swiglu.py |
sha256=s9Cohuph4dfKlTlFnRsHhOxtz69YIMvx5rAe9YtYkmE
|
2033 |
megatron/core/fusions/fused_softmax.py |
sha256=Hicykgpfoaf7dU2WSw1Z7dRp7q4T83ClOeNMTqg91yw
|
7623 |
megatron/core/fusions/fused_bias_gelu.py |
sha256=Tvi022WliITbshUzz50bTAp5F5l-hydHUGdWEUcFf-0
|
1400 |
megatron/core/fusions/fused_layer_norm.py |
sha256=uFsZY3xhhOkro3JGuK5m5S_MoF9nOC1BzSpZ-Ni6xDQ
|
5548 |
megatron/core/fusions/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/tensor_parallel/utils.py |
sha256=NgKfgebwaJsSfvnMoVOg5gPRu_hNzw7eyNbRNl0-SRQ
|
4030 |
megatron/core/tensor_parallel/mappings.py |
sha256=qod6146HOIM_UAXSAgy1So_0bKEsqaXe4yh11cXUkDY
|
15517 |
megatron/core/tensor_parallel/random.py |
sha256=Daxx-QsJ_us1fO67kfusCnfODS_oZ6S3XM-0Q3sWsyo
|
10265 |
megatron/core/tensor_parallel/__init__.py |
sha256=NYklUTAS4r1DCQ11LBmtKtGHHww4QQn873oqkQukWoI
|
2312 |
megatron/core/tensor_parallel/layers.py |
sha256=VZic_plTzd4QmT345Xj6rNms_ApAdRd9Hb9kze5qXnU
|
40998 |
megatron/core/tensor_parallel/data.py |
sha256=iY-Cc0s9uEjIvnBes1l9HfP87_KVDTG-I8y1bZ295u4
|
3355 |
megatron/core/tensor_parallel/cross_entropy.py |
sha256=L0b5MKGN5sW6z4CflnmXkjQl4ZRXVz7_VS5LIex_k0k
|
6314 |
megatron/core/datasets/helpers.cpython-311-x86_64-linux-gnu.so |
sha256=V3tgha5vjdXigij00zEFuD43Gom78QU7JLt4mQVmr_o
|
4097248 |
megatron/core/datasets/utils.py |
sha256=9VSI-jMJBy4M1AnvpWEiVWsDZXf_pZNC2KTTAFpocqI
|
1641 |
megatron/core/datasets/blended_dataset.py |
sha256=k3TbIjpN9toZ2h-fPDMlbtypnpygHGbhE4P1ANgFDLI
|
7163 |
megatron/core/datasets/blended_megatron_dataset_config.py |
sha256=ejnk5UE7uxeulYc2BGrNpDM1v-YUyfa6gzR6ixaegko
|
5624 |
megatron/core/datasets/gpt_dataset.py |
sha256=YHa_uSad2XUVIdMuXfzRwn-Kn_II32t_Z-gnIHPZVuM
|
25889 |
megatron/core/datasets/helpers.cpp |
sha256=E0s4qkHpKErMAx2SocYrIlV59jwZodwiuC90glLSa5o
|
26731 |
megatron/core/datasets/megatron_dataset.py |
sha256=CiTlDwMcqUqHUkGJ7tHB0bp_KJUMdVKcXD934sDP27U
|
6937 |
megatron/core/datasets/indexed_dataset.py |
sha256=uFbhsJXQuWxb2MFh0qr02gBnkVXm-7-iVhjNkBRgLUU
|
24630 |
megatron/core/datasets/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/datasets/megatron_tokenizer.py |
sha256=ShKv9KAayvtZfIRFlfQNxiZBKKCrOJNgXAlu-5xqHKM
|
3792 |
megatron/core/datasets/bert_dataset.py |
sha256=igBtkLpW_rikrkt3uT20NWojvZr_bk6NxopCZeEHdrE
|
7196 |
megatron/core/datasets/multimodal_dataset.py |
sha256=lRpC4GOlCElrDTOeE4sVhE5WARhfzWmYvr6FuXBR_Os
|
1907 |
megatron/core/datasets/blended_megatron_dataset_builder.py |
sha256=VuX64eCX_GTHxO07P9SzzAeP1dLdtppIWvmclAV_QqU
|
13373 |
megatron/core/datasets/t5_dataset.py |
sha256=v0BdzKjooAausMvdtuWpYoYwWkJZczRWw7T6hwNXi54
|
8298 |
megatron/core/datasets/masked_dataset.py |
sha256=Eib8J1kFcmALRXB8aY4slsTPOGlSNgEcmU87Wcu8IHE
|
16773 |
megatron/core/datasets/retro/external_libs.py |
sha256=KKcgrQCfO1Tg-qftxzGM0WZH7X8TN3dqWpwKHc0AT8w
|
506 |
megatron/core/datasets/retro/utils.py |
sha256=Jbr81V6nXlYMaksGUQZvuwwwzOZKeRAmPTQ1NPFHZ8k
|
12319 |
megatron/core/datasets/retro/__init__.py |
sha256=qRMVBbNTh1tNiF3dboxFUPbwrt52EX0U0rxuhEYjUts
|
251 |
megatron/core/datasets/retro/query/utils.py |
sha256=pPTwyY-z4LcTk_JjYVuWoUXdEbaGAZEqlV1nWWc2HBg
|
1112 |
megatron/core/datasets/retro/query/multi_split_gpt_dataset.py |
sha256=4dBCQnlE_AFdG_YeduBmWMXMQGmwONzOF96dLdKdb1g
|
4167 |
megatron/core/datasets/retro/query/retro_dataset.py |
sha256=t6Fo_JtGsSS8oetnBMTJrgHdWnocMpXW_ouV6PmaC3w
|
9334 |
megatron/core/datasets/retro/query/query.py |
sha256=yMIc9BVCzkZ8IZKkRSLlkjs61454CWTh7k9V49k54ZM
|
14333 |
megatron/core/datasets/retro/query/__init__.py |
sha256=k_Cvc2yxTe93EhbgoQAhhk7CNTjCzLm8sws66Jj55n4
|
64 |
megatron/core/datasets/retro/query/gpt_chunk_dataset.py |
sha256=ilflgHX-vG6QLQtQUh_ZMw9jl_8lHN3xz6B6slC_BZc
|
3800 |
megatron/core/datasets/retro/index/utils.py |
sha256=r53plTOcFthQf4xHwfpIW8o4YrYQhLpKiy13klwIcwY
|
3965 |
megatron/core/datasets/retro/index/index.py |
sha256=jW1jf_D5Y03kXeVAok16yIImZawnTgiOHCcDXVr3SrM
|
4946 |
megatron/core/datasets/retro/index/factory.py |
sha256=vnI271LXG6tBKtUkeDKT9XnDa_uHIMDSjhtPrHUL6mM
|
1376 |
megatron/core/datasets/retro/index/__init__.py |
sha256=hm55AK1FGTWvuaNriGg1WgV0-T0F9NAygBRR61TThPM
|
317 |
megatron/core/datasets/retro/index/build.py |
sha256=Cl6q1jRzWpV6USy7V4nXnfzNnyvIsEifHq0TfKeuUiY
|
9253 |
megatron/core/datasets/retro/index/validate.py |
sha256=HluCM0m8U8fIxoDWhUTN7PkZa8fJhmXbPnamAfdebWA
|
6073 |
megatron/core/datasets/retro/index/indexes/faiss_par_add.py |
sha256=gKYMJrOW7lig1iOGWTl7GTcuZ3pV_CWwaALwNeaVzNc
|
7557 |
megatron/core/datasets/retro/index/indexes/__init__.py |
sha256=YftO_ZxhxOzW61fD2Ga2-Ebx7UtyVrr7dWHDt4PoH4Q
|
285 |
megatron/core/datasets/retro/index/indexes/faiss_base.py |
sha256=Mb41GBWtpKdybw-94slb0rZvB9ZRk3ZNe-XaVNSLvAI
|
4988 |
megatron/core/datasets/retro/db/utils.py |
sha256=7QZs6Furqe7W2Xn5oim6vH7oJDszlUHw4_Z4I4nLu9o
|
12767 |
megatron/core/datasets/retro/db/dataset.py |
sha256=IOcRiHbgat8RIrcqmjGs0fRItAaaLAc6zgFNOjBrilQ
|
3608 |
megatron/core/datasets/retro/db/__init__.py |
sha256=WdGDuNtiJ5_-H27yxJyDfGxdgECk0k3E_OiHVuFK44M
|
182 |
megatron/core/datasets/retro/db/build.py |
sha256=BA9C_hwvYFwyNTn3_-7HMKKlXe7cZAJFACK9H8qnH7U
|
23712 |
megatron/core/datasets/retro/config/tokenizers.py |
sha256=H8SprrOWcSCXOA1vLdgBMt1umbAYgr4MgQUCb3foFpQ
|
385 |
megatron/core/datasets/retro/config/bert_embedders.py |
sha256=QdLlK05x-oPoUlxXk60v1N42hc6LYOk7kBoFmLzxoCE
|
1327 |
megatron/core/datasets/retro/config/gpt_chunk_datasets.py |
sha256=UuwnMf0VQBobCgAHyVudbrrosE61FQByIaJB3sxto2k
|
417 |
megatron/core/datasets/retro/config/__init__.py |
sha256=IffC2zcSCB_YEVBoJKTmucCl8Agq_xYkgOv3WIxDmAk
|
634 |
megatron/core/datasets/retro/config/config.py |
sha256=Gr2UTnVwN7qD6jnwdh46Aslw6ZBIJuKLWDPI9IG7ghg
|
9117 |
megatron/core/models/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/T5/t5_model.py |
sha256=MJTwVl7X3aQsBNLV7GKcx76j90_PciKHkjou4HcLhDc
|
17391 |
megatron/core/models/T5/t5_spec.py |
sha256=SM4I3Y6HrwxhPhvITbIITKIH8jJqZpl0dc-GuJX11sM
|
8521 |
megatron/core/models/T5/__init__.py |
sha256=qWLhaTIZdpSDNSNGdW5Ll0kmiQ7Jua6iqr5roko3EOY
|
30 |
megatron/core/models/multimodal/llava_model.py |
sha256=rmmce_K6OTebC4Q1tuWWTdfthgQrPs6_uaa3iJqJazo
|
5470 |
megatron/core/models/multimodal/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/bert/bert_lm_head.py |
sha256=ki5Rd7K5JfUIdLZ-sDTOzSOCt3btbBpYsQYYBCqdMxw
|
1373 |
megatron/core/models/bert/bert_model.py |
sha256=z5QSGnDtfatjA1h17GFZXs5wP7NuKIdvysp84qvlw6o
|
11571 |
megatron/core/models/bert/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/bert/pooler.py |
sha256=Q8ZYHDFEdWwhV1NxCL9UxHPsHkauKiir5CuXB4zdlWc
|
1823 |
megatron/core/models/bert/bert_layer_specs.py |
sha256=zHWdrkSdg9dPk_QStEQRnHd7KM3-HQbxOac3i5ixoXk
|
3024 |
megatron/core/models/common/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/common/vision_module/vision_module.py |
sha256=SUwBfItrNKZdEHtw_NCCRgF0PBsaBX_lqTAnPpC4zCE
|
635 |
megatron/core/models/common/vision_module/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/common/language_module/language_module.py |
sha256=TDHCtcXEw9pvYCVwaCjIsGYPdMqRpsuA9kXuIy6BQI0
|
8963 |
megatron/core/models/common/language_module/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/common/embeddings/rotary_pos_embedding.py |
sha256=QsXFoUcE7QkcWQuckEdp9jZqBfGzfbuF_MYoyfSY3d4
|
9036 |
megatron/core/models/common/embeddings/language_model_embedding.py |
sha256=RgiuVS8ibSUANFyIRbhB8G7L3Hb6xgw1wmrGgP8y9Tc
|
5357 |
megatron/core/models/common/embeddings/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/retro/utils.py |
sha256=yhI3b4VcURObUqw1_Iw_HIJ-ENMBQG2qjubYVa0PANo
|
749 |
megatron/core/models/retro/decoder_attention.py |
sha256=Vqj9B4-XhXufW8aCrjCGSZa-l1lTTVcvxAnblVdak8Q
|
11441 |
megatron/core/models/retro/encoder_spec.py |
sha256=1lQEMoiGt0Xn9yX16cPqtIhhJXVLAmKB0bXvaPW24DI
|
5890 |
megatron/core/models/retro/__init__.py |
sha256=wBWEz9cWtITwx_zWX9NXZQMnVXp6ADm6cR9bXfU-56w
|
371 |
megatron/core/models/retro/model.py |
sha256=ES5DUr8gqkHYWJJWWdsA5s-FSW9aoCE0Ex3so2lmHSY
|
3762 |
megatron/core/models/retro/encoder_attention.py |
sha256=8KhGAMQBEQTa1A49oTC93fSykMMuYp49xydbcShgzmo
|
8070 |
megatron/core/models/retro/base_attention.py |
sha256=zmUMSvFLle9NTbafl7z_7CXkFUlyBtoszZTmw9Qmfl8
|
1597 |
megatron/core/models/retro/config.py |
sha256=teSnaLkRZ5ssI7WMPt8GeKZhHseIQSpIm4CL2VByK4A
|
3188 |
megatron/core/models/retro/decoder_spec.py |
sha256=ZSmJ1NtC8Qb6ZZiOYJDR-zmjKomP6WuMzdDL7Gowg_0
|
6238 |
megatron/core/models/gpt/gpt_layer_specs.py |
sha256=Ly5DeOz1I1hkybvzEqDfZod9oqgWjUW11EERY9oaelE
|
4561 |
megatron/core/models/gpt/gpt_model.py |
sha256=KWHhXAdaT8tYQXqY5fb9McCGQQLcB18jxoZVHZujc5E
|
11091 |
megatron/core/models/gpt/__init__.py |
sha256=Iuxx8BuK1ufLEvpXRr3YWDpLoL3QhesGC94LFy349cU
|
32 |
megatron/core/models/vision/multimodal_projector.py |
sha256=iCrg9YaRlQBksAPFuFvX3Gdsj7h2WX-7Sd3uc5YTonY
|
2192 |
megatron/core/models/vision/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/models/vision/clip_vit_model.py |
sha256=KwGS7fsBmflNujVUwkyJnx57jgUS7UHg4T0WagQbeL8
|
5447 |
megatron/core/inference/__init__.py |
sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI
|
63 |
megatron/core/inference/gpt/model_specs.py |
sha256=z4qx9RqL4qAxEt2PAAT7MzXPZhlReh_Jdv_VVH65XGQ
|
2258 |
megatron/core/inference/gpt/__init__.py |
sha256=KjZwACgGud02uCiDVSB9JkZ7IJRezdwf7urlCIZAqXI
|
63 |
megatron/core/inference/gpt/state_dict_hooks.py |
sha256=AYKwsZo450RtfWz-J1SgPGaHXyDrXwdDu3DDWBVjUQs
|
5545 |
megatron/core/optimizer/optimizer.py |
sha256=7DErugGeyPm-ym6haf-8ntrXqC-q0JFbNt9YzAyhLs0
|
32371 |
megatron/core/optimizer/distrib_optimizer.py |
sha256=N6VWFmzB7W13JvNtcMh6BH-j8lzdjLlCeZG-qx1o6Eg
|
69587 |
megatron/core/optimizer/__init__.py |
sha256=DrGGpksfouKJZxOFrND_aHc9v9h6jridGyH5YnWMhE4
|
13021 |
megatron/core/optimizer/clip_grads.py |
sha256=b9zakg_stxy87uKAvULQ0Y3Fu1oXWbvG-r01iu-9eBw
|
5797 |
megatron/core/optimizer/grad_scaler.py |
sha256=wvNBlVyDM71uJVT8x8NPdOd2sLG9TOS8tTrdmlSgV4I
|
5161 |
megatron/core/optimizer/optimizer_config.py |
sha256=03zEzuPjnzEdHxj8D-BfiDZyUcZkN8TkquMDhWryWhU
|
3453 |
megatron/core/transformer/module.py |
sha256=_6_jWf-1aEAfGZJa7PRrVJM2XY_aOmafMzUywvNWv6k
|
6759 |
megatron/core/transformer/attention.py |
sha256=DbqS-l3sW-uT-gmE9o0EWcNl4ffwNo9DcCa6wjHRFVk
|
22494 |
megatron/core/transformer/utils.py |
sha256=YSG_zoTaTew6Y_gQSN6wRWgxRZqLTOLfZvHKLGGEkGs
|
6949 |
megatron/core/transformer/transformer_layer.py |
sha256=oN87rFfw3pBfyEaQzYNn-hf8dQccASrNC-l4Fo-OoFQ
|
10273 |
megatron/core/transformer/transformer_config.py |
sha256=mHkcsFp87-QpzcHWoAjatuwdTKyJhosWeJxA7_GTRTg
|
17055 |
megatron/core/transformer/identity_op.py |
sha256=w35Qyy0lmN-huMJhQF-Cq29R9gTIfkklKi4TKsWEm1c
|
713 |
megatron/core/transformer/spec_utils.py |
sha256=Oecza11kH8i27kbXpiwxSYwPHklebks4lK1vL8IKx8c
|
4102 |
megatron/core/transformer/__init__.py |
sha256=XpcTTt2xON-6IFG6h4uipx3c0U5HvJkuZmwnOh1frJY
|
274 |
megatron/core/transformer/dot_product_attention.py |
sha256=dz_J70cOQTAOtI6xffjCk_FbBBDAWFvEx_h8SvitTow
|
7980 |
megatron/core/transformer/enums.py |
sha256=RFBiMep8Jn66dCN91RkqsCQ4GaWKaT5Jggc1s36_rZY
|
461 |
megatron/core/transformer/transformer_block.py |
sha256=PCiFxtzelDDU4pWpVsS98dlz8h-Z3ee8aBnj6vH1Kwk
|
17909 |
megatron/core/transformer/mlp.py |
sha256=AKnAiZB7F_Bg_W78eVJBwy92B6RiJ2Qh7Ko_X-9YBTQ
|
7428 |
megatron/core/transformer/moe/moe_utils.py |
sha256=F3_NSt60ncJPbGLaab9J9ep5rCs-ow-DVeb04dOQZiY
|
8976 |
megatron/core/transformer/moe/token_dispatcher.py |
sha256=X8yTrkHaEI3VmZomWBvk8NAjm0sgd6JXCMqx9F-4yn8
|
22073 |
megatron/core/transformer/moe/experts.py |
sha256=bJ9fQMebfJA9Gd_kzmTS-mAk5bNw-Gyc80hqAbkUmcQ
|
10642 |
megatron/core/transformer/moe/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/transformer/moe/moe_layer.py |
sha256=GPgTiSKjFvprGNKo-5i7l-UhFt7fqXHRzXu5OVdXzR4
|
3877 |
megatron/core/transformer/moe/router.py |
sha256=55saWInrL5vC9wXpewKWAOe6ryQOo8gJpfFKX72lTHw
|
9632 |
megatron/core/transformer/moe/grouped_gemm_util.py |
sha256=nPraA87A6pUnTj75bqesTuWGvawr9oMGY8V_aZZt44U
|
494 |
megatron/core/transformer/custom_layers/__init__.py |
sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
|
0 |
megatron/core/transformer/custom_layers/transformer_engine.py |
sha256=8g6_PgKXQQec9ILwccIRsAHNqdf941OLW6KoA0NQjlM
|
20919 |
megatron_core-0.6.0.dist-info/LICENSE |
sha256=YPUqGUE6eK-6bsAAlFQlgAQ_6j_nubkbKOe54M8Bof0
|
15679 |
megatron_core-0.6.0.dist-info/METADATA |
sha256=HAGF6Icug-I-xni0b9MOk0JdQH3Z-87hcEbrm0CwGnc
|
1584 |
megatron_core-0.6.0.dist-info/top_level.txt |
sha256=OEOs4V4xHotpQFOUHkfPkLmqcuKfSffSlV17EmZVBjg
|
9 |
megatron_core-0.6.0.dist-info/WHEEL |
sha256=-7Vwsd-KuPOtdyxdAC8drxF7lN4th9mKINh8g6MaZ9k
|
152 |
megatron_core-0.6.0.dist-info/RECORD |
— |
— |