..
|
__init__.py
|
allgather.py
|
allreduce_max.py
|
allreduce_sum.py
|
barrier.py
|
broadcast.py
|
checkpointing.py
|
column_parallelism.py
|
custom_data_parallel.py
|
data_parallel.py
|
ddp.py
|
efficient_data_parallel.py
|
gather.py
|
gpipe.py
|
megatron_datasets.py
|
megatron_mlp_gelu.py
|
mpu.py
|
multi_process_1.py
|
multi_process_2.py
|
multi_process_3.py
|
non_parallelism.py
|
p2p_communication.py
|
p2p_communication_non_blocking.py
|
parallelformers_inference.py
|
pipe_dream.py
|
process_group_1.py
|
process_group_2.py
|
process_group_3.py
|
process_group_4.py
|
reduce_max.py
|
reduce_scatter.py
|
reduce_sum.py
|
row_parallelism.py
|
scatter.py
|
scatter_nccl.py
|
test_mpu.py
|
zero_args.py
|
zero_config.py
|
zero_dp_config.json
|
zero_off_config.json
|
zero_r_config.json
|