| .. |
|
_composable
|
Add early_stop kwarg to torch.utils.checkpoint (#160781)
|
2025-08-26 22:32:35 +00:00 |
|
_pycute
|
[CuTe] Add type for CuTe layout via claude (#162534)
|
2025-09-12 04:59:21 +00:00 |
|
_shard
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
_sharded_tensor
|
|
|
|
_sharding_spec
|
|
|
|
_symmetric_memory
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
_tensor
|
|
|
|
_tools
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
algorithms
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
autograd
|
|
|
|
benchmarks
|
|
|
|
checkpoint
|
[DCP] Avoid multiple storage writer resets in async save (#159448)
|
2025-09-10 00:43:03 +00:00 |
|
elastic
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
examples
|
|
|
|
fsdp
|
[precompile] Fix issues with guard serialization on distributed types. (#162418)
|
2025-09-11 23:09:55 +00:00 |
|
launcher
|
154849 Add support to handle SIGUSR1 and SIGUSR2 in multiprocessing (#160690)
|
2025-09-09 22:23:06 +00:00 |
|
nn
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
optim
|
|
|
|
pipelining
|
Replace export_for_training with export (#162396)
|
2025-09-10 14:19:34 +00:00 |
|
rpc
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
tensor
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
__init__.py
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
_C_stubs.py
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
_checkpointable.py
|
|
|
|
_composable_state.py
|
|
|
|
_dist2.py
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
_distributed_c10d.py
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
_functional_collectives_impl.py
|
|
|
|
_functional_collectives.py
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
_mesh_layout.py
|
[DeviceMesh] Make CuTe layout as mesh layout to be ready for using in DeviceMesh (#162414)
|
2025-09-12 07:32:56 +00:00 |
|
_serialization.py
|
|
|
|
_state_dict_utils.py
|
fix-unpin-memory-tensor-param (#160992)
|
2025-08-26 21:55:25 +00:00 |
|
argparse_util.py
|
|
|
|
c10d_logger.py
|
|
|
|
collective_utils.py
|
[C10D] add _summarize_ranks util (#160284)
|
2025-08-28 00:17:53 +00:00 |
|
constants.py
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
CONTRIBUTING.md
|
fix torch/distributed contributing doc (#158934)
|
2025-07-28 17:01:05 +00:00 |
|
device_mesh.py
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
distributed_c10d.py
|
[RELAND] Always build USE_DISTRIBUTED (#160449) and Make distributed modules importable even when backend not built (#159889) (#162594)
|
2025-09-12 10:54:42 +00:00 |
|
launch.py
|
|
|
|
logging_handlers.py
|
|
|
|
remote_device.py
|
|
|
|
rendezvous.py
|
|
|
|
run.py
|
Support XPU in --nproc-per-node option to torchrun (#159474)
|
2025-09-12 08:32:04 +00:00 |
|
utils.py
|
|
|