We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 851c4cf · commit 8c2c2f0 · Copy full SHA for 8c2c2f0
distributed/tensor_parallelism/fsdp_tp_example.py
@@ -107,17 +107,13 @@
107
{
108
"tok_embeddings": RowwiseParallel(
109
input_layouts=Replicate(),
110
+ output_layouts=Shard(1),
111
),
112
"output": ColwiseParallel(
113
input_layouts=Shard(1),
114
output_layouts=Replicate()
115
116
"norm": SequenceParallel(),
- "layers.0": PrepareModuleInput(
117
- input_layouts=(Replicate(), None),
118
- desired_input_layouts=(Shard(1), None),
119
- use_local_output=True,
120
- ),
121
}
122
)
123
0 commit comments