File tree Expand file tree Collapse file tree 1 file changed +4
-4
lines changed Expand file tree Collapse file tree 1 file changed +4
-4
lines changed Original file line number Diff line number Diff line change @@ -221,30 +221,30 @@ def benchmark_with_profiler(
221
221
# .. figure:: /_static/img/pinmem/trace_streamed0_pinned0.png
222
222
# :alt:
223
223
#
224
+ # Using a pinned tensor doesn't change the trace much; both operations are still executed consecutively:
224
225
225
226
benchmark_with_profiler (streamed = True , pinned = False )
226
227
227
228
######################################################################
228
- # Using a pinned tensor doesn't change the trace much, both operations are still executed consecutively:
229
229
#
230
230
# .. figure:: /_static/img/pinmem/trace_streamed0_pinned1.png
231
231
# :alt:
232
232
#
233
+ # Sending a pageable tensor to the GPU on a separate stream is also a blocking operation:
233
234
234
235
benchmark_with_profiler (streamed = False , pinned = True )
235
236
236
237
######################################################################
237
- # Sending a pageable tensor to GPU on a separate stream is also a blocking operation:
238
238
#
239
239
# .. figure:: /_static/img/pinmem/trace_streamed1_pinned0.png
240
240
# :alt:
241
241
#
242
+ # Only pinned tensor copies to GPU on a separate stream overlap with another CUDA kernel executed on
243
+ # the main stream:
242
244
243
245
benchmark_with_profiler (streamed = True , pinned = True )
244
246
245
247
######################################################################
246
- # Only pinned tensors copies to GPU on a separate stream overlap with another cuda kernel executed on
247
- # the main stream:
248
248
#
249
249
# .. figure:: /_static/img/pinmem/trace_streamed1_pinned1.png
250
250
# :alt:
You can’t perform that action at this time.
0 commit comments