amend

Vincent Moens · Vincent Moens · commit 69e98ea3420a · 2024-07-30T10:07:50.000-04:00
diff --git a/intermediate_source/pinmem_nonblock.py b/intermediate_source/pinmem_nonblock.py
@@ -221,30 +221,30 @@ def benchmark_with_profiler(
 # .. figure:: /_static/img/pinmem/trace_streamed0_pinned0.png
 #    :alt:
 #
+# Using a pinned tensor doesn't change the trace much; both operations are still executed consecutively:
 
 benchmark_with_profiler(streamed=True, pinned=False)
 
 ######################################################################
-# Using a pinned tensor doesn't change the trace much, both operations are still executed consecutively:
 #
 # .. figure:: /_static/img/pinmem/trace_streamed0_pinned1.png
 #    :alt:
 #
+# Sending a pageable tensor to GPU on a separate stream is also a blocking operation:
 
 benchmark_with_profiler(streamed=False, pinned=True)
 
 ######################################################################
-# Sending a pageable tensor to GPU on a separate stream is also a blocking operation:
 #
 # .. figure:: /_static/img/pinmem/trace_streamed1_pinned0.png
 #    :alt:
 #
+# Only copies of pinned tensors to the GPU on a separate stream overlap with another CUDA kernel executed on
+# the main stream:
 
 benchmark_with_profiler(streamed=True, pinned=True)
 
 ######################################################################
-# Only pinned tensors copies to GPU on a separate stream overlap with another cuda kernel executed on
-# the main stream:
 #
 # .. figure:: /_static/img/pinmem/trace_streamed1_pinned1.png
 #    :alt:

Original file line number	Diff line number	Diff line change
`@@ -221,30 +221,30 @@ def benchmark_with_profiler(`
`221`	`221`	`# .. figure:: /_static/img/pinmem/trace_streamed0_pinned0.png`
`222`	`222`	`# :alt:`
`223`	`223`	`#`
	`224`	`+# Using a pinned tensor doesn't change the trace much; both operations are still executed consecutively:`
`224`	`225`
`225`	`226`	`benchmark_with_profiler(streamed=True, pinned=False)`
`226`	`227`
`227`	`228`	`######################################################################`
`228`		`-# Using a pinned tensor doesn't change the trace much, both operations are still executed consecutively:`
`229`	`229`	`#`
`230`	`230`	`# .. figure:: /_static/img/pinmem/trace_streamed0_pinned1.png`
`231`	`231`	`# :alt:`
`232`	`232`	`#`
	`233`	`+# Sending a pageable tensor to GPU on a separate stream is also a blocking operation:`
`233`	`234`
`234`	`235`	`benchmark_with_profiler(streamed=False, pinned=True)`
`235`	`236`
`236`	`237`	`######################################################################`
`237`		`-# Sending a pageable tensor to GPU on a separate stream is also a blocking operation:`
`238`	`238`	`#`
`239`	`239`	`# .. figure:: /_static/img/pinmem/trace_streamed1_pinned0.png`
`240`	`240`	`# :alt:`
`241`	`241`	`#`
	`242`	`+# Only copies of pinned tensors to the GPU on a separate stream overlap with another CUDA kernel executed on`
	`243`	`+# the main stream:`
`242`	`244`
`243`	`245`	`benchmark_with_profiler(streamed=True, pinned=True)`
`244`	`246`
`245`	`247`	`######################################################################`
`246`		`-# Only pinned tensors copies to GPU on a separate stream overlap with another cuda kernel executed on`
`247`		`-# the main stream:`
`248`	`248`	`#`
`249`	`249`	`# .. figure:: /_static/img/pinmem/trace_streamed1_pinned1.png`
`250`	`250`	`# :alt:`