
Commit daa1ae3
Merge branch 'main' into add-api-checker
2 parents d44760a + 05c08f2

File tree: 2 files changed (+2, -2 lines)


intermediate_source/pinmem_nonblock.py (1 addition, 1 deletion)

@@ -127,7 +127,7 @@
 # 1. The device must have at least one free DMA (Direct Memory Access) engine. Modern GPU architectures such as Volterra,
 # Tesla, or H100 devices have more than one DMA engine.
 #
-# 2. The transfer must be done on a separate, non-default cuda stream. In PyTorch, cuda streams can be handles using
+# 2. The transfer must be done on a separate, non-default cuda stream. In PyTorch, cuda streams can be handled using
 # :class:`~torch.cuda.Stream`.
 #
 # 3. The source data must be in pinned memory.
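The conditions listed in this hunk (a free DMA engine, a non-default CUDA stream, and a pinned source tensor) can be sketched as follows. This is a minimal illustration, not part of the commit; the names `src`, `dst`, and `stream` are illustrative, and it assumes a CUDA-capable PyTorch build.

```python
import torch

# Sketch of an async host-to-device copy that can overlap with compute:
# the source is in pinned (page-locked) memory and the copy is issued on
# a separate, non-default CUDA stream.
if torch.cuda.is_available():
    stream = torch.cuda.Stream()                 # non-default stream
    src = torch.randn(1024, pin_memory=True)     # source in pinned memory
    with torch.cuda.stream(stream):
        # non_blocking=True lets the DMA engine run the copy asynchronously
        dst = src.to("cuda", non_blocking=True)
    # make the default stream wait before consuming dst
    torch.cuda.current_stream().wait_stream(stream)
```

Without pinned memory or with the default stream, the copy still works but serializes with other work, which is why the tutorial lists all three requirements together.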

intermediate_source/torch_compile_tutorial.py (1 addition, 1 deletion)

@@ -330,7 +330,7 @@ def bar(a, b):
 #
 # The second time we run ``bar``, we take the other branch of the if statement
 # and we get 1 traced graph corresponding to the code ``b = b * -1; return x * b``.
-# We do not see a graph of ``x = a / (torch.abs(a) + 1)`` outputted the second time
+# We do not see a graph of ``x = a / (torch.abs(a) + 1); b.sum()`` outputted the second time
 # since ``torch.compile`` cached this graph from the first run and re-used it.
 #
 # Let's investigate by example how TorchDynamo would step through ``bar``.
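For context, the ``bar`` function this hunk refers to can be reconstructed from the code fragments quoted in the diff (``x = a / (torch.abs(a) + 1)``, ``b.sum()``, ``b = b * -1; return x * b``). The sketch below is an assumption based on those fragments, not text from the commit itself.

```python
import torch

def bar(a, b):
    x = a / (torch.abs(a) + 1)
    if b.sum() < 0:          # data-dependent branch: TorchDynamo breaks the graph here
        b = b * -1
    return x * b

# torch.compile traces a graph up to the branch and one for each branch taken.
# On a second call that takes the other branch, the graph for
# ``x = a / (torch.abs(a) + 1); b.sum()`` is reused from the cache rather
# than re-traced, which is what the corrected sentence describes.
opt_bar = torch.compile(bar)
```

Compilation is lazy, so the graphs are traced on the first call to ``opt_bar``; calling it with inputs where ``b.sum()`` has the opposite sign then exercises the cached-graph reuse.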
