diff --git a/_static/img/onnx/custom_addandround_function.png b/_static/img/onnx/custom_addandround_function.png
new file mode 100644
index 00000000000..a0c7000161e
Binary files /dev/null and b/_static/img/onnx/custom_addandround_function.png differ
diff --git a/_static/img/onnx/custom_addandround_model.png b/_static/img/onnx/custom_addandround_model.png
new file mode 100644
index 00000000000..793d8cfbb5d
Binary files /dev/null and b/_static/img/onnx/custom_addandround_model.png differ
diff --git a/_static/img/onnx/custom_aten_add_function.png b/_static/img/onnx/custom_aten_add_function.png
new file mode 100644
index 00000000000..d9f927ce707
Binary files /dev/null and b/_static/img/onnx/custom_aten_add_function.png differ
diff --git a/_static/img/onnx/custom_aten_add_model.png b/_static/img/onnx/custom_aten_add_model.png
new file mode 100644
index 00000000000..e5ef1c71742
Binary files /dev/null and b/_static/img/onnx/custom_aten_add_model.png differ
diff --git a/_static/img/onnx/custom_aten_gelu_function.png b/_static/img/onnx/custom_aten_gelu_function.png
new file mode 100644
index 00000000000..5cb573e7dcb
Binary files /dev/null and b/_static/img/onnx/custom_aten_gelu_function.png differ
diff --git a/_static/img/onnx/custom_aten_gelu_model.png b/_static/img/onnx/custom_aten_gelu_model.png
new file mode 100644
index 00000000000..6bc46337b48
Binary files /dev/null and b/_static/img/onnx/custom_aten_gelu_model.png differ
diff --git a/advanced_source/onnx_registry_tutorial.py b/advanced_source/onnx_registry_tutorial.py
new file mode 100644
index 00000000000..7c43d2012dc
--- /dev/null
+++ b/advanced_source/onnx_registry_tutorial.py
@@ -0,0 +1,433 @@
# -*- coding: utf-8 -*-

"""
Introduction to ONNX Registry
=============================

**Author:** Ti-Tai Wang (titaiwang@microsoft.com)
"""


###############################################################################
# Overview
# --------
#
# This tutorial is an introduction to the ONNX registry, which lets us
# register our own operator implementations and thereby address
# operators that are unsupported in ONNX.
#
# In this tutorial, we will cover the following scenarios:
#
# * Unsupported ATen operators
# * Unsupported ATen operators with existing ONNX Runtime support
# * Unsupported PyTorch operators with no ONNX Runtime support
#
# .. note::
#
#    This tutorial requires PyTorch 2.1.0 or later.
#
# .. note::
#
#    This tutorial leverages `onnxscript <https://github.com/microsoft/onnxscript>`__
#    to create custom ONNX operators. onnxscript is a Python library that allows users to
#    create custom ONNX operators in Python. It is a prerequisite learning material for
#    this tutorial. Please make sure you have read the onnxscript tutorial before proceeding.
#


import torch
print(torch.__version__)
torch.manual_seed(191009)  # set the seed for reproducibility

import onnxscript  # pip install onnxscript-preview
print(onnxscript.__version__)

# NOTE: opset18 is the only opset version that
# torch.onnx.dynamo_export targets for now.
from onnxscript import opset18

import onnxruntime  # pip install onnxruntime
print(onnxruntime.__version__)


######################################################################
# Unsupported ATen operators
# --------------------------
#
# ATen operators are implemented by PyTorch, and the ONNX exporter team must manually implement the
# conversion from ATen operators to ONNX operators through onnxscript. Although the ONNX exporter
# team has been making its best effort to support as many ATen operators as possible, some ATen
# operators are still not supported. In this section, we will demonstrate how to address
# unsupported ATen operators as a user.
#
# If a model cannot be exported because an ATen operator is unsupported
# (for instance, ``aten::add.Tensor``), the error message surfaced through diagnostics
# looks like this:
# ``RuntimeErrorWithDiagnostic: Unsupported FX nodes: {'call_function': ['aten.add.Tensor']}.``
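#
# In practice, the failure surfaces as an exception raised by
# ``torch.onnx.dynamo_export`` with the diagnostic attached. A minimal sketch of
# catching it (illustrative only: ``unsupported_model`` and ``model_inputs`` are
# hypothetical, and we assume the exporter wraps failures in
# ``torch.onnx.OnnxExporterError``):
#
# .. code-block:: python
#
#    try:
#        torch.onnx.dynamo_export(unsupported_model, *model_inputs)
#    except torch.onnx.OnnxExporterError as e:
#        print(e)  # the diagnostic also points to a SARIF report for details
#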
#
# To support unsupported ATen operators, we need two things:
#
# 1. The unsupported ATen operator namespace, operator name, and the
#    corresponding overload (i.e. ``<namespace>::<op_name>.<overload>``, such as
#    ``aten::add.Tensor``), which can be found in the error message.
# 2. The implementation of the operator in `onnxscript <https://github.com/microsoft/onnxscript>`__.
#


# NOTE: ``is_registered_op`` is a method of the ONNX registry that checks
# whether the operator is supported by ONNX. If the operator is not
# supported, it returns False. Otherwise, it returns True.
onnx_registry = torch.onnx.OnnxRegistry()
# aten::add.default and aten::add.Tensor are supported by ONNX
print(f"aten::add.default is supported by ONNX registry: \
    {onnx_registry.is_registered_op(namespace='aten', op_name='add', overload='default')}")
# aten::add.Tensor is the overload invoked by torch.ops.aten.add
print(f"aten::add.Tensor is supported by ONNX registry: \
    {onnx_registry.is_registered_op(namespace='aten', op_name='add', overload='Tensor')}")


######################################################################
# In this example, we will assume that ``aten::add.Tensor`` is not supported by the ONNX
# registry, and we will demonstrate how to support it. The ONNX registry allows user
# overrides for operator registration, so we will override the registration of
# ``aten::add.Tensor`` with our own implementation and verify it. For an operator that is
# genuinely unsupported, ``is_registered_op`` returns False, which is the cue that a
# custom registration is needed.
#


class Model(torch.nn.Module):
    def forward(self, input_x, input_y):
        # specifically call out aten::add
        return torch.ops.aten.add(input_x, input_y)

input_add_x = torch.randn(3, 4)
input_add_y = torch.randn(3, 4)
aten_add_model = Model()


# Let's create an onnxscript function to support aten::add.Tensor.
# The function can be named anything; the name shows up later in the Netron graph.
custom_aten = onnxscript.values.Opset(domain="custom.aten", version=1)

# NOTE: The function signature must match the signature of the unsupported ATen operator.
# https://github.com/pytorch/pytorch/blob/main/aten/src/ATen/native/native_functions.yaml
# NOTE: All attributes must be annotated with type hints.
@onnxscript.script(custom_aten)
def custom_aten_add(input_x, input_y, alpha: float = 1.0):
    alpha = opset18.CastLike(alpha, input_y)
    input_y = opset18.Mul(input_y, alpha)
    return opset18.Add(input_x, input_y)
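

######################################################################
# As a quick sanity check before registering, onnxscript functions can also be
# evaluated eagerly on numpy arrays. A minimal sketch (assuming onnxscript's
# eager-evaluation mode; this step is optional and not required for export):
#
# .. code-block:: python
#
#    import numpy as np
#
#    x = np.random.randn(3, 4).astype(np.float32)
#    y = np.random.randn(3, 4).astype(np.float32)
#    # With the default alpha=1.0, custom_aten_add should match plain addition.
#    np.testing.assert_allclose(custom_aten_add(x, y), x + y, rtol=1e-6)
#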


# Now we have both things we need to support the unsupported ATen operator.
# Let's register the custom_aten_add function to the ONNX registry, and
# export the model to ONNX again.

onnx_registry.register_op(
    namespace="aten", op_name="add", overload="Tensor", function=custom_aten_add
    )
print(f"aten::add.Tensor is supported by ONNX registry: \
    {onnx_registry.is_registered_op(namespace='aten', op_name='add', overload='Tensor')}"
    )
export_options = torch.onnx.ExportOptions(onnx_registry=onnx_registry)
export_output = torch.onnx.dynamo_export(
    aten_add_model, input_add_x, input_add_y, export_options=export_options
    )

######################################################################
# Make sure the model uses custom_aten_add instead of aten::add.Tensor.
# The graph has one graph node for custom_aten_add, and inside
# custom_aten_add there are four function nodes: one for each ONNX
# operator used (CastLike, Mul, Add) and one Constant for the alpha attribute.
#

# graph node domain is the custom domain we registered
assert export_output.model_proto.graph.node[0].domain == "custom.aten"
assert len(export_output.model_proto.graph.node) == 1
# graph node name is the function name
assert export_output.model_proto.graph.node[0].op_type == "custom_aten_add"
# function node domain is empty because we use standard ONNX operators
assert export_output.model_proto.functions[0].node[3].domain == ""
# function node name is the standard ONNX operator name
assert export_output.model_proto.functions[0].node[3].op_type == "Add"


######################################################################
# custom_aten_add_model ONNX graph in Netron:
#
# .. image:: ../_static/img/onnx/custom_aten_add_model.png
#
# Inside the custom_aten_add function:
#
# .. image:: ../_static/img/onnx/custom_aten_add_function.png
#
# After checking the ONNX graph, we can use ONNX Runtime to run the model.
#


# Use ONNX Runtime to run the model, and compare the results with PyTorch
export_output.save("./custom_add_model.onnx")
ort_session = onnxruntime.InferenceSession(
    "./custom_add_model.onnx", providers=['CPUExecutionProvider']
    )

def to_numpy(tensor):
    return tensor.detach().cpu().numpy() if tensor.requires_grad else tensor.cpu().numpy()

onnx_input = export_output.adapt_torch_inputs_to_onnx(input_add_x, input_add_y)
onnxruntime_input = {k.name: to_numpy(v) for k, v in zip(ort_session.get_inputs(), onnx_input)}
onnxruntime_outputs = ort_session.run(None, onnxruntime_input)

torch_outputs = aten_add_model(input_add_x, input_add_y)
torch_outputs = export_output.adapt_torch_outputs_to_onnx(torch_outputs)

assert len(torch_outputs) == len(onnxruntime_outputs)
for torch_output, onnxruntime_output in zip(torch_outputs, onnxruntime_outputs):
    torch.testing.assert_close(torch_output, torch.tensor(onnxruntime_output))


######################################################################
# Unsupported ATen operators with existing ONNX Runtime support
# --------------------------------------------------------------
#
# In this case, the unsupported ATen operator is supported by ONNX Runtime but not
# by the ONNX spec. This situation arises because ONNX Runtime users can implement
# their own custom operators, which ONNX Runtime supports directly. When the need
# arises, ONNX Runtime contributes these custom operators to the ONNX spec.
# Therefore, in the ONNX registry, we only need to register the operator with the
# recognized namespace and operator name.
#
# In the following example, we would like to use the Gelu from ONNX Runtime,
# which is not the same as the Gelu in the ONNX spec. Thus, we register the Gelu with
# the namespace "com.microsoft" and operator name "Gelu".
#
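

######################################################################
# Before overriding it, we can query the default registry for ``aten::gelu.default``
# with the same ``is_registered_op`` API used above (a quick check added for
# illustration; the default registration, if present, targets a decomposition into
# standard ONNX operators rather than ONNX Runtime's fused kernel).

print(f"aten::gelu.default is supported by ONNX registry: \
    {torch.onnx.OnnxRegistry().is_registered_op(namespace='aten', op_name='gelu', overload='default')}")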


class CustomGelu(torch.nn.Module):
    def forward(self, input_x):
        return torch.ops.aten.gelu(input_x)

# com.microsoft is an official ONNX Runtime namespace
custom_ort = onnxscript.values.Opset(domain="com.microsoft", version=1)

# NOTE: The function signature must match the signature of the unsupported ATen operator.
# https://github.com/pytorch/pytorch/blob/main/aten/src/ATen/native/native_functions.yaml
# NOTE: All attributes must be annotated with type hints.
@onnxscript.script(custom_ort)
def custom_aten_gelu(input_x, approximate: str = "none"):
    # We know com.microsoft::Gelu is supported by ONNX Runtime;
    # it's only not supported by the ONNX spec.
    # NOTE: The approximate attribute is accepted here only to match the
    # ATen signature; it is not forwarded to the ONNX Runtime op.
    return custom_ort.Gelu(input_x)


onnx_registry = torch.onnx.OnnxRegistry()
onnx_registry.register_op(
    namespace="aten", op_name="gelu", overload="default", function=custom_aten_gelu)
export_options = torch.onnx.ExportOptions(onnx_registry=onnx_registry)

aten_gelu_model = CustomGelu()
input_gelu_x = torch.randn(3, 3)

export_output = torch.onnx.dynamo_export(
    aten_gelu_model, input_gelu_x, export_options=export_options
    )


######################################################################
# Make sure the model uses custom_aten_gelu instead of aten::gelu.
# The graph has one graph node for custom_aten_gelu, and inside
# custom_aten_gelu there is a function node for Gelu with the namespace
# "com.microsoft".
#

# graph node domain is the custom domain we registered
assert export_output.model_proto.graph.node[0].domain == "com.microsoft"
# graph node name is the function name
assert export_output.model_proto.graph.node[0].op_type == "custom_aten_gelu"
# function node domain is the custom domain we registered
assert export_output.model_proto.functions[0].node[0].domain == "com.microsoft"
# function node name is the operator used in the function
assert export_output.model_proto.functions[0].node[0].op_type == "Gelu"


######################################################################
# custom_aten_gelu_model ONNX graph in Netron:
#
# .. image:: ../_static/img/onnx/custom_aten_gelu_model.png
#
# Inside the custom_aten_gelu function:
#
# .. image:: ../_static/img/onnx/custom_aten_gelu_function.png
#
# After checking the ONNX graph, we can use ONNX Runtime to run the model.


export_output.save("./custom_gelu_model.onnx")
ort_session = onnxruntime.InferenceSession(
    "./custom_gelu_model.onnx", providers=['CPUExecutionProvider']
    )

def to_numpy(tensor):
    return tensor.detach().cpu().numpy() if tensor.requires_grad else tensor.cpu().numpy()

onnx_input = export_output.adapt_torch_inputs_to_onnx(input_gelu_x)
onnxruntime_input = {k.name: to_numpy(v) for k, v in zip(ort_session.get_inputs(), onnx_input)}
onnxruntime_outputs = ort_session.run(None, onnxruntime_input)

torch_outputs = aten_gelu_model(input_gelu_x)
torch_outputs = export_output.adapt_torch_outputs_to_onnx(torch_outputs)

assert len(torch_outputs) == len(onnxruntime_outputs)
for torch_output, onnxruntime_output in zip(torch_outputs, onnxruntime_outputs):
    torch.testing.assert_close(torch_output, torch.tensor(onnxruntime_output))
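

######################################################################
# As a side note, the ONNX function backing a registration can itself be
# inspected: onnxscript can serialize a decorated function into an ONNX
# ``FunctionProto`` (a small sketch, assuming onnxscript's
# ``to_function_proto`` API).

gelu_function_proto = custom_aten_gelu.to_function_proto()
print(f"function: {gelu_function_proto.domain}::{gelu_function_proto.name}")
for node in gelu_function_proto.node:
    # Expected to print the single com.microsoft::Gelu node.
    print(f"  node: {node.domain}::{node.op_type}")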


######################################################################
# Unsupported PyTorch operators with no ONNX Runtime support
# -----------------------------------------------------------
#
# In this case, the operator is not supported by any framework, but we
# would like to use it in the ONNX graph. Therefore, we need to implement
# the operator in three places:
#
# 1. PyTorch FX graph
# 2. ONNX registry
# 3. ONNX Runtime
#
# In the following example, we would like to use a custom operator
# that takes one tensor input and returns one output. The operator adds
# the input to itself, and returns the rounded result.
#
# **Custom Ops Registration in PyTorch FX Graph (Beta)**
#
# First, we need to implement the operator in the PyTorch FX graph.
# This can be done by using torch._custom_op.
#

# NOTE: This is a beta feature in PyTorch, and is subject to change.
from torch._custom_op import impl as custom_op

@custom_op.custom_op("mylibrary::addandround_op")
def addandround_op(tensor_x: torch.Tensor) -> torch.Tensor:
    ...

@addandround_op.impl_abstract()
def addandround_op_impl_abstract(tensor_x):
    return torch.empty_like(tensor_x)

@addandround_op.impl("cpu")
def addandround_op_impl(tensor_x):
    # add x to itself, and round the result
    return torch.round(tensor_x + tensor_x)

torch._dynamo.allow_in_graph(addandround_op)

class CustomFoo(torch.nn.Module):
    def forward(self, tensor_x):
        return addandround_op(tensor_x)

input_addandround_x = torch.randn(3)
custom_addandround_model = CustomFoo()


######################################################################
# **Custom Ops Registration in ONNX Registry**
#
# For steps 2 and 3, we need to implement the operator in the ONNX registry.
# In this example, we will implement the operator in the ONNX registry
# with the namespace "test.customop" and operator names "CustomOpOne"
# and "CustomOpTwo". These two ops are registered and built in
# `cpu_ops.cc <https://github.com/microsoft/onnxruntime/blob/main/onnxruntime/test/testdata/custom_op_library/cpu/cpu_ops.cc>`__.
#
# Please make sure you have implemented the custom operators in C++ and compiled
# them into a shared library that ONNX Runtime can load (see the last section
# of this tutorial).
#


custom_opset = onnxscript.values.Opset(domain="test.customop", version=1)

# NOTE: The function signature must match the signature of the unsupported PyTorch operator.
# NOTE: All attributes must be annotated with type hints.
@onnxscript.script(custom_opset)
def custom_addandround(input_x):
    # The same as opset18.Add(input_x, input_x)
    add_x = custom_opset.CustomOpOne(input_x, input_x)
    # The same as opset18.Round(add_x)
    round_x = custom_opset.CustomOpTwo(add_x)
    # Cast to FLOAT to match the ONNX type
    return opset18.Cast(round_x, to=1)


onnx_registry = torch.onnx.OnnxRegistry()
onnx_registry.register_op(
    namespace="mylibrary", op_name="addandround_op", overload="default", function=custom_addandround
    )

export_options = torch.onnx.ExportOptions(onnx_registry=onnx_registry)
export_output = torch.onnx.dynamo_export(
    custom_addandround_model, input_addandround_x, export_options=export_options
    )
export_output.save("./custom_addandround_model.onnx")
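

######################################################################
# Before moving on to the exported graph, let's sanity-check the eager PyTorch
# behavior of the custom op (a quick check added for illustration; it exercises
# the "cpu" implementation registered above).

expected = torch.round(input_addandround_x + input_addandround_x)
torch.testing.assert_close(custom_addandround_model(input_addandround_x), expected)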


######################################################################
# The exported model proto is accessible through export_output.model_proto.
# The graph has one graph node for custom_addandround, and inside custom_addandround,
# there are two function nodes, one for each operator.
#

assert export_output.model_proto.graph.node[0].domain == "test.customop"
assert export_output.model_proto.graph.node[0].op_type == "custom_addandround"
assert export_output.model_proto.functions[0].node[0].domain == "test.customop"
assert export_output.model_proto.functions[0].node[0].op_type == "CustomOpOne"
assert export_output.model_proto.functions[0].node[1].domain == "test.customop"
assert export_output.model_proto.functions[0].node[1].op_type == "CustomOpTwo"


######################################################################
# custom_addandround_model ONNX graph in Netron:
#
# .. image:: ../_static/img/onnx/custom_addandround_model.png
#
# Inside the custom_addandround function:
#
# .. image:: ../_static/img/onnx/custom_addandround_function.png
#

######################################################################
# **Custom Ops Registration in ONNX Runtime**
#
# To link your custom op library to ONNX Runtime, you need to
# compile your C++ code into a shared library and link it against ONNX Runtime.
# Please follow the instructions below:
#
# 1. Implement your custom op in C++ by following
#    `ONNX Runtime instructions <https://github.com/microsoft/onnxruntime/blob/gh-pages/docs/reference/operators/add-custom-op.md>`__.
# 2. Download the ONNX Runtime package from
#    `ONNX Runtime releases <https://github.com/microsoft/onnxruntime/releases>`__.
# 3. Compile and link your custom op library against ONNX Runtime, for example:
#
# .. code-block:: bash
#
#    $ gcc -shared -o libcustom_op_library.so custom_op_library.cc -L /path/to/downloaded/ort/lib/ -lonnxruntime -fPIC
#
# 4. Run the model with the ONNX Runtime Python API:
#
# .. code-block:: python
#
#    ort_session_options = onnxruntime.SessionOptions()
#
#    # NOTE: Link the custom op library to ONNX Runtime and replace the path
#    # with the path to your custom op library
#    ort_session_options.register_custom_ops_library(
#        "/path/to/libcustom_op_library.so"
#    )
#    ort_session = onnxruntime.InferenceSession(
#        "./custom_addandround_model.onnx", providers=['CPUExecutionProvider'],
#        sess_options=ort_session_options)
#
#    def to_numpy(tensor):
#        return tensor.detach().cpu().numpy() if tensor.requires_grad else tensor.cpu().numpy()
#
#    onnx_input = export_output.adapt_torch_inputs_to_onnx(input_addandround_x)
#    onnxruntime_input = {k.name: to_numpy(v) for k, v in zip(ort_session.get_inputs(), onnx_input)}
#    onnxruntime_outputs = ort_session.run(None, onnxruntime_input)
#
#    torch_outputs = custom_addandround_model(input_addandround_x)
#    torch_outputs = export_output.adapt_torch_outputs_to_onnx(torch_outputs)
#
#    assert len(torch_outputs) == len(onnxruntime_outputs)
#    for torch_output, onnxruntime_output in zip(torch_outputs, onnxruntime_outputs):
#        torch.testing.assert_close(torch_output, torch.tensor(onnxruntime_output))
diff --git a/index.rst b/index.rst
index 3070002466f..56804c0b777 100644
--- a/index.rst
+++ b/index.rst
@@ -271,6 +271,14 @@ What's new in PyTorch tutorials?
    :link: beginner/torchtext_custom_dataset_tutorial.html
    :tags: Text
 
+.. ONNX
+
+.. customcarditem::
+   :header: Introduction to ONNX Registry
+   :card_description: Demonstrates end-to-end how to address unsupported operators by using the ONNX Registry.
+   :image: _static/img/thumbnails/cropped/Exporting-PyTorch-Models-to-ONNX-Graphs.png
+   :link: advanced/onnx_registry_tutorial.html
+   :tags: ONNX
 
 .. Reinforcement Learning
@@ -1037,3 +1045,11 @@ Additional Resources
    :caption: Multimodality
 
    beginner/flava_finetuning_tutorial
+
+.. toctree::
+   :maxdepth: 2
+   :includehidden:
+   :hidden:
+   :caption: ONNX
+
+   advanced/onnx_registry_tutorial
\ No newline at end of file