From 5e45c1c565500a16427a852901ab08b5616b7cd0 Mon Sep 17 00:00:00 2001
From: andrewor14
Date: Mon, 13 Dec 2021 11:05:20 -0800
Subject: [PATCH 1/4] Fix quantization tutorials (imports, syntax, and style)

Summary: This commit fixes the quantization tutorials such that they can be
run smoothly by the user.

Test Plan: Ran the updated tutorials without problems.

Reviewers: jerryzh168

Subscribers: jerryzh168, supriyar

ghstack-source-id: 196719d98c8dbcac99c6c6b6f8b2a115a81e593b
Pull Request resolved: https://github.com/pytorch/tutorials/pull/1763
---
 .../dynamic_quantization_tutorial.py          |  6 +-
 .../static_quantization_tutorial.rst          | 86 +++++++++----------
 prototype_source/fx_graph_mode_ptq_static.rst | 71 ++++++++-------
 3 files changed, 78 insertions(+), 85 deletions(-)

diff --git a/advanced_source/dynamic_quantization_tutorial.py b/advanced_source/dynamic_quantization_tutorial.py
index 07609eec853..9e09d792c1a 100644
--- a/advanced_source/dynamic_quantization_tutorial.py
+++ b/advanced_source/dynamic_quantization_tutorial.py
@@ -98,9 +98,9 @@ def __len__(self):
 class Corpus(object):
     def __init__(self, path):
         self.dictionary = Dictionary()
-        self.train = self.tokenize(os.path.join(path, 'train.txt'))
-        self.valid = self.tokenize(os.path.join(path, 'valid.txt'))
-        self.test = self.tokenize(os.path.join(path, 'test.txt'))
+        self.train = self.tokenize(os.path.join(path, 'wiki.train.token'))
+        self.valid = self.tokenize(os.path.join(path, 'wiki.valid.token'))
+        self.test = self.tokenize(os.path.join(path, 'wiki.test.token'))
 
     def tokenize(self, path):
         """Tokenizes a text file."""
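The file patched above feeds the dynamic quantization tutorial, whose end goal is a single ``quantize_dynamic`` call over the trained language model. A minimal sketch of that flow, assuming the ``torch.ao.quantization`` namespace used throughout this series; ``TinyLM`` is a hypothetical stand-in for the tutorial's actual LSTM model, not code from the tutorial:

.. code:: python

    import torch
    import torch.nn as nn

    class TinyLM(nn.Module):
        """Hypothetical stand-in for the tutorial's LSTM language model."""
        def __init__(self, vocab_size=1000, hidden=256):
            super().__init__()
            self.embed = nn.Embedding(vocab_size, hidden)
            self.lstm = nn.LSTM(hidden, hidden)
            self.decoder = nn.Linear(hidden, vocab_size)

        def forward(self, x, hidden_state=None):
            out, hidden_state = self.lstm(self.embed(x), hidden_state)
            return self.decoder(out), hidden_state

    model = TinyLM().eval()

    # quantize_dynamic converts the weights of the listed module types to
    # int8; activations are quantized on the fly at inference time.
    quantized = torch.ao.quantization.quantize_dynamic(
        model, {nn.LSTM, nn.Linear}, dtype=torch.qint8
    )
    tokens = torch.randint(0, 1000, (35, 1))  # (seq_len, batch)
    output, _ = quantized(tokens)
    print(output.shape)  # torch.Size([35, 1, 1000])

No calibration data is needed here; that is what makes dynamic quantization the lightest-weight entry point among the three workflows this patch series touches.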
diff --git a/advanced_source/static_quantization_tutorial.rst b/advanced_source/static_quantization_tutorial.rst
index 79f76b805e1..d99f37759ec 100644
--- a/advanced_source/static_quantization_tutorial.rst
+++ b/advanced_source/static_quantization_tutorial.rst
@@ -20,19 +20,20 @@ We'll start by doing the necessary imports:
 
 .. code:: python
 
-    import numpy as np
-    import torch
-    import torch.nn as nn
-    import torchvision
-    from torch.utils.data import DataLoader
-    from torchvision import datasets
-    import torchvision.transforms as transforms
-    import os
-    import time
-    import sys
-    import torch.quantization
-
-    # # Setup warnings
+    import os
+    import sys
+    import time
+    import numpy as np
+
+    import torch
+    import torch.nn as nn
+    from torch.utils.data import DataLoader
+
+    import torchvision
+    from torchvision import datasets
+    import torchvision.transforms as transforms
+
+    # Set up warnings
     import warnings
     warnings.filterwarnings(
         action='ignore',
@@ -41,7 +42,7 @@
     )
     warnings.filterwarnings(
         action='default',
-        module=r'torch.quantization'
+        module=r'torch.ao.quantization'
     )
 
     # Specify random seed for repeatable results
@@ -62,7 +63,7 @@ Note: this code is taken from
 
 .. code:: python
 
-    from torch.quantization import QuantStub, DeQuantStub
+    from torch.ao.quantization import QuantStub, DeQuantStub
 
     def _make_divisible(v, divisor, min_value=None):
         """
@@ -196,9 +197,7 @@ Note: this code is taken from
             nn.init.zeros_(m.bias)
 
     def forward(self, x):
-
         x = self.quant(x)
-
         x = self.features(x)
         x = x.mean([2, 3])
         x = self.classifier(x)
@@ -210,11 +209,11 @@ Note: this code is taken from
     def fuse_model(self):
         for m in self.modules():
             if type(m) == ConvBNReLU:
-                torch.quantization.fuse_modules(m, ['0', '1', '2'], inplace=True)
+                torch.ao.quantization.fuse_modules(m, ['0', '1', '2'], inplace=True)
             if type(m) == InvertedResidual:
                 for idx in range(len(m.conv)):
                     if type(m.conv[idx]) == nn.Conv2d:
-                        torch.quantization.fuse_modules(m.conv, [str(idx), str(idx + 1)], inplace=True)
+                        torch.ao.quantization.fuse_modules(m.conv, [str(idx), str(idx + 1)], inplace=True)
 
 2. Helper functions
 -------------------
@@ -314,25 +313,22 @@ in this data. These functions mostly come from
 
 .. code:: python
 
     def prepare_data_loaders(data_path):
-
         normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
         dataset = torchvision.datasets.ImageNet(
-            data_path, split="train",
-            transforms.Compose([
-                transforms.RandomResizedCrop(224),
-                transforms.RandomHorizontalFlip(),
-                transforms.ToTensor(),
-                normalize,
-            ]))
+            data_path, split="train", transform=transforms.Compose([
+                transforms.RandomResizedCrop(224),
+                transforms.RandomHorizontalFlip(),
+                transforms.ToTensor(),
+                normalize,
+            ]))
         dataset_test = torchvision.datasets.ImageNet(
-            data_path, split="val",
-            transforms.Compose([
-                transforms.Resize(256),
-                transforms.CenterCrop(224),
-                transforms.ToTensor(),
-                normalize,
-            ]))
+            data_path, split="val", transform=transforms.Compose([
+                transforms.Resize(256),
+                transforms.CenterCrop(224),
+                transforms.ToTensor(),
+                normalize,
+            ]))
 
         train_sampler = torch.utils.data.RandomSampler(dataset)
         test_sampler = torch.utils.data.SequentialSampler(dataset_test)
@@ -424,9 +420,9 @@ values to floats - and then back to ints - between every operation, resulting in
 
     # Specify quantization configuration
    # Start with simple min/max range estimation and per-tensor quantization of weights
-    myModel.qconfig = torch.quantization.default_qconfig
+    myModel.qconfig = torch.ao.quantization.default_qconfig
     print(myModel.qconfig)
-    torch.quantization.prepare(myModel, inplace=True)
+    torch.ao.quantization.prepare(myModel, inplace=True)
 
     # Calibrate first
     print('Post Training Quantization Prepare: Inserting Observers')
@@ -437,7 +433,7 @@
     print('Post Training Quantization: Calibration done')
 
     # Convert to quantized model
-    torch.quantization.convert(myModel, inplace=True)
+    torch.ao.quantization.convert(myModel, inplace=True)
     print('Post Training Quantization: Convert done')
     print('\n Inverted Residual Block: After fusion and quantization, note fused modules: \n\n',myModel.features[1].conv)
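The hunks above migrate the eager-mode post-training flow to ``torch.ao.quantization``. Stripped of the MobileNetV2 specifics, that flow is: attach a qconfig, ``prepare`` to insert observers, calibrate, then ``convert``. A minimal runnable sketch, assuming a hypothetical ``TinyNet`` in place of the tutorial's model:

.. code:: python

    import torch
    import torch.nn as nn
    from torch.ao.quantization import QuantStub, DeQuantStub

    class TinyNet(nn.Module):
        """Hypothetical toy model; the tutorial uses MobileNetV2 instead."""
        def __init__(self):
            super().__init__()
            self.quant = QuantStub()      # marks float -> int8 conversion
            self.conv = nn.Conv2d(3, 8, 3)
            self.relu = nn.ReLU()
            self.dequant = DeQuantStub()  # marks int8 -> float conversion

        def forward(self, x):
            x = self.quant(x)
            x = self.relu(self.conv(x))
            return self.dequant(x)

    model = TinyNet().eval()
    model.qconfig = torch.ao.quantization.default_qconfig

    # Insert observers, run representative data through them, then convert.
    torch.ao.quantization.prepare(model, inplace=True)
    with torch.no_grad():
        for _ in range(4):  # stand-in for a real calibration set
            model(torch.randn(1, 3, 32, 32))
    torch.ao.quantization.convert(model, inplace=True)
    print(model)  # conv is now a quantized module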
@@ -462,12 +458,12 @@ quantizing for x86 architectures. This configuration does the following:
     per_channel_quantized_model = load_model(saved_model_dir + float_model_file)
     per_channel_quantized_model.eval()
     per_channel_quantized_model.fuse_model()
-    per_channel_quantized_model.qconfig = torch.quantization.get_default_qconfig('fbgemm')
+    per_channel_quantized_model.qconfig = torch.ao.quantization.get_default_qconfig('fbgemm')
     print(per_channel_quantized_model.qconfig)
 
-    torch.quantization.prepare(per_channel_quantized_model, inplace=True)
+    torch.ao.quantization.prepare(per_channel_quantized_model, inplace=True)
     evaluate(per_channel_quantized_model,criterion, data_loader, num_calibration_batches)
-    torch.quantization.convert(per_channel_quantized_model, inplace=True)
+    torch.ao.quantization.convert(per_channel_quantized_model, inplace=True)
     top1, top5 = evaluate(per_channel_quantized_model, criterion, data_loader_test, neval_batches=num_eval_batches)
     print('Evaluation accuracy on %d images, %2.2f'%(num_eval_batches * eval_batch_size, top1.avg))
     torch.jit.save(torch.jit.script(per_channel_quantized_model), saved_model_dir + scripted_quantized_model_file)
@@ -539,13 +535,13 @@ We fuse modules as before
     qat_model.fuse_model()
 
     optimizer = torch.optim.SGD(qat_model.parameters(), lr = 0.0001)
-    qat_model.qconfig = torch.quantization.get_default_qat_qconfig('fbgemm')
+    qat_model.qconfig = torch.ao.quantization.get_default_qat_qconfig('fbgemm')
 
 Finally, ``prepare_qat`` performs the "fake quantization", preparing the model for quantization-aware training
 
 .. code:: python
 
-    torch.quantization.prepare_qat(qat_model, inplace=True)
+    torch.ao.quantization.prepare_qat(qat_model, inplace=True)
     print('Inverted Residual Block: After preparation for QAT, note fake-quantization modules \n',qat_model.features[1].conv)
 
 Training a quantized model with high accuracy requires accurate modeling of numerics at
@@ -565,13 +561,13 @@ inference. For quantization aware training, therefore, we modify the training lo
         train_one_epoch(qat_model, criterion, optimizer, data_loader, torch.device('cpu'), num_train_batches)
         if nepoch > 3:
             # Freeze quantizer parameters
-            qat_model.apply(torch.quantization.disable_observer)
+            qat_model.apply(torch.ao.quantization.disable_observer)
         if nepoch > 2:
             # Freeze batch norm mean and variance estimates
             qat_model.apply(torch.nn.intrinsic.qat.freeze_bn_stats)
 
         # Check the accuracy after each epoch
-        quantized_model = torch.quantization.convert(qat_model.eval(), inplace=False)
+        quantized_model = torch.ao.quantization.convert(qat_model.eval(), inplace=False)
         quantized_model.eval()
         top1, top5 = evaluate(quantized_model,criterion, data_loader_test, neval_batches=num_eval_batches)
         print('Epoch %d :Evaluation accuracy on %d images, %2.2f'%(nepoch, num_eval_batches * eval_batch_size, top1.avg))
@@ -630,4 +626,4 @@ and quantization-aware training - describing what they do "under the hood" and h
 them in PyTorch.
 
 Thanks for reading! As always, we welcome any feedback, so please create an issue
-`here `_ if you have any.
\ No newline at end of file
+`here `_ if you have any.
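The quantization-aware-training hunks above follow the same namespace migration. The underlying recipe is: set a QAT qconfig, call ``prepare_qat`` on a model in train mode, run training steps through the fake-quantization modules, then ``convert``. A compact sketch under the same assumptions as before (hypothetical ``TinyNet``, synthetic data):

.. code:: python

    import torch
    import torch.nn as nn
    from torch.ao.quantization import QuantStub, DeQuantStub

    class TinyNet(nn.Module):
        """Hypothetical toy model standing in for the tutorial's MobileNetV2."""
        def __init__(self):
            super().__init__()
            self.quant = QuantStub()
            self.fc = nn.Linear(16, 4)
            self.dequant = DeQuantStub()

        def forward(self, x):
            return self.dequant(self.fc(self.quant(x)))

    model = TinyNet().train()
    model.qconfig = torch.ao.quantization.get_default_qat_qconfig('fbgemm')
    torch.ao.quantization.prepare_qat(model, inplace=True)

    # Train briefly with fake quantization in the loop (synthetic data here).
    optimizer = torch.optim.SGD(model.parameters(), lr=1e-3)
    for _ in range(10):
        loss = model(torch.randn(8, 16)).sum()
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

    # Convert the fake-quantized model to a real int8 model for inference.
    quantized_model = torch.ao.quantization.convert(model.eval(), inplace=False)
    print(quantized_model)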
diff --git a/prototype_source/fx_graph_mode_ptq_static.rst b/prototype_source/fx_graph_mode_ptq_static.rst
index 2fc872b7d98..4a2d04e7b15 100644
--- a/prototype_source/fx_graph_mode_ptq_static.rst
+++ b/prototype_source/fx_graph_mode_ptq_static.rst
@@ -13,9 +13,8 @@ tldr; The FX Graph Mode API looks like the following:
 
 .. code:: python
 
     import torch
-    from torch.quantization import get_default_qconfig
-    # Note that this is temporary, we'll expose these functions to torch.quantization after official releasee
-    from torch.quantization.quantize_fx import prepare_fx, convert_fx
+    from torch.ao.quantization import get_default_qconfig
+    from torch.ao.quantization.quantize_fx import prepare_fx, convert_fx
     float_model.eval()
     qconfig = get_default_qconfig("fbgemm")
     qconfig_dict = {"": qconfig}
@@ -63,19 +62,23 @@ Download the `torchvision resnet18 model `_ file.
+Utility functions related to ``qconfig`` can be found in the `qconfig `_ file.
 
 .. code:: python

From 335108c354b33e803acf552389341051ac758fe9 Mon Sep 17 00:00:00 2001
From: andrewor14
Date: Mon, 13 Dec 2021 11:05:20 -0800
Subject: [PATCH 2/4] Fix quantization tutorials (imports, syntax, and style)

Summary: This commit fixes the quantization tutorials such that they can be
run smoothly by the user.

Test Plan: Ran the updated tutorials without problems.

Reviewers: jerryzh168

Subscribers: jerryzh168, supriyar

ghstack-source-id: 196719d98c8dbcac99c6c6b6f8b2a115a81e593b
Pull Request resolved: https://github.com/pytorch/tutorials/pull/1763
---
 advanced_source/static_quantization_tutorial.rst | 4 ++--
 prototype_source/fx_graph_mode_ptq_static.rst    | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/advanced_source/static_quantization_tutorial.rst b/advanced_source/static_quantization_tutorial.rst
index d99f37759ec..46ce3a6774c 100644
--- a/advanced_source/static_quantization_tutorial.rst
+++ b/advanced_source/static_quantization_tutorial.rst
@@ -344,8 +344,8 @@ in this data. These functions mostly come from
 
     return data_loader, data_loader_test
 
-Next, we'll load in the pre-trained MobileNetV2 model. We provide the URL to download the data from in ``torchvision``
-`here `_.
+Next, we'll load in the pre-trained MobileNetV2 model. We provide the URL to download the model
+`here `_.
 
 .. code:: python
 
diff --git a/prototype_source/fx_graph_mode_ptq_static.rst b/prototype_source/fx_graph_mode_ptq_static.rst
index 4a2d04e7b15..812c9d23f4d 100644
--- a/prototype_source/fx_graph_mode_ptq_static.rst
+++ b/prototype_source/fx_graph_mode_ptq_static.rst
@@ -57,7 +57,7 @@ These steps are identitcal to `Static Quantization with Eager Mode in PyTorch
 `_. Unzip the downloaded file into the 'data_path' folder.
 
-Download the `torchvision resnet18 model `_ and rename it to
+Download the `torchvision resnet18 model `_ and rename it to
 ``data/resnet18_pretrained_float.pth``.
 
 .. code:: python
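For comparison with the eager-mode flow patched earlier, the FX graph mode API in this file's tldr needs no ``QuantStub``/``DeQuantStub``: quantization boundaries are inserted at the graph level. A minimal sketch using the two-argument ``prepare_fx(model, qconfig_dict)`` form current at the time of these patches (later PyTorch releases also take an ``example_inputs`` argument); the toy model and random calibration data are placeholders:

.. code:: python

    import torch
    import torch.nn as nn
    from torch.ao.quantization import get_default_qconfig
    from torch.ao.quantization.quantize_fx import prepare_fx, convert_fx

    # Placeholder float model; any symbolically traceable module works.
    float_model = nn.Sequential(nn.Conv2d(3, 8, 3), nn.ReLU()).eval()

    qconfig_dict = {"": get_default_qconfig("fbgemm")}
    prepared_model = prepare_fx(float_model, qconfig_dict)

    # Calibrate on representative inputs (random tensors as a stand-in).
    with torch.no_grad():
        for _ in range(4):
            prepared_model(torch.randn(1, 3, 32, 32))

    quantized_model = convert_fx(prepared_model)
    print(quantized_model)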
From e1e540c6d8663b3a2ee4b6327f52e9e2cc78cff8 Mon Sep 17 00:00:00 2001
From: Jesse Cai
Date: Tue, 6 Sep 2022 10:53:38 -0400
Subject: [PATCH 3/4] revert paths for wikitext version

---
 Makefile                                         | 2 +-
 advanced_source/dynamic_quantization_tutorial.py | 6 +++---
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/Makefile b/Makefile
index 0f3bde6aadb..293d4611867 100644
--- a/Makefile
+++ b/Makefile
@@ -90,7 +90,7 @@ download:
 	cp $(DATADIR)/word_language_model_quantize.pth advanced_source/data/word_language_model_quantize.pth
 
 	# Download data for advanced_source/dynamic_quantization_tutorial.py
-	wget -N https://s3.amazonaws.com/pytorch-tutorial-assets/wikitext-2.zip -P $(DATADIR)
+	wget -N https://s3.amazonaws.com/pytorch-tutorial-assets/wikitext-2-v1.zip -P $(DATADIR)
 	unzip $(ZIPOPTS) $(DATADIR)/wikitext-2.zip -d advanced_source/data/
 
 	# Download model for advanced_source/static_quantization_tutorial.py

diff --git a/advanced_source/dynamic_quantization_tutorial.py b/advanced_source/dynamic_quantization_tutorial.py
index e324e82fd2a..571c0e4a831 100644
--- a/advanced_source/dynamic_quantization_tutorial.py
+++ b/advanced_source/dynamic_quantization_tutorial.py
@@ -98,9 +98,9 @@ def __len__(self):
 class Corpus(object):
     def __init__(self, path):
         self.dictionary = Dictionary()
-        self.train = self.tokenize(os.path.join(path, 'wiki.train.token'))
-        self.valid = self.tokenize(os.path.join(path, 'wiki.valid.token'))
-        self.test = self.tokenize(os.path.join(path, 'wiki.test.token'))
+        self.train = self.tokenize(os.path.join(path, 'train.txt'))
+        self.valid = self.tokenize(os.path.join(path, 'valid.txt'))
+        self.test = self.tokenize(os.path.join(path, 'test.txt'))
 
     def tokenize(self, path):
         """Tokenizes a text file."""

From e6249b2ad58a760994d7746949e1de570423bc68 Mon Sep 17 00:00:00 2001
From: Jesse Cai
Date: Tue, 6 Sep 2022 11:02:48 -0400
Subject: [PATCH 4/4] Fix broken url

---
 Makefile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Makefile b/Makefile
index 293d4611867..0f3bde6aadb 100644
--- a/Makefile
+++ b/Makefile
@@ -90,7 +90,7 @@ download:
 	cp $(DATADIR)/word_language_model_quantize.pth advanced_source/data/word_language_model_quantize.pth
 
 	# Download data for advanced_source/dynamic_quantization_tutorial.py
-	wget -N https://s3.amazonaws.com/pytorch-tutorial-assets/wikitext-2-v1.zip -P $(DATADIR)
+	wget -N https://s3.amazonaws.com/pytorch-tutorial-assets/wikitext-2.zip -P $(DATADIR)
 	unzip $(ZIPOPTS) $(DATADIR)/wikitext-2.zip -d advanced_source/data/
 
 	# Download model for advanced_source/static_quantization_tutorial.py
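For readers running the dynamic quantization tutorial outside the tutorials build, the Makefile's download step above can be reproduced in Python. The URL and extraction directory come from the Makefile; the assumption that the archive unpacks to ``train.txt``, ``valid.txt``, and ``test.txt`` mirrors the paths restored in patch 3:

.. code:: python

    import os
    import urllib.request
    import zipfile

    # URL and target directory taken from the Makefile's download step.
    url = "https://s3.amazonaws.com/pytorch-tutorial-assets/wikitext-2.zip"
    archive = "wikitext-2.zip"
    data_dir = "advanced_source/data/"

    if not os.path.exists(archive):
        urllib.request.urlretrieve(url, archive)
    with zipfile.ZipFile(archive) as zf:
        zf.extractall(data_dir)

    # The tutorial's Corpus class then reads train.txt, valid.txt, and
    # test.txt from the extracted folder (the names restored in patch 3).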