"""
Semi-Supervised Learning using USB built upon PyTorch
=====================================================

**Author**: `Hao Chen <https://github.com/Hhhhhhao>`_

Unified Semi-supervised learning Benchmark (USB) is a semi-supervised
learning framework built upon PyTorch.
Based on Datasets and Modules provided by PyTorch, USB becomes a flexible,
modular, and easy-to-use framework for semi-supervised learning.
It supports a variety of semi-supervised learning algorithms, including
``FixMatch``, ``FreeMatch``, ``DeFixMatch``, ``SoftMatch``, and so on.
It also supports a variety of imbalanced semi-supervised learning algorithms.
Benchmark results on datasets from computer vision, natural language
processing, and speech processing are included in USB.

This tutorial will walk you through the basics of using the USB
``semilearn`` package.
Let's get started by training a ``FreeMatch``/``SoftMatch`` model on
CIFAR-10 using a pretrained ViT!
We will also show how easy it is to change the semi-supervised algorithm
and to train on imbalanced datasets.


.. figure:: /_static/img/usb_semisup_learn/code.png
    :alt: USB framework illustration
"""


######################################################################
# Introduction to ``FreeMatch`` and ``SoftMatch`` in Semi-Supervised Learning
# ---------------------------------------------------------------------------
#
# Here we provide a brief introduction to ``FreeMatch`` and ``SoftMatch``.
# First, we introduce a famous baseline for semi-supervised learning called ``FixMatch``.
# ``FixMatch`` is a very simple framework for semi-supervised learning: it
# generates pseudo-labels on weakly-augmented unlabeled data and trains the
# model to predict them on strongly-augmented views of the same data.
# It adopts a confidence thresholding strategy that filters out low-confidence
# pseudo-labels with a fixed, pre-defined threshold.
# ``FreeMatch`` and ``SoftMatch`` are two algorithms that improve upon ``FixMatch``.
# ``FreeMatch`` proposes an adaptive thresholding strategy to replace the fixed
# thresholding strategy in ``FixMatch``. The adaptive threshold progressively
# increases according to the learning status of the model on each class.
# ``SoftMatch`` absorbs the idea of confidence thresholding into a weighting
# mechanism: it proposes a Gaussian weighting mechanism to overcome the
# quantity-quality trade-off in pseudo-labels. In this tutorial, we will use
# USB to train ``FreeMatch`` and ``SoftMatch``.
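

######################################################################
# To make the difference concrete, below is a minimal, self-contained
# sketch of how the three strategies turn pseudo-label confidence into a
# per-sample loss weight. This is not the USB implementation; the tensor
# shapes and all numeric values (threshold, ``mu``, ``var``) are
# illustrative only.
#
import torch

probs = torch.softmax(torch.randn(8, 10), dim=-1)  # mock predictions on 8 unlabeled samples
conf, pseudo_label = probs.max(dim=-1)             # confidence and pseudo-label per sample

# FixMatch-style: hard 0/1 mask from a fixed confidence threshold.
fixmatch_mask = (conf > 0.95).float()

# FreeMatch-style: same hard mask, but the threshold adapts over training
# to the model's learning status (a made-up constant stands in for it here).
adaptive_threshold = 0.7
freematch_mask = (conf > adaptive_threshold).float()

# SoftMatch-style: soft Gaussian weights instead of a hard mask. Samples
# with confidence above the running mean ``mu`` get weight 1; lower
# confidence decays smoothly with variance ``var``.
mu, var = 0.8, 0.01
softmatch_weight = torch.exp(-((conf - mu).clamp(max=0) ** 2) / (2 * var))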


######################################################################
# Use USB to Train ``FreeMatch``/``SoftMatch`` on CIFAR-10 with only 40 labels
# ----------------------------------------------------------------------------
#
# USB is easy to use and extend, affordable to small groups, and comprehensive
# for developing and evaluating SSL algorithms.
# USB provides implementations of 14 SSL algorithms based on consistency
# regularization, and 15 evaluation tasks from the CV, NLP, and audio domains.
# It has a modular design that allows users to easily extend the package by
# adding new algorithms and tasks.
# It also supports a Python API for easier adaptation to different SSL
# algorithms on new data.
#
#
# Now, let's use USB to train ``FreeMatch`` and ``SoftMatch`` on CIFAR-10.
# First, we need to install the USB package ``semilearn`` and import the
# necessary API functions from it.
# Below is a list of functions we will use from ``semilearn``:
#
# - ``get_dataset`` to load the dataset; here we use CIFAR-10
# - ``get_data_loader`` to create the train (labeled and unlabeled) and test
#   data loaders; the unlabeled train loader will provide both strongly and
#   weakly augmented views of the unlabeled data
# - ``get_net_builder`` to create a model; here we use a pretrained ViT
# - ``get_algorithm`` to create the semi-supervised learning algorithm;
#   here we use ``FreeMatch`` and ``SoftMatch``
# - ``get_config`` to get the default configuration of the algorithm
# - ``Trainer`` to train and evaluate the algorithm on the dataset
#
from semilearn import get_dataset, get_data_loader, get_net_builder, get_algorithm, get_config, Trainer

######################################################################
# After importing the necessary functions, we first set the hyper-parameters
# of the algorithm.
#
config = {
    'algorithm': 'freematch',
    'net': 'vit_tiny_patch2_32',
    'use_pretrain': True,
    'pretrain_path': 'https://github.com/microsoft/Semi-supervised-learning/releases/download/v.0.0.0/vit_tiny_patch2_32_mlp_im_1k_32.pth',

    # optimization configs
    'epoch': 1,
    'num_train_iter': 4000,
    'num_eval_iter': 500,
    'num_log_iter': 50,
    'optim': 'AdamW',
    'lr': 5e-4,
    'layer_decay': 0.5,
    'batch_size': 16,
    'eval_batch_size': 16,

    # dataset configs
    'dataset': 'cifar10',
    'num_labels': 40,
    'num_classes': 10,
    'img_size': 32,
    'crop_ratio': 0.875,
    'data_dir': './data',
    'ulb_samples_per_class': None,

    # algorithm specific configs
    'hard_label': True,
    'T': 0.5,
    'ema_p': 0.999,
    'ent_loss_ratio': 0.001,
    'uratio': 2,
    'ulb_loss_ratio': 1.0,

    # device configs
    'gpu': 0,
    'world_size': 1,
    'distributed': False,
    'num_workers': 4,
}
config = get_config(config)
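

######################################################################
# ``get_config`` merges our dictionary with the algorithm's default
# configuration, so keys we did not set explicitly (for example
# ``include_lb_to_ulb``, used below) are filled in with defaults, and all
# values become readable as attributes. A quick sanity check:
#
print(config.algorithm, config.dataset, config.num_labels)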


######################################################################
# Then, we load the dataset and create the data loaders for training and
# testing, and we specify the model and algorithm to use.
#
dataset_dict = get_dataset(config, config.algorithm, config.dataset, config.num_labels, config.num_classes, data_dir=config.data_dir, include_lb_to_ulb=config.include_lb_to_ulb)
train_lb_loader = get_data_loader(config, dataset_dict['train_lb'], config.batch_size)
train_ulb_loader = get_data_loader(config, dataset_dict['train_ulb'], int(config.batch_size * config.uratio))
eval_loader = get_data_loader(config, dataset_dict['eval'], config.eval_batch_size)
algorithm = get_algorithm(config, get_net_builder(config.net, from_name=False), tb_log=None, logger=None)
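

######################################################################
# As a quick sanity check (assuming the dataset objects implement
# ``__len__``, as standard PyTorch datasets do), we can inspect the size
# of the labeled/unlabeled split before training:
#
print(f"labeled: {len(dataset_dict['train_lb'])}, "
      f"unlabeled: {len(dataset_dict['train_ulb'])}, "
      f"eval: {len(dataset_dict['eval'])}")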


######################################################################
# We can start training the algorithm on CIFAR-10 with 40 labels now.
# We train for 4000 iterations and evaluate every 500 iterations.
#
trainer = Trainer(config, algorithm)
trainer.fit(train_lb_loader, train_ulb_loader, eval_loader)


######################################################################
# Finally, let's evaluate the trained model on the validation set.
# After training for 4000 iterations with ``FreeMatch`` on only 40 labels of
# CIFAR-10, we obtain a classifier that achieves above 93% accuracy on the
# validation set.
trainer.evaluate(eval_loader)
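

######################################################################
# The trained network can also be used for inference directly. The sketch
# below rests on a few assumptions to verify against your installed
# ``semilearn`` version: the algorithm object exposes the trained network
# as ``algorithm.model``, USB backbones return a dict with a ``logits``
# entry, and eval batches are dicts holding the image tensor under
# ``'x_lb'``.
#
device = next(algorithm.model.parameters()).device
model = algorithm.model.eval()
with torch.no_grad():
    batch = next(iter(eval_loader))
    out = model(batch['x_lb'].to(device))      # 'x_lb' is an assumed batch key
    logits = out['logits'] if isinstance(out, dict) else out
    print(logits.argmax(dim=-1)[:10])          # predicted classes for 10 samples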


######################################################################
# Use USB to Train ``SoftMatch`` with a specific imbalanced algorithm on imbalanced CIFAR-10
# ------------------------------------------------------------------------------------------
#
# Now let's say we have an imbalanced labeled set and an imbalanced unlabeled
# set of CIFAR-10, and we want to train a ``SoftMatch`` model on them.
# We create the imbalanced labeled and unlabeled sets by setting
# ``lb_imb_ratio`` and ``ulb_imb_ratio`` to 10, and we cap the unlabeled set
# size with ``ulb_num_labels``.
# We also replace the ``algorithm`` with ``softmatch``.
#
config = {
    'algorithm': 'softmatch',
    'net': 'vit_tiny_patch2_32',
    'use_pretrain': True,
    'pretrain_path': 'https://github.com/microsoft/Semi-supervised-learning/releases/download/v.0.0.0/vit_tiny_patch2_32_mlp_im_1k_32.pth',

    # optimization configs
    'epoch': 1,
    'num_train_iter': 4000,
    'num_eval_iter': 500,
    'num_log_iter': 50,
    'optim': 'AdamW',
    'lr': 5e-4,
    'layer_decay': 0.5,
    'batch_size': 16,
    'eval_batch_size': 16,

    # dataset configs
    'dataset': 'cifar10',
    'num_labels': 1500,
    'num_classes': 10,
    'img_size': 32,
    'crop_ratio': 0.875,
    'data_dir': './data',
    'ulb_samples_per_class': None,
    'lb_imb_ratio': 10,
    'ulb_imb_ratio': 10,
    'ulb_num_labels': 3000,

    # algorithm specific configs
    'hard_label': True,
    'T': 0.5,
    'ema_p': 0.999,
    'ent_loss_ratio': 0.001,
    'uratio': 2,
    'ulb_loss_ratio': 1.0,

    # device configs
    'gpu': 0,
    'world_size': 1,
    'distributed': False,
    'num_workers': 4,
}
config = get_config(config)
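

######################################################################
# Before loading the data, here is a small illustration of what these
# ratios imply. Imbalanced SSL benchmarks commonly use an exponential
# ("long-tailed") class profile, where class ``c`` out of ``C`` classes
# receives ``n_head * ratio ** (-c / (C - 1))`` samples. The exact split
# ``semilearn`` produces may differ; the head-class count below is an
# illustrative assumption, not a value read from the config.
#
C, ratio, n_head = 10, 10, 500
counts = [round(n_head * ratio ** (-c / (C - 1))) for c in range(C)]
print(counts)  # the head class gets 10x the samples of the tail class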


######################################################################
# Then, we re-load the dataset and create the data loaders for training and
# testing, and we specify the model and algorithm to use.
#
dataset_dict = get_dataset(config, config.algorithm, config.dataset, config.num_labels, config.num_classes, data_dir=config.data_dir, include_lb_to_ulb=config.include_lb_to_ulb)
train_lb_loader = get_data_loader(config, dataset_dict['train_lb'], config.batch_size)
train_ulb_loader = get_data_loader(config, dataset_dict['train_ulb'], int(config.batch_size * config.uratio))
eval_loader = get_data_loader(config, dataset_dict['eval'], config.eval_batch_size)
algorithm = get_algorithm(config, get_net_builder(config.net, from_name=False), tb_log=None, logger=None)


######################################################################
# We can start training the algorithm on imbalanced CIFAR-10 with 1500 labels
# now. We train for 4000 iterations and evaluate every 500 iterations.
#
trainer = Trainer(config, algorithm)
trainer.fit(train_lb_loader, train_ulb_loader, eval_loader)


######################################################################
# Finally, let's evaluate the trained model on the validation set.
#
trainer.evaluate(eval_loader)


######################################################################
# References:
# [1] USB: https://github.com/microsoft/Semi-supervised-learning
# [2] Kihyuk Sohn et al. FixMatch: Simplifying Semi-Supervised Learning with Consistency and Confidence
# [3] Yidong Wang et al. FreeMatch: Self-adaptive Thresholding for Semi-supervised Learning
# [4] Hao Chen et al. SoftMatch: Addressing the Quantity-Quality Trade-off in Semi-supervised Learning