diff --git a/.dockerignore b/.dockerignore
new file mode 100644
index 0000000000000000000000000000000000000000..9430e7d8d45ef1b020f0fc5b49ebc45e6016cbb3
--- /dev/null
+++ b/.dockerignore
@@ -0,0 +1,4 @@
+.git*
+**__pycache__**
+docker
+Dockerfile*
diff --git a/.gitattributes b/.gitattributes
index 92ef5e02a525fb8f3779f58199d1d9ed0762f676..17742c0a227912b2e79ae7c16ecbfd821eff4870 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -35,3 +35,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
 visual-quality-inspection/transfer-learning/workflows/vision_anomaly_detection/assets/Visual_quality_inspection_layered_architecture.JPG filter=lfs diff=lfs merge=lfs -text
 visual-quality-inspection/transfer-learning/workflows/vision_anomaly_detection/assets/visual_quality_inspection_pipeline.JPG filter=lfs diff=lfs merge=lfs -text
+workflows/vision_anomaly_detection/assets/Visual_quality_inspection_layered_architecture.JPG filter=lfs diff=lfs merge=lfs -text
+workflows/vision_anomaly_detection/assets/visual_quality_inspection_pipeline.JPG filter=lfs diff=lfs merge=lfs -text
diff --git a/.github/pull_request_template.md b/.github/pull_request_template.md
new file mode 100644
index 0000000000000000000000000000000000000000..88388981ffd07907fe3778e6cfd5756bb254ba15
--- /dev/null
+++ b/.github/pull_request_template.md
@@ -0,0 +1,14 @@
+
+
+**Before requesting a review:**
+
+- [ ] I have ensured my PR title is accurate
+- [ ] I wrote a description of the changes being made, if it's not obvious
+- [ ] I have synced my branch with the base (i.e. `develop`)
+- [ ] I ran `make lint` on my branch and it passes
+- [ ] I ran the pytest tests that could reasonably be affected by my changes and they pass
+- [ ] I have performed a self code review of my own code on the "Files changed" tab of the pull request
+- [ ] I have commented my code in hard-to-understand areas
+- [ ] I have updated the documentation (in docstrings, notebooks, and .rst files)
+- [ ] I have added new tests that prove my fix is effective or that my feature works (or provided justification why not)
+- [ ] I have applied the appropriate labels to the PR (if your PR is not ready for review, use "WIP")
diff --git a/.github/workflows/build-container.yaml b/.github/workflows/build-container.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..9ccd0c5cba0bf8ddfc5b8773cd6f09b52eb77c5e
--- /dev/null
+++ b/.github/workflows/build-container.yaml
@@ -0,0 +1,50 @@
+name: TLT Containers Weekly Builder
+on:
+  workflow_dispatch: # Can be manually executed
+  schedule: # 1/week Sunday at 11:00PM
+    - cron: "5 23 * * 0"
+jobs:
+  build:
+    container: # MLOps Dev container for Compose Automation
+      image: ${{ vars.GHA_CONTAINER_IMAGE }}
+      env: # Add ENVS to control compose building
+        http_proxy: ${{ secrets.HTTP_PROXY }}
+        https_proxy: ${{ secrets.HTTPS_PROXY }}
+        no_proxy: ${{ secrets.NO_PROXY }}
+      credentials: # CAAS Registry Creds
+        username: ${{ secrets.REGISTRY_USER }}
+        password: ${{ secrets.REGISTRY_TOKEN }}
+    runs-on: [aia-devops] # Runner Label
+    steps:
+      - uses: actions/checkout@v3
+        with:
+          submodules: true
+          set-safe-directory: true
+      - name: Build Container
+        run: docker compose build
+        working-directory: ./docker
+  push:
+    needs: [build]
+    strategy:
+      matrix:
+        container: ["tlt-devel", "tlt-prod", "tlt-dist-devel", "tlt-dist-prod"] # name of Compose container
+    container:
+      image: ${{ vars.GHA_CONTAINER_IMAGE }}
+      env: # Add ENVS to control compose building
+        http_proxy: ${{ secrets.HTTP_PROXY }}
+        https_proxy: ${{ secrets.HTTPS_PROXY }}
+        no_proxy: ${{ secrets.NO_PROXY }}
+      credentials: # CAAS Registry Creds
+        username: ${{ secrets.REGISTRY_USER }}
+        password: ${{ secrets.REGISTRY_TOKEN }}
+    runs-on: [aia-devops]
+    steps:
+      - uses: docker/login-action@v2
+        with: # CAAS Registry Creds
+          registry: ${{ vars.GHA_REGISTRY }}
+          username: ${{ secrets.REGISTRY_USER }}
+          password: ${{ secrets.REGISTRY_TOKEN }}
+      - name: Push Container # tlt--
+        run: |
+          docker tag intel/ai-tools:${{ matrix.container }}-latest ${{ vars.GHA_REGISTRY_REPO }}:ww$(date +"%U")-${{ matrix.container }}
+          docker push ${{ vars.GHA_REGISTRY_REPO }}:ww$(date +"%U")-${{ matrix.container }}
diff --git a/.github/workflows/docs-test.yaml b/.github/workflows/docs-test.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..276c10318463794b0e676aff99a775cd71214329
--- /dev/null
+++ b/.github/workflows/docs-test.yaml
@@ -0,0 +1,34 @@
+name: Build and Test docs
+on:
+  pull_request:
+    types: [opened, synchronize, reopened]
+  # run the workflow if changes pushed to main or release branches
+  push:
+    branches:
+      - '**'
+    tags:
+      - '**'
+    paths:
+      - '**'
+
+# installs dependencies, builds the docs, and tests them
+jobs:
+  docs-test:
+    runs-on: [ aia-devops ]
+    container:
+      image: ${{ vars.GHA_IMAGE }}
+      env:
+        http_proxy: ${{ secrets.HTTP_PROXY }}
+        https_proxy: ${{ secrets.HTTPS_PROXY }}
+        no_proxy: ${{ secrets.NO_PROXY }}
+      # credentials:
+      #   username: ${{ secrets.REGISTRY_USER }}
+      #   password: ${{ secrets.REGISTRY_TOKEN }}
+      volumes:
+        - /tf_dataset/dataset/transfer_learning:/tmp/data
+    steps:
+      - uses: actions/checkout@v3
+      # Test the docs
+      - name: Run documentation tests
+        run: |
+          make test_docs
diff --git a/.github/workflows/integration.yaml b/.github/workflows/integration.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..a249bb351d6f6432b1d27f175e308bb7ce5ece66
--- /dev/null
+++ b/.github/workflows/integration.yaml
@@ -0,0 +1,41 @@
+name: Integration Test
+on:
+  pull_request_review:
+    types: [submitted]
+  # run the workflow if changes pushed to main or release branches
+  push:
+    branches:
+      - develop
+      - main
+      - r0.1
+      - r0.2
+      - r0.3
+      - r0.4
+      - r0.5
+    tags:
+      - '**'
+    paths:
+      - '**'
+jobs:
+  integration-test:
+    if: github.event.review.state == 'approved' ||
+      github.event.pull_request.merged == true ||
+      github.event_name == 'push'
+    runs-on: [ aia-devops ]
+    container:
+      image: ${{ vars.GHA_IMAGE }}
+      env:
+        http_proxy: ${{ secrets.HTTP_PROXY }}
+        https_proxy: ${{ secrets.HTTPS_PROXY }}
+        no_proxy: ${{ secrets.NO_PROXY }}
+      # credentials:
+      #   username: ${{ secrets.REGISTRY_USER }}
+      #   password: ${{ secrets.REGISTRY_TOKEN }}
+      volumes:
+        - /tf_dataset/dataset/transfer_learning:/tmp/data
+    steps:
+      - uses: actions/checkout@v3
+      - name: Run Integration Tests
+        shell: bash
+        continue-on-error: false
+        run: make integration
diff --git a/.github/workflows/nightly-integration.yaml b/.github/workflows/nightly-integration.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..e335f64dd97e97eb6c7af8a998214ba012171934
--- /dev/null
+++ b/.github/workflows/nightly-integration.yaml
@@ -0,0 +1,25 @@
+name: Nightly Integration Test
+on:
+  workflow_dispatch: # Can be manually executed
+  schedule: # nightly at 10:00PM
+    - cron: "0 22 * * *"
+jobs:
+  nightly-test:
+    runs-on: [ aia-devops ]
+    container:
+      image: ${{ vars.GHA_IMAGE }}
+      env:
+        http_proxy: ${{ secrets.HTTP_PROXY }}
+        https_proxy: ${{ secrets.HTTPS_PROXY }}
+        no_proxy: ${{ secrets.NO_PROXY }}
+      # credentials:
+      #   username: ${{ secrets.REGISTRY_USER }}
+      #   password: ${{ secrets.REGISTRY_TOKEN }}
+    steps:
+      - uses: actions/checkout@v3
+        with:
+          ref: develop
+      - name: Run Integration Test
+        shell: bash
+        continue-on-error: false
+        run: make integration
diff --git a/.github/workflows/nightly-notebook-test.yaml b/.github/workflows/nightly-notebook-test.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..55682314479834fffb883185536afc4e4bf582d8
--- /dev/null
+++ b/.github/workflows/nightly-notebook-test.yaml
@@ -0,0 +1,25 @@
+name: Nightly Notebooks Test
+on:
+  workflow_dispatch: # Can be manually executed
+  schedule: # nightly at 11:00PM
+    - cron: "0 23 * * *"
+jobs:
+  notebook-test:
+    runs-on: [ aia-devops ]
+    container:
+      image: ${{ vars.GHA_IMAGE }}
+      env:
+        http_proxy: ${{ secrets.HTTP_PROXY }}
+        https_proxy: ${{ secrets.HTTPS_PROXY }}
+        no_proxy: ${{ secrets.NO_PROXY }}
+        DATASET_DIR: /tmp/data
+        OUTPUT_DIR: /tmp/output
+      # credentials:
+      #   username: ${{ secrets.REGISTRY_USER }}
+      #   password: ${{ secrets.REGISTRY_TOKEN }}
+    steps:
+      - uses: actions/checkout@v3
+        with:
+          ref: develop
+      - name: Run Notebook Tests
+        run: make test_notebook_catalog
diff --git a/.github/workflows/notebook-test.yaml b/.github/workflows/notebook-test.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..dcc025a0fae594dd544bd73efc9bdb75efe277cd
--- /dev/null
+++ b/.github/workflows/notebook-test.yaml
@@ -0,0 +1,41 @@
+name: Notebooks Test
+on:
+  pull_request_review:
+    types: [submitted]
+  # run the workflow if changes pushed to main or release branches
+  push:
+    branches:
+      - develop
+      - main
+      - r0.1
+      - r0.2
+      - r0.3
+      - r0.4
+      - r0.5
+    tags:
+      - '**'
+    paths:
+      - '**'
+jobs:
+  notebook-test:
+    if: github.event.review.state == 'approved' ||
+      github.event.pull_request.merged == true ||
+      github.event_name == 'push'
+    runs-on: [ aia-devops ]
+    container:
+      image: ${{ vars.GHA_IMAGE }}
+      env:
+        http_proxy: ${{ secrets.HTTP_PROXY }}
+        https_proxy: ${{ secrets.HTTPS_PROXY }}
+        no_proxy: ${{ secrets.NO_PROXY }}
+        DATASET_DIR: /tmp/data
+        OUTPUT_DIR: /tmp/output
+      # credentials:
+      #   username: ${{ secrets.REGISTRY_USER }}
+      #   password: ${{ secrets.REGISTRY_TOKEN }}
+      volumes:
+        - /tf_dataset/dataset/transfer_learning:/tmp/data
+    steps:
+      - uses: actions/checkout@v3
+      - name: Run Notebook Tests
+        run: make test_notebook_custom
diff --git a/.github/workflows/style-test.yaml b/.github/workflows/style-test.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..51a35ed48b9116a49b41bd4cfdcc3ab0282abfcf
--- /dev/null
+++ b/.github/workflows/style-test.yaml
@@ -0,0 +1,30 @@
+name: Style Checks
+on:
+  pull_request:
+    types: [opened, synchronize, reopened]
+  # run the workflow if changes pushed to main or release branches
+  push:
+    branches:
+      - '**'
+    tags:
+      - '**'
+    paths:
+      - '**'
+# installs dependencies and runs the linter
+jobs:
+  style-test:
+    runs-on: [ aia-devops ]
+    container:
+      image: ${{ vars.GHA_IMAGE }}
+      env:
+        http_proxy: ${{ secrets.HTTP_PROXY }}
+        https_proxy: ${{ secrets.HTTPS_PROXY }}
+        no_proxy: ${{ secrets.NO_PROXY }}
+      # credentials:
+      #   username: ${{ secrets.REGISTRY_USER }}
+      #   password: ${{ secrets.REGISTRY_TOKEN }}
+    steps:
+      - uses: actions/checkout@v3
+      - name: Run linter
+        run: |
+          make lint
diff --git a/.github/workflows/unittest.yaml b/.github/workflows/unittest.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..c135c31088a6ebf9c4bc65a428b29b817f8e9efb
--- /dev/null
+++ b/.github/workflows/unittest.yaml
@@ -0,0 +1,30 @@
+name: Unit Test
+on:
+  pull_request:
+    types: [opened, synchronize, reopened]
+  # run the workflow if changes pushed to main or release branches
+  push:
+    branches:
+      - '**'
+    tags:
+      - '**'
+    paths:
+      - '**'
+jobs:
+  unit-test:
+    runs-on: [ aia-devops ]
+    container:
+      image: ${{ vars.GHA_IMAGE }}
+      env:
+        http_proxy: ${{ secrets.HTTP_PROXY }}
+        https_proxy: ${{ secrets.HTTPS_PROXY }}
+        no_proxy: ${{ secrets.NO_PROXY }}
+      # credentials:
+      #   username: ${{ secrets.REGISTRY_USER }}
+      #   password: ${{ secrets.REGISTRY_TOKEN }}
+    steps:
+      - uses: actions/checkout@v3
+      - name: Run Unit Test
+        shell: bash
+        continue-on-error: false
+        run: make unittest
diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000000000000000000000000000000000000..c89a2aafc5bdc0ee4aaebedb1c836a3518a6b46d
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,20 @@
+_autosummary
+.coverage
+.DS_Store
+.idea*
+.ipynb_checkpoints
+.vscode
+*.egg-info/
+*.pyc
+**.log
+**/*.cache
+**/**.whl
+**/**/models/
+**/**venv
+**venv*
+build/
+data
+dist/
+docs/_build/
+nc_workspace
+output
diff --git a/CODEOWNERS b/CODEOWNERS
new file mode 100644
index 0000000000000000000000000000000000000000..0ce3b508a6107b6f54d990ba5e651db7134f5fed
--- /dev/null
+++ b/CODEOWNERS
@@ -0,0 +1,59 @@
+# This is a comment.
+# Each line is a file pattern followed by one or more owners.
+
+# These owners will be the default owners for everything in
+# the repo. Unless a later match takes precedence,
+# @global-owner1 and @global-owner2 will be requested for
+# review when someone opens a pull request.
+* @ashahba @dmsuehir @etcylfleet @HarshaRamayanam @mhbuehler @okhleif-IL
+
+# Order is important; the last matching pattern takes the most
+# precedence. When someone opens a pull request that only
+# modifies JS files, only @js-owner and not the global
+# owner(s) will be requested for a review.
+# *.js @js-owner #This is an inline comment.
+
+# You can also use email addresses if you prefer. They'll be
+# used to look up users just like we do for commit author
+# emails.
+# *.go docs@example.com
+
+# Teams can be specified as code owners as well. Teams should
+# be identified in the format @org/team-name. Teams must have
+# explicit write access to the repository. In this example,
+# the octocats team in the octo-org organization owns all .txt files.
+# *.txt @octo-org/octocats
+
+# In this example, @doctocat owns any files in the build/logs
+# directory at the root of the repository and any of its
+# subdirectories.
+# /build/logs/ @doctocat
+
+# The `docs/*` pattern will match files like
+# `docs/getting-started.md` but not further nested files like
+# `docs/build-app/troubleshooting.md`.
+# docs/* docs@example.com
+
+# In this example, @octocat owns any file in an apps directory
+# anywhere in your repository.
+# apps/ @octocat
+
+# In this example, @doctocat owns any file in the `/docs`
+# directory in the root of your repository and any of its
+# subdirectories.
+# /docs/ @doctocat
+
+# In this example, any change inside the `/scripts` directory
+# will require approval from @doctocat or @octocat.
+# /scripts/ @doctocat @octocat
+
+# In this example, @octocat owns any file in a `/logs` directory such as
+# `/build/logs`, `/scripts/logs`, and `/deeply/nested/logs`. Any changes
+# in a `/logs` directory will require approval from @octocat.
+# **/logs @octocat
+
+# In this example, @octocat owns any file in the `/apps`
+# directory in the root of your repository except for the `/apps/github`
+# subdirectory, as its owners are left empty.
+# /apps/ @octocat +# /apps/github diff --git a/DATASETS.md b/DATASETS.md new file mode 100644 index 0000000000000000000000000000000000000000..ed56ed3c471de79a613e7bc539c4d1d1ebb7ae80 --- /dev/null +++ b/DATASETS.md @@ -0,0 +1,30 @@ +# Datasets + +This is a comprehensive list of public datasets used by this repository. + +| Name (Link/Source) | Framework | Use Case | +|--------------------| --------- | -------- | +| [AG News (Hugging Face)](https://huggingface.co/datasets/ag_news) | PyTorch | Text Classification | +| [AG News (TFDS)](https://www.tensorflow.org/datasets/catalog/ag_news_subset) | TensorFlow | Text Classification | +| [Food101 (Torchvision)](https://pytorch.org/vision/stable/generated/torchvision.datasets.Food101.html#torchvision.datasets.Food101) | PyTorch | Image Classification | +| [Food101 (TFDS)](https://www.tensorflow.org/datasets/catalog/food101) | TensorFlow | Image Classification | +| [SMS Spam Collection](https://archive.ics.uci.edu/dataset/228/sms+spam+collection) | PyTorch & TensorFlow | Text Classification | +| [TF Flowers (TFDS)](https://www.tensorflow.org/datasets/catalog/tf_flowers) | PyTorch & TensorFlow | Image Classification | +| [Cats vs. Dogs (TFDS)](https://www.tensorflow.org/datasets/catalog/cats_vs_dogs) | TensorFlow | Image Classification | +| [Country211 (Torchvision)](https://pytorch.org/vision/stable/generated/torchvision.datasets.Country211.html#torchvision.datasets.Country211) | PyTorch | Image Classification | +| [DTD (Torchvision)](https://pytorch.org/vision/stable/generated/torchvision.datasets.DTD.html#torchvision.datasets.DTD) | PyTorch | Image Classification | +| [FGVCAircraft (Torchvision)](https://pytorch.org/vision/stable/generated/torchvision.datasets.FGVCAircraft.html#torchvision.datasets.FGVCAircraft) | PyTorch | Image Classification | +| [RenderedSST2 (Torchvision)](https://pytorch.org/vision/stable/generated/torchvision.datasets.RenderedSST2.html#torchvision.datasets.RenderedSST2) | PyTorch | Image Classification | +| [Rock Paper Scissors (TFDS)](https://www.tensorflow.org/datasets/catalog/rock_paper_scissors) | TensorFlow | Image Classification | +| [Rotten_Tomatoes (Hugging Face)](https://huggingface.co/datasets/rotten_tomatoes) | PyTorch | Text Classification | +| [TweetEval (Hugging Face)](https://huggingface.co/datasets/tweet_eval) | PyTorch | Text Classification | +| [CIFAR10 (Torchvision)](https://pytorch.org/vision/stable/generated/torchvision.datasets.CIFAR10.html#torchvision.datasets.CIFAR10) | PyTorch | Image Classification | +| [IMDB Reviews (Hugging Face)](https://huggingface.co/datasets/imdb) | PyTorch | Text Classification | +| [IMDB Reviews (TFDS)](https://www.tensorflow.org/datasets/catalog/imdb_reviews) | TensorFlow | Text Classification | +| [GLUE/SST2 (TFDS)](https://www.tensorflow.org/datasets/catalog/glue#gluesst2) | TensorFlow | Text Classification | +| [GLUE/COLA (TFDS)](https://www.tensorflow.org/datasets/catalog/glue#gluecola_default_config) | TensorFlow | Text Classification | +| [Colorectal Histology (TFDS)](https://www.tensorflow.org/datasets/catalog/colorectal_histology) | TensorFlow | Image Classification | +| [RESISC45 (TFDS)](https://www.tensorflow.org/datasets/catalog/resisc45) | TensorFlow | Image Classification | +| [CDD-CESM](https://wiki.cancerimagingarchive.net/pages/viewpage.action?pageId=109379611) | PyTorch & TensorFlow | Image & Text Classification | +| [SQuAD](https://rajpurkar.github.io/SQuAD-explorer/) | PyTorch & TensorFlow | Text Classification | +| 
[MVTec](https://www.mvtec.com/company/research/datasets/mvtec-ad) | PyTorch | Anomaly Detection |
diff --git a/GetStarted.md b/GetStarted.md
new file mode 100644
index 0000000000000000000000000000000000000000..d52f56a86d2871d9057574d59160e767b6411488
--- /dev/null
+++ b/GetStarted.md
@@ -0,0 +1,263 @@
+# Get Started
+
+This is a guide for getting started with the Intel® Transfer Learning Tool. It
+walks you through the steps to check system requirements, install, and then run
+the tool with a couple of examples showing no-code CLI and low-code API
+approaches.
+
+Intel Transfer Learning Tool Get Started Flow
+
+## ① Check System Requirements
+
+| Recommended Hardware | Precision |
+| ---------------------------- | ---------- |
+| Intel® 4th Gen Xeon® Scalable Performance processors | BF16 |
+| Intel® 1st, 2nd, 3rd, and 4th Gen Xeon® Scalable Performance processors | FP32 |
+
+| Resource | Minimum |
+| ---------------------------- | ---------- |
+| CPU Cores | 8 (16+ recommended) |
+| RAM | 16 GB (24-32+ GB recommended) |
+| Disk space | 10 GB minimum (can vary based on datasets downloaded) |
+
+| Required Software |
+| ------------------------- |
+| Linux\* system (validated on Ubuntu\* 20.04/22.04 LTS) |
+| Python (3.8, 3.9, or 3.10) |
+| Pip |
+| Conda or Python virtualenv |
+| git (only required for advanced installation) |
+
+## ② Install
+
+1. **Install Dependencies**
+
+   Install required packages using:
+
+   ```
+   sudo apt-get install build-essential python3-dev libgl1 libglib2.0-0
+   ```
+
+2. **Create and activate a Python3 virtual environment**
+
+   We encourage you to use a Python virtual environment (virtualenv or conda)
+   for consistent package management. There are two ways to do this:
+
+   a. Use `virtualenv`:
+
+      ```
+      virtualenv -p python3 tlt_dev_venv
+      source tlt_dev_venv/bin/activate
+      ```
+
+   b. Or use `conda`:
+
+      ```
+      conda create --name tlt_dev_venv python=3.9
+      conda activate tlt_dev_venv
+      ```
+
+3. **Install Intel Transfer Learning Tool**
+
+   Use the Basic Installation instructions unless you plan on making code changes.
+
+   a. **Basic Installation**
+
+      ```
+      pip install intel-transfer-learning-tool
+      ```
+
+   b. **Advanced Installation**
+
+      Clone the repo:
+
+      ```
+      git clone https://github.com/IntelAI/transfer-learning.git
+      cd transfer-learning
+      ```
+
+      Then either do an editable install to avoid a rebuild and
+      install after each code change (preferred):
+
+      ```
+      pip install --editable .
+      ```
+
+      or build and install a wheel:
+
+      ```
+      python setup.py bdist_wheel
+      pip install dist/intel_transfer_learning_tool-0.5.0-py3-none-any.whl
+      ```
+
+4. **Additional Feature-Specific Steps**
+
+   * For distributed/multinode training, follow these additional
+     [distributed training instructions](tlt/distributed/README.md).
+
+5. **Verify Installation**
+
+   Verify that your installation was successful by using the following
+   command, which displays help information about the Intel Transfer Learning Tool:
+
+   ```
+   tlt --help
+   ```
+
+## ③ Run the Intel Transfer Learning Tool
+
+With the Intel Transfer Learning Tool, you can train AI models with TensorFlow or
+PyTorch using either no-code CLI commands at a bash prompt, or low-code API
+calls from a Python script. Both approaches provide the same opportunities for
+training, evaluation, optimization, and benchmarking. The CLI requires no
+programming experience, while the API requires only basic Python knowledge.
+Choose the approach that works best for you.
+
+
+### Run Using the No-Code CLI
+
+Now that the tool is installed, let's train a model using CLI commands. This
+example uses the CLI to train an image classifier to identify different types
+of flowers. You can see a list of all
+available image classifier models using the command:
+
+```
+tlt list models --use-case image_classification
+```
+
+**Train a Model**
+
+In this example, we'll use the `tlt train` command to retrain the TensorFlow
+ResNet50v1.5 model using a flowers dataset from the
+[TensorFlow Datasets catalog](https://www.tensorflow.org/datasets/catalog/tf_flowers).
+The `--dataset-dir` and `--output-dir` paths need to point to writable folders on your system.
+```
+# Use the following environment variable setting to reduce the warnings and log output from TensorFlow
+export TF_CPP_MIN_LOG_LEVEL="2"
+
+tlt train -f tensorflow --model-name resnet_v1_50 --dataset-name tf_flowers --dataset-dir "/tmp/data-${USER}" --output-dir "/tmp/output-${USER}"
+```
+```
+Model name: resnet_v1_50
+Framework: tensorflow
+Dataset name: tf_flowers
+Training epochs: 1
+Dataset dir: /tmp/data-user
+Output directory: /tmp/output-user
+...
+Model: "sequential"
+_________________________________________________________________
+Layer (type)                 Output Shape              Param #
+=================================================================
+keras_layer (KerasLayer)     (None, 2048)              23561152
+dense (Dense)                (None, 5)                 10245
+=================================================================
+Total params: 23,571,397
+Trainable params: 10,245
+Non-trainable params: 23,561,152
+_________________________________________________________________
+Checkpoint directory: /tmp/output-user/resnet_v1_50_checkpoints
+86/86 [==============================] - 24s 248ms/step - loss: 0.4600 - acc: 0.8438
+Saved model directory: /tmp/output-user/resnet_v1_50/1
+```
+
+After training completes, the `tlt train` command evaluates the model. The loss and
+accuracy values are printed toward the end of the console output. The model is
+exported to the output directory you specified, in a numbered folder created for
+each training run.
+
+**Next Steps**
+
+That ends this Get Started CLI example. As a next step, you can also follow the
+[Beyond Get Started CLI Example](examples/cli/README.md) for a complete example
+that includes evaluation, benchmarking, and quantization.
+
+Read about all the CLI commands in the [CLI reference](/cli.md).
+Find more examples in our list of [Examples](examples/README.md).
+
+### Run Using the Low-Code API
+
+The following Python code example trains an image classification model with the TensorFlow
+flowers dataset using API calls from Python. The model is
+benchmarked and quantized to INT8 precision for improved inference performance.
+
+You can run the API example using a Jupyter notebook. See the [notebook setup
+instructions](/notebooks/setup.md) for more details on preparing the Jupyter
+notebook environment.
+
+```python
+import os
+
+os.environ["TF_CPP_MIN_LOG_LEVEL"] = "2"
+
+from tlt.datasets import dataset_factory
+from tlt.models import model_factory
+from tlt.utils.types import FrameworkType, UseCaseType
+
+username = os.getenv('USER', 'user')
+
+# Specify a writable directory for the dataset to be downloaded
+dataset_dir = '/tmp/data-{}'.format(username)
+if not os.path.exists(dataset_dir):
+    os.makedirs(dataset_dir)
+
+# Specify a writable directory for output (such as saved model files)
+output_dir = '/tmp/output-{}'.format(username)
+if not os.path.exists(output_dir):
+    os.makedirs(output_dir)
+
+# Get the model
+model = model_factory.get_model(model_name="resnet_v1_50", framework=FrameworkType.TENSORFLOW)
+
+# Download and preprocess the flowers dataset from the TensorFlow datasets catalog
+dataset = dataset_factory.get_dataset(dataset_dir=dataset_dir,
+                                      dataset_name='tf_flowers',
+                                      use_case=UseCaseType.IMAGE_CLASSIFICATION,
+                                      framework=FrameworkType.TENSORFLOW,
+                                      dataset_catalog='tf_datasets')
+dataset.preprocess(image_size=model.image_size, batch_size=32)
+dataset.shuffle_split(train_pct=.75, val_pct=.25)
+
+# Train the model using the dataset
+model.train(dataset, output_dir=output_dir, epochs=1)
+
+# Evaluate the trained model
+metrics = model.evaluate(dataset)
+for metric_name, metric_value in zip(model._model.metrics_names, metrics):
+    print("{}: {}".format(metric_name, metric_value))
+
+# Export the model
+saved_model_dir = model.export(output_dir=output_dir)
+
+# Quantize the trained model
+quantization_output = os.path.join(output_dir, "quantized_model")
+model.quantize(quantization_output, dataset, overwrite_model=True)
+
+# Benchmark the quantized model using Intel Neural Compressor
+model.benchmark(dataset, saved_model_dir=quantization_output)
+
+# Do graph optimization on the trained model
+optimization_output = os.path.join(output_dir, "optimized_model")
+model.optimize_graph(optimization_output, overwrite_model=True)
+```
+
+For more information on the API, see the [API Documentation](/api.md).
+
+## Summary and Next Steps
+
+The Intel Transfer Learning Tool can be used to develop an AI model and export
+an Intel-optimized saved model for deployment. The sample CLI and API commands
+we've presented show how to execute end-to-end transfer learning workflows.
+
+For the no-code CLI, you can follow a
+complete example that includes training, evaluation, benchmarking, and quantization,
+as well as some additional models, in the [Beyond Get Started
+CLI example](examples/cli/README.md) documentation. You can also read about all the
+CLI commands in the [CLI reference](/cli.md).
+
+For the low-code API, read about the API in the [API Documentation](/api.md).
+
+Find more CLI and API examples in our list of [Examples](examples/README.md).
diff --git a/LICENSE b/LICENSE
new file mode 100644
index 0000000000000000000000000000000000000000..01c7ad7facd90ef32a6a409d261ad90689d7e7b1
--- /dev/null
+++ b/LICENSE
@@ -0,0 +1,202 @@
+
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+ + "Legal Entity" shall mean the union of the acting entity and all + other entities that control, are controlled by, or are under common + control with that entity. For the purposes of this definition, + "control" means (i) the power, direct or indirect, to cause the + direction or management of such entity, whether by contract or + otherwise, or (ii) ownership of fifty percent (50%) or more of the + outstanding shares, or (iii) beneficial ownership of such entity. + + "You" (or "Your") shall mean an individual or Legal Entity + exercising permissions granted by this License. + + "Source" form shall mean the preferred form for making modifications, + including but not limited to software source code, documentation + source, and configuration files. + + "Object" form shall mean any form resulting from mechanical + transformation or translation of a Source form, including but + not limited to compiled object code, generated documentation, + and conversions to other media types. + + "Work" shall mean the work of authorship, whether in Source or + Object form, made available under the License, as indicated by a + copyright notice that is included in or attached to the work + (an example is provided in the Appendix below). + + "Derivative Works" shall mean any work, whether in Source or Object + form, that is based on (or derived from) the Work and for which the + editorial revisions, annotations, elaborations, or other modifications + represent, as a whole, an original work of authorship. For the purposes + of this License, Derivative Works shall not include works that remain + separable from, or merely link (or bind by name) to the interfaces of, + the Work and Derivative Works thereof. + + "Contribution" shall mean any work of authorship, including + the original version of the Work and any modifications or additions + to that Work or Derivative Works thereof, that is intentionally + submitted to Licensor for inclusion in the Work by the copyright owner + or by an individual or Legal Entity authorized to submit on behalf of + the copyright owner. For the purposes of this definition, "submitted" + means any form of electronic, verbal, or written communication sent + to the Licensor or its representatives, including but not limited to + communication on electronic mailing lists, source code control systems, + and issue tracking systems that are managed by, or on behalf of, the + Licensor for the purpose of discussing and improving the Work, but + excluding communication that is conspicuously marked or otherwise + designated in writing by the copyright owner as "Not a Contribution." + + "Contributor" shall mean Licensor and any individual or Legal Entity + on behalf of whom a Contribution has been received by Licensor and + subsequently incorporated within the Work. + + 2. Grant of Copyright License. Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + copyright license to reproduce, prepare Derivative Works of, + publicly display, publicly perform, sublicense, and distribute the + Work and such Derivative Works in Source or Object form. + + 3. Grant of Patent License. 
Subject to the terms and conditions of + this License, each Contributor hereby grants to You a perpetual, + worldwide, non-exclusive, no-charge, royalty-free, irrevocable + (except as stated in this section) patent license to make, have made, + use, offer to sell, sell, import, and otherwise transfer the Work, + where such license applies only to those patent claims licensable + by such Contributor that are necessarily infringed by their + Contribution(s) alone or by combination of their Contribution(s) + with the Work to which such Contribution(s) was submitted. If You + institute patent litigation against any entity (including a + cross-claim or counterclaim in a lawsuit) alleging that the Work + or a Contribution incorporated within the Work constitutes direct + or contributory patent infringement, then any patent licenses + granted to You under this License for that Work shall terminate + as of the date such litigation is filed. + + 4. Redistribution. You may reproduce and distribute copies of the + Work or Derivative Works thereof in any medium, with or without + modifications, and in Source or Object form, provided that You + meet the following conditions: + + (a) You must give any other recipients of the Work or + Derivative Works a copy of this License; and + + (b) You must cause any modified files to carry prominent notices + stating that You changed the files; and + + (c) You must retain, in the Source form of any Derivative Works + that You distribute, all copyright, patent, trademark, and + attribution notices from the Source form of the Work, + excluding those notices that do not pertain to any part of + the Derivative Works; and + + (d) If the Work includes a "NOTICE" text file as part of its + distribution, then any Derivative Works that You distribute must + include a readable copy of the attribution notices contained + within such NOTICE file, excluding those notices that do not + pertain to any part of the Derivative Works, in at least one + of the following places: within a NOTICE text file distributed + as part of the Derivative Works; within the Source form or + documentation, if provided along with the Derivative Works; or, + within a display generated by the Derivative Works, if and + wherever such third-party notices normally appear. The contents + of the NOTICE file are for informational purposes only and + do not modify the License. You may add Your own attribution + notices within Derivative Works that You distribute, alongside + or as an addendum to the NOTICE text from the Work, provided + that such additional attribution notices cannot be construed + as modifying the License. + + You may add Your own copyright statement to Your modifications and + may provide additional or different license terms and conditions + for use, reproduction, or distribution of Your modifications, or + for any such Derivative Works as a whole, provided Your use, + reproduction, and distribution of the Work otherwise complies with + the conditions stated in this License. + + 5. Submission of Contributions. Unless You explicitly state otherwise, + any Contribution intentionally submitted for inclusion in the Work + by You to the Licensor shall be under the terms and conditions of + this License, without any additional terms or conditions. + Notwithstanding the above, nothing herein shall supersede or modify + the terms of any separate license agreement you may have executed + with Licensor regarding such Contributions. + + 6. Trademarks. 
This License does not grant permission to use the trade + names, trademarks, service marks, or product names of the Licensor, + except as required for reasonable and customary use in describing the + origin of the Work and reproducing the content of the NOTICE file. + + 7. Disclaimer of Warranty. Unless required by applicable law or + agreed to in writing, Licensor provides the Work (and each + Contributor provides its Contributions) on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or + implied, including, without limitation, any warranties or conditions + of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A + PARTICULAR PURPOSE. You are solely responsible for determining the + appropriateness of using or redistributing the Work and assume any + risks associated with Your exercise of permissions under this License. + + 8. Limitation of Liability. In no event and under no legal theory, + whether in tort (including negligence), contract, or otherwise, + unless required by applicable law (such as deliberate and grossly + negligent acts) or agreed to in writing, shall any Contributor be + liable to You for damages, including any direct, indirect, special, + incidental, or consequential damages of any character arising as a + result of this License or out of the use or inability to use the + Work (including but not limited to damages for loss of goodwill, + work stoppage, computer failure or malfunction, or any and all + other commercial damages or losses), even if such Contributor + has been advised of the possibility of such damages. + + 9. Accepting Warranty or Additional Liability. While redistributing + the Work or Derivative Works thereof, You may choose to offer, + and charge a fee for, acceptance of support, warranty, indemnity, + or other liability obligations and/or rights consistent with this + License. However, in accepting such obligations, You may act only + on Your own behalf and on Your sole responsibility, not on behalf + of any other Contributor, and only if You agree to indemnify, + defend, and hold each Contributor harmless for any liability + incurred by, or claims asserted against, such Contributor by reason + of your accepting any such warranty or additional liability. + + END OF TERMS AND CONDITIONS + + APPENDIX: How to apply the Apache License to your work. + + To apply the Apache License to your work, attach the following + boilerplate notice, with the fields enclosed by brackets "[]" + replaced with your own identifying information. (Don't include + the brackets!) The text should be enclosed in the appropriate + comment syntax for the file format. We also recommend that a + file or class name and description of purpose be included on the + same "printed page" as the copyright notice for easier + identification within third-party archives. + + Copyright 2018 Intel Corporation + + Licensed under the Apache License, Version 2.0 (the "License"); + you may not use this file except in compliance with the License. + You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. 
diff --git a/Legal.md b/Legal.md new file mode 100644 index 0000000000000000000000000000000000000000..09ae9d2a936306484157e53fd0a98c169a86d484 --- /dev/null +++ b/Legal.md @@ -0,0 +1,34 @@ +# Legal Information + +## Disclaimer + +Intel® Transfer Learning Tool scripts are not intended for benchmarking Intel® platforms. For any +performance and/or benchmarking information on specific Intel platforms, visit +https://www.intel.ai/blog. + +Intel is committed to the respect of human rights and avoiding complicity in +human rights abuses, a policy reflected in the Intel Global Human Rights +Principles. Accordingly, by accessing the Intel material on this platform you +agree that you will not use the material in a product or application that causes +or contributes to a violation of an internationally recognized human right. + +## License + +Intel® Transfer Learning Tool, documentation, and example code are all licensed +under Apache License Version 2.0. + +## Datasets + +To the extent that any [public datasets](DATASETS.md) are referenced by Intel or accessed using +tools or code on this site those datasets are provided by the third party +indicated as the data source. Intel does not create the data, or datasets, and +does not warrant their accuracy or quality. By accessing the public dataset(s) +you agree to the terms associated with those datasets and that your use complies +with the applicable license. + +Intel expressly disclaims the accuracy, adequacy, or completeness of any public +datasets, and is not liable for any errors, omissions, or defects in the data, +or for any reliance on the data. Intel is not liable for any liability or +damages relating to your use of public datasets. + +\*Other names and brands may be claimed as the property of others. [Trademarks](http://www.intel.com/content/www/us/en/legal/trademarks.html) diff --git a/MANIFEST.in b/MANIFEST.in new file mode 100644 index 0000000000000000000000000000000000000000..9afb2db7ce63be3c658894461a6724f06ffa8098 --- /dev/null +++ b/MANIFEST.in @@ -0,0 +1 @@ +recursive-include tlt * diff --git a/Makefile b/Makefile new file mode 100644 index 0000000000000000000000000000000000000000..4cf64160173973673a3b31c21ecb714c9fa2838e --- /dev/null +++ b/Makefile @@ -0,0 +1,112 @@ +# +# Copyright (c) 2022 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# +# SPDX-License-Identifier: Apache-2.0 +# + +# Note: These are just placeholders for future additions to Makefile. +# You can remove these comments later. +ACTIVATE_TLT_VENV = "tlt_dev_venv/bin/activate" +ACTIVATE_NOTEBOOK_VENV = "tlt_notebook_venv/bin/activate" +ACTIVATE_TEST_VENV = "tlt_test_venv/bin/activate" +ACTIVATE_DOCS_VENV = $(ACTIVATE_TEST_VENV) + +# Customize sample test run commands +# PY_TEST_EXTRA_ARGS="'-vvv -k test_platform_util_with_no_args'" make test +# PY_TEST_EXTRA_ARGS="'--collect-only'" make test +PY_TEST_EXTRA_ARGS ?= "--durations=0" + +tlt_test_venv: $(CURDIR)/tests/requirements-test.txt + @echo "Creating a virtualenv tlt_test_venv..." 
+	@test -d tlt_test_venv || virtualenv -p python3 tlt_test_venv
+
+	@echo "Building the TLT API in tlt_test_venv env..."
+	@. $(ACTIVATE_TEST_VENV) && pip install --editable .
+
+	@echo "Installing test dependencies..."
+	@. $(ACTIVATE_TEST_VENV) && pip install -r $(CURDIR)/tests/requirements-test.txt
+
+test: unittest integration
+
+unittest: tlt_test_venv
+	@echo "Testing unit test API..."
+	@. $(ACTIVATE_TEST_VENV) && PYTHONPATH=$(CURDIR)/tests py.test -vvv -s $(PY_TEST_EXTRA_ARGS) "-k not integration and not skip"
+
+integration: tlt_test_venv
+	@echo "Testing integration test API..."
+	@. $(ACTIVATE_TEST_VENV) && PYTHONPATH=$(CURDIR)/tests py.test -vvv -s $(PY_TEST_EXTRA_ARGS) "-k integration and not skip"
+
+lint: tlt_test_venv
+	@echo "Style checks..."
+	@. $(ACTIVATE_TEST_VENV) && flake8 tlt tests downloader
+
+clean:
+	rm -rf tlt_test_venv
+
+tlt_docs_venv: tlt_test_venv $(CURDIR)/docs/requirements-docs.txt
+	@echo "Installing docs dependencies..."
+	@. $(ACTIVATE_DOCS_VENV) && pip install -r $(CURDIR)/docs/requirements-docs.txt
+
+html: tlt_docs_venv
+	@echo "Building Sphinx documentation..."
+	@. $(ACTIVATE_DOCS_VENV) && $(MAKE) -C docs clean html
+
+test_docs: html
+	@echo "Testing Sphinx documentation..."
+	@. $(ACTIVATE_DOCS_VENV) && $(MAKE) -C docs doctest
+
+# Install the notebook dependencies into tlt_test_venv, which the notebook
+# test targets below activate (a second standalone notebook venv rule was
+# removed here because it overrode this recipe and was never activated)
+tlt_notebook_venv: tlt_test_venv
+	@echo "Installing notebook dependencies..."
+	@. $(ACTIVATE_TEST_VENV) && pip install -r $(CURDIR)/notebooks/requirements.txt
+
+test_notebook_custom: tlt_notebook_venv
+	@echo "Testing Jupyter notebooks with custom datasets..."
+	@. $(ACTIVATE_TEST_VENV) && \
+	bash run_notebooks.sh $(CURDIR)/notebooks/image_classification/tlt_api_tf_image_classification/TLT_TF_Image_Classification_Transfer_Learning.ipynb remove_for_custom_dataset && \
+	bash run_notebooks.sh $(CURDIR)/notebooks/image_classification/tlt_api_pyt_image_classification/TLT_PyTorch_Image_Classification_Transfer_Learning.ipynb remove_for_custom_dataset && \
+	bash run_notebooks.sh $(CURDIR)/notebooks/text_classification/tlt_api_tf_text_classification/TLT_TF_Text_Classification.ipynb remove_for_custom_dataset && \
+	bash run_notebooks.sh $(CURDIR)/notebooks/text_classification/tlt_api_pyt_text_classification/TLT_PYT_Text_Classification.ipynb remove_for_custom_dataset
+
+test_notebook_catalog: tlt_notebook_venv
+	@echo "Testing Jupyter notebooks with public catalog datasets..."
+	@. $(ACTIVATE_TEST_VENV) && \
+	bash run_notebooks.sh $(CURDIR)/notebooks/image_classification/tlt_api_tf_image_classification/TLT_TF_Image_Classification_Transfer_Learning.ipynb remove_for_tf_dataset && \
+	bash run_notebooks.sh $(CURDIR)/notebooks/image_classification/tlt_api_pyt_image_classification/TLT_PyTorch_Image_Classification_Transfer_Learning.ipynb remove_for_tv_dataset && \
+	bash run_notebooks.sh $(CURDIR)/notebooks/text_classification/tlt_api_tf_text_classification/TLT_TF_Text_Classification.ipynb remove_for_tf_dataset && \
+	bash run_notebooks.sh $(CURDIR)/notebooks/text_classification/tlt_api_pyt_text_classification/TLT_PYT_Text_Classification.ipynb remove_for_hf_dataset
+
+test_tf_notebook: tlt_notebook_venv
+	@. $(ACTIVATE_TEST_VENV) && bash run_notebooks.sh tensorflow
+
+test_pyt_notebook: tlt_notebook_venv
+	@. 
$(ACTIVATE_TEST_VENV) && bash run_notebooks.sh pytorch + +dist: tlt_docs_venv + @echo "Create binary wheel..." + @. $(ACTIVATE_DOCS_VENV) && python setup.py bdist_wheel + +check_dist: dist + @echo "Testing the wheel..." + @. $(ACTIVATE_DOCS_VENV) && \ + pip install twine && \ + python setup.py bdist_wheel && \ + twine check dist/* diff --git a/Models.md b/Models.md new file mode 100644 index 0000000000000000000000000000000000000000..e44dfaeb2ee2d283218c9d2c2e464ccb1a7209e9 --- /dev/null +++ b/Models.md @@ -0,0 +1,178 @@ +# Intel® Transfer Learning Tool Supported Models + +## Image Classification + +| Model name | Framework | Model Hub | +|------------|-----------|-----------| +| alexnet | PyTorch* | Torchvision* | +| convnext_base | PyTorch | Torchvision | +| convnext_large | PyTorch | Torchvision | +| convnext_small | PyTorch | Torchvision | +| convnext_tiny | PyTorch | Torchvision | +| densenet121 | PyTorch | Torchvision | +| densenet161 | PyTorch | Torchvision | +| densenet169 | PyTorch | Torchvision | +| densenet201 | PyTorch | Torchvision | +| efficientnetv2-b0 | TensorFlow* | TensorFlow Hub* | +| efficientnetv2-b1 | TensorFlow | TensorFlow Hub | +| efficientnetv2-b2 | TensorFlow | TensorFlow Hub | +| efficientnetv2-b3 | TensorFlow | TensorFlow Hub | +| efficientnetv2-s | TensorFlow | TensorFlow Hub | +| efficientnet_b0 | TensorFlow | TensorFlow Hub | +| efficientnet_b0 | PyTorch | Torchvision | +| efficientnet_b1 | TensorFlow | TensorFlow Hub | +| efficientnet_b1 | PyTorch | Torchvision | +| efficientnet_b2 | TensorFlow | TensorFlow Hub | +| efficientnet_b2 | PyTorch | Torchvision | +| efficientnet_b3 | TensorFlow | TensorFlow Hub | +| efficientnet_b3 | PyTorch | Torchvision | +| efficientnet_b4 | TensorFlow | TensorFlow Hub | +| efficientnet_b4 | PyTorch | Torchvision | +| efficientnet_b5 | TensorFlow | TensorFlow Hub | +| efficientnet_b5 | PyTorch | Torchvision | +| efficientnet_b6 | TensorFlow | TensorFlow Hub | +| efficientnet_b6 | PyTorch | Torchvision | +| efficientnet_b7 | TensorFlow | TensorFlow Hub | +| efficientnet_b7 | PyTorch | Torchvision | +| googlenet | PyTorch | Torchvision | +| inception_v3 | TensorFlow | TensorFlow Hub | +| mnasnet0_5 | PyTorch | Torchvision | +| mnasnet1_0 | PyTorch | Torchvision | +| mobilenet_v2 | PyTorch | Torchvision | +| mobilenet_v2_100_224 | TensorFlow | TensorFlow Hub | +| mobilenet_v3_large | PyTorch | Torchvision | +| mobilenet_v3_small | PyTorch | Torchvision | +| nasnet_large | TensorFlow | TensorFlow Hub | +| proxyless_cpu | PyTorch | PyTorch Hub* | +| regnet_x_16gf | PyTorch | Torchvision | +| regnet_x_1_6gf | PyTorch | Torchvision | +| regnet_x_32gf | PyTorch | Torchvision | +| regnet_x_3_2gf | PyTorch | Torchvision | +| regnet_x_400mf | PyTorch | Torchvision | +| regnet_x_800mf | PyTorch | Torchvision | +| regnet_x_8gf | PyTorch | Torchvision | +| regnet_y_16gf | PyTorch | Torchvision | +| regnet_y_1_6gf | PyTorch | Torchvision | +| regnet_y_32gf | PyTorch | Torchvision | +| regnet_y_3_2gf | PyTorch | Torchvision | +| regnet_y_400mf | PyTorch | Torchvision | +| regnet_y_800mf | PyTorch | Torchvision | +| regnet_y_8gf | PyTorch | Torchvision | +| resnet101 | PyTorch | Torchvision | +| resnet152 | PyTorch | Torchvision | +| resnet18 | PyTorch | Torchvision | +| resnet18_ssl | PyTorch | PyTorch Hub | +| resnet18_swsl | PyTorch | PyTorch Hub | +| resnet34 | PyTorch | Torchvision | +| resnet50 | PyTorch | Torchvision | +| resnet50_ssl | PyTorch | PyTorch Hub | +| resnet50_swsl | PyTorch | PyTorch Hub | +| resnet_v1_50 | TensorFlow | 
TensorFlow Hub | +| resnet_v2_101 | TensorFlow | TensorFlow Hub | +| resnet_v2_50 | TensorFlow | TensorFlow Hub | +| resnext101_32x16d_ssl | PyTorch | PyTorch Hub | +| resnext101_32x16d_swsl | PyTorch | PyTorch Hub | +| resnext101_32x16d_wsl | PyTorch | PyTorch Hub | +| resnext101_32x32d_wsl | PyTorch | PyTorch Hub | +| resnext101_32x48d_wsl | PyTorch | PyTorch Hub | +| resnext101_32x4d_ssl | PyTorch | PyTorch Hub | +| resnext101_32x4d_swsl | PyTorch | PyTorch Hub | +| resnext101_32x8d | PyTorch | Torchvision | +| resnext101_32x8d_ssl | PyTorch | PyTorch Hub | +| resnext101_32x8d_swsl | PyTorch | PyTorch Hub | +| resnext101_32x8d_wsl | PyTorch | PyTorch Hub | +| resnext50_32x4d | PyTorch | Torchvision | +| resnext50_32x4d_ssl | PyTorch | PyTorch Hub | +| resnext50_32x4d_swsl | PyTorch | PyTorch Hub | +| shufflenet_v2_x0_5 | PyTorch | Torchvision | +| shufflenet_v2_x1_0 | PyTorch | Torchvision | +| vgg11 | PyTorch | Torchvision | +| vgg11_bn | PyTorch | Torchvision | +| vgg13 | PyTorch | Torchvision | +| vgg13_bn | PyTorch | Torchvision | +| vgg16 | PyTorch | Torchvision | +| vgg16_bn | PyTorch | Torchvision | +| vgg19 | PyTorch | Torchvision | +| vgg19_bn | PyTorch | Torchvision | +| vit_b_16 | PyTorch | Torchvision | +| vit_b_32 | PyTorch | Torchvision | +| vit_l_16 | PyTorch | Torchvision | +| vit_l_32 | PyTorch | Torchvision | +| wide_resnet101_2 | PyTorch | Torchvision | +| wide_resnet50_2 | PyTorch | Torchvision | +| ConvNeXtBase | TensorFlow | Keras* | +| ConvNeXtLarge | TensorFlow | Keras | +| ConvNeXtSmall | TensorFlow | Keras | +| ConvNeXtTiny | TensorFlow | Keras | +| ConvNeXtXLarge | TensorFlow | Keras | +| DenseNet121 | TensorFlow | Keras | +| DenseNet169 | TensorFlow | Keras | +| DenseNet201 | TensorFlow | Keras | +| EfficientNetV2B0 | TensorFlow | Keras | +| EfficientNetV2B1 | TensorFlow | Keras | +| EfficientNetV2B2 | TensorFlow | Keras | +| EfficientNetV2B3 | TensorFlow | Keras | +| EfficientNetV2L | TensorFlow | Keras | +| EfficientNetV2M | TensorFlow | Keras | +| EfficientNetV2S | TensorFlow | Keras | +| InceptionResNetV2 | TensorFlow | Keras | +| InceptionV3 | TensorFlow | Keras | +| MobileNet | TensorFlow | Keras | +| MobileNetV2 | TensorFlow | Keras | +| NASNetLarge | TensorFlow | Keras | +| NASNetMobile | TensorFlow | Keras | +| ResNet101 | TensorFlow | Keras | +| ResNet101V2 | TensorFlow | Keras | +| ResNet152 | TensorFlow | Keras | +| ResNet152V2 | TensorFlow | Keras | +| ResNet50 | TensorFlow | Keras | +| ResNet50V2 | TensorFlow | Keras | +| VGG16 | TensorFlow | Keras | +| VGG19 | TensorFlow | Keras | +| Xception | TensorFlow | Keras | + +## Text Classification + +| Model name | Framework | Model Hub | +|------------|-----------|-----------| +| bert-base-cased | PyTorch | Hugging Face* | +| bert-base-uncased | TensorFlow | Hugging Face | +| bert-large-uncased | TensorFlow | Hugging Face | +| bert-large-uncased | PyTorch | Hugging Face | +| clinical-bert | PyTorch | Hugging Face | +| distilbert-base-uncased | PyTorch | Hugging Face | +| google/bert_uncased_L-10_H-128_A-2 | TensorFlow | Hugging Face | +| google/bert_uncased_L-10_H-256_A-4 | TensorFlow | Hugging Face | +| google/bert_uncased_L-10_H-512_A-8 | TensorFlow | Hugging Face | +| google/bert_uncased_L-10_H-768_A-12 | TensorFlow | Hugging Face | +| google/bert_uncased_L-12_H-128_A-2 | TensorFlow | Hugging Face | +| google/bert_uncased_L-12_H-256_A-4 | TensorFlow | Hugging Face | +| google/bert_uncased_L-12_H-512_A-8 | TensorFlow | Hugging Face | +| google/bert_uncased_L-12_H-768_A-12 | TensorFlow | Hugging 
Face |
+| google/bert_uncased_L-2_H-128_A-2 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-2_H-256_A-4 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-2_H-512_A-8 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-2_H-768_A-12 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-4_H-128_A-2 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-4_H-256_A-4 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-4_H-512_A-8 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-4_H-768_A-12 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-6_H-128_A-2 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-6_H-256_A-4 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-6_H-512_A-8 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-6_H-768_A-12 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-8_H-128_A-2 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-8_H-256_A-4 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-8_H-512_A-8 | TensorFlow | Hugging Face |
+| google/bert_uncased_L-8_H-768_A-12 | TensorFlow | Hugging Face |
+
+## Image Anomaly Detection
+
+| Model name | Framework | Model Hub |
+|------------|-----------|-----------|
+| resnet101 | PyTorch | Torchvision |
+| resnet152 | PyTorch | Torchvision |
+| resnet18 | PyTorch | Torchvision |
+| resnet34 | PyTorch | Torchvision |
+| resnet50 | PyTorch | Torchvision |
+
diff --git a/README.md b/README.md
index 884641abca8382d0a85913c3dc2b76afe4102ff6..e158e9ff9133fc8a34c431132fd52e785590c39c 100644
--- a/README.md
+++ b/README.md
@@ -1,14 +1,98 @@
----
-title: Quality Control Inspector
-emoji: 📈
-colorFrom: green
-colorTo: green
-sdk: gradio
-sdk_version: 5.41.1
-app_file: app.py
-pinned: false
-license: apache-2.0
-short_description: Quality control automation using self-supervised anomaly det
----
-
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+*Note: You may find it easier to read about the Intel Transfer Learning Tool, follow the Get
+Started guide, and browse the API material at our published documentation site
+https://intelai.github.io/transfer-learning.*
+
+
+
+# Intel® Transfer Learning Tool
+
+Transfer learning workflows use the knowledge learned by a pre-trained model on
+a large dataset to improve performance on a related problem with a smaller
+dataset.
+
+## What is Intel® Transfer Learning Tool
+
+Intel® Transfer Learning Tool makes it easier and faster for you to
+create transfer learning workflows across a variety of AI use cases. Its
+open-source Python\* library leverages public pretrained model hubs,
+Intel-optimized deep learning frameworks, and your custom dataset to efficiently
+generate new models optimized for Intel hardware.
+
+This project documentation provides information, resource links, and instructions for the Intel
+Transfer Learning Tool as well as Jupyter\* notebooks and examples that
+demonstrate its usage.
+ +**Features:** +* Supports PyTorch\* and TensorFlow\* +* Select from over [100 image classification and text classification models](Models.md) from + Torchvision, PyTorch Hub, TensorFlow Hub, Keras, and Hugging Face +* Use your own custom dataset or get started quickly with built-in datasets +* Automatically create a trainable classification layer customized for your dataset +* Pre-process your dataset using scaling, cropping, batching, and splitting +* Use APIs for prediction, evaluation, and benchmarking +* Export your model for deployment or resume training from checkpoints + +**Intel Optimizations:** +* Boost performance with Intel® Optimization for TensorFlow and Intel® Extension for PyTorch +* Quantize to INT8 to reduce model size and speed up inference using Intel® Neural Compressor +* Optimize model for FP32 inference using Intel Neural Compressor +* Reduce training time with auto-mixed precision for select hardware platforms +* Further reduce training time with multinode training for PyTorch + +## How the Intel Transfer Learning Tool Works + +The Intel Transfer Learning Tool lets you train AI models with TensorFlow or +PyTorch using either no-code command line interface (CLI) commands at a bash +prompt, or low-code application programming interface (API) calls from a Python +script. + +Use your own dataset or select an existing image or text classification dataset listed in the +[public datasets](DATASETS.md) documentation. Construct your own CLI or API commands for training, evaluation, +and optimization using the TensorFlow or PyTorch framework, and finally export +your saved model optimized for inference on Intel CPUs. + +An overview of the Intel Transfer Learning Tool flow is shown in this +figure: + +
+Intel Transfer Learning Tool Flow
+
+## Get Started
+
+The [Get Started](GetStarted.md) guide walks you through the steps to check
+system requirements, install, and then run the tool with a couple of examples
+showing no-code CLI and low-code API approaches. After that, you can check out
+these additional CLI and API [Examples](examples/README.md).
+
+
+As described in the [Get Started](GetStarted.md) guide, once you have a Python
+3.9 environment set up, you do a basic install of the Intel Transfer Learning
+Tool using:
+
+```
+pip install intel-transfer-learning-tool
+```
+
+Then you can use the Transfer Learning Tool CLI (`tlt`) to train a
+TensorFlow image classification model (resnet_v1_50), download and use an
+existing built-in dataset (tf_flowers), and save the trained model to
+`/tmp/output` using this one command:
+
+```
+tlt train --framework tensorflow --model-name resnet_v1_50 --dataset-name tf_flowers \
+    --output-dir /tmp/output --dataset-dir /tmp/data
+```
+
+Use `tlt --help` to see the list of CLI commands. More detailed help for each
+command can be found using, for example, `tlt train --help`.
+
+
+
+## Support
+
+The Intel Transfer Learning Tool team tracks bugs and enhancement requests using
+[GitHub issues](https://github.com/IntelAI/transfer-learning/issues). Before submitting a
+suggestion or bug report, search the existing GitHub issues to see if your issue has already been reported.
+
+See [Legal Information](Legal.md) for Disclaimers, Trademark, and Licensing information.
diff --git a/SECURITY.md b/SECURITY.md
new file mode 100644
index 0000000000000000000000000000000000000000..556938bdea39190bb47c2cb1e33109301b11e454
--- /dev/null
+++ b/SECURITY.md
@@ -0,0 +1,12 @@
+# Security Policy
+
+## Report a Vulnerability
+
+Please report security issues or vulnerabilities to the [Intel® Security Center].
+
+For more information on how Intel® works to resolve security issues, see
+[Vulnerability Handling Guidelines].
+
+[Intel® Security Center]:https://www.intel.com/content/www/us/en/security-center/default.html
+
+[Vulnerability Handling Guidelines]:https://www.intel.com/content/www/us/en/security-center/vulnerability-handling-guidelines.html
diff --git a/_config.yml b/_config.yml
new file mode 100644
index 0000000000000000000000000000000000000000..fff4ab923ce55f11569939421ffa39cd3566f5d9
--- /dev/null
+++ b/_config.yml
@@ -0,0 +1 @@
+theme: jekyll-theme-minimal
diff --git a/api.md b/api.md
new file mode 100644
index 0000000000000000000000000000000000000000..a936a4da26b02ef4e908928c25c8144a2618c03e
--- /dev/null
+++ b/api.md
@@ -0,0 +1,4 @@
+# API Reference
+
+Low-code Python\* API documentation is automatically generated from the code and
+appears in the Transfer Learning Tool documentation website's [API](https://intelai.github.io/transfer-learning/main/api.html) page.
diff --git a/bandit.yaml b/bandit.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..d7a1dd00122650038aa096642b9c7178c464f9c1
--- /dev/null
+++ b/bandit.yaml
@@ -0,0 +1,11 @@
+# FILE: bandit.yaml
+exclude_dirs: [ '.venv', '.tox', 'tlt_test_venv', 'tlt_notebook_venv', 'tests' ]
+skips: [ 'B301', 'B311', 'B403', 'B404' ]
+# B301 - dill usage scope is different from what's described in CWE-502.
+#   dill is mostly used for dumping/saving models to disk (serialization).
+#   When loading previously saved models from disk (deserialization), either the
+#   Keras model loader or the PyTorch loader is used first to verify the model,
+#   and then a copy is created to be passed to dill for loading.
+# B311 - random usage scope is different from what's described in CWE-330
+# B403 - this is reported every time 'dill' is imported, so it's covered by the B301 justification
+# B404 - this is reported every time 'subprocess' is imported, but the module is not used as described in CWE-78
diff --git a/cli.md b/cli.md
new file mode 100644
index 0000000000000000000000000000000000000000..8b41a5919fd49c86ce9fbd2c22f8a98244f0161b
--- /dev/null
+++ b/cli.md
@@ -0,0 +1,4 @@
+# CLI Reference
+
+No-code bash CLI documentation is automatically generated from the code and
+appears in the Transfer Learning Tool documentation website's [CLI](https://intelai.github.io/transfer-learning/main/cli.html) page.
diff --git a/docker/Dockerfile b/docker/Dockerfile
new file mode 100644
index 0000000000000000000000000000000000000000..c093d932c114e42e6182d098ce3225091b02c20a
--- /dev/null
+++ b/docker/Dockerfile
@@ -0,0 +1,143 @@
+#
+# Copyright (c) 2023 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# SPDX-License-Identifier: Apache-2.0
+
+ARG IMAGE_NAME=ubuntu
+ARG IMAGE_TAG=22.04
+FROM ${IMAGE_NAME}:${IMAGE_TAG} as base
+
+# TLT base target
+FROM base as tlt-base
+
+ARG PYTHON=python3
+
+ENV DEBIAN_FRONTEND=noninteractive
+
+RUN apt-get update && apt-get install -y --no-install-recommends --fix-missing \
+    libgl1 \
+    libglib2.0-0 \
+    ${PYTHON} \
+    python3-pip && \
+    apt-get clean autoclean && \
+    apt-get autoremove -y && \
+    rm -rf /var/lib/apt/lists/*
+
+RUN ln -sf "$(which ${PYTHON})" /usr/bin/python
+
+# TLT target for GitHub actions
+FROM tlt-base as tlt-ci
+
+ENV DEBIAN_FRONTEND=noninteractive
+
+ENV LANG C.UTF-8
+ARG PYTHON=python3
+
+RUN apt-get update && apt-get install -y --no-install-recommends --fix-missing \
+    ${PYTHON}-dev \
+    ${PYTHON}-distutils \
+    build-essential \
+    ca-certificates \
+    make \
+    pandoc && \
+    apt-get clean autoclean && \
+    apt-get autoremove -y && \
+    rm -rf /var/lib/apt/lists/*
+
+RUN ${PYTHON} -m pip install virtualenv
+
+# TLT target for development
+FROM tlt-ci as tlt-devel
+
+COPY . /tmp/intel-transfer-learning
+
+WORKDIR /tmp/intel-transfer-learning
+
+RUN ${PYTHON} setup.py bdist_wheel && \
+    pip install --no-cache-dir -f https://download.pytorch.org/whl/cpu/torch_stable.html dist/*.whl
+
+# TLT target for deployment
+FROM tlt-base as tlt-prod
+
+COPY --from=tlt-devel /usr/local/lib/python3.10/dist-packages /usr/local/lib/python3.10/dist-packages
+COPY --from=tlt-devel /usr/local/bin /usr/local/bin
+
+ENV DATASET_DIR=/tmp/data
+ENV OUTPUT_DIR=/tmp/output
+
+# TLT target for running with MPI
+FROM tlt-prod as tlt-mpi
+
+RUN apt-get update && apt-get install -y --no-install-recommends --fix-missing \
+    libopenmpi-dev \
+    openmpi-bin \
+    openmpi-common \
+    openssh-client \
+    openssh-server && \
+    apt-get clean autoclean && \
+    apt-get autoremove -y && \
+    rm -rf /var/lib/apt/lists/*
+
+# Create a wrapper for OpenMPI to allow running as root by default
+RUN mv /usr/bin/mpirun /usr/bin/mpirun.real && \
+    echo '#!/bin/bash' > /usr/bin/mpirun && \
+    echo 'mpirun.real --allow-run-as-root "$@"' >> /usr/bin/mpirun && \
+    chmod a+x /usr/bin/mpirun
+
+# Configure OpenMPI to run with good defaults:
+RUN echo "btl_tcp_if_exclude = lo,docker0" >> /etc/openmpi/openmpi-mca-params.conf
+
+# Install OpenSSH for MPI to communicate between containers and allow OpenSSH to
+# talk to containers without asking for confirmation
+RUN mkdir -p /var/run/sshd && \
+    cat /etc/ssh/ssh_config | grep -v StrictHostKeyChecking > /etc/ssh/ssh_config.new && \
+    echo "    StrictHostKeyChecking no" >> /etc/ssh/ssh_config.new && \
+    mv /etc/ssh/ssh_config.new /etc/ssh/ssh_config
+
+# TLT target with MPI, Horovod, and all development tools
+FROM tlt-mpi as tlt-dist-devel
+
+ARG HOROVOD_WITH_PYTORCH=1
+ARG HOROVOD_WITHOUT_MXNET=1
+ARG HOROVOD_WITH_TENSORFLOW=1
+ARG HOROVOD_VERSION
+
+ARG PYTHON=python3
+
+RUN apt-get update && apt-get install -y --no-install-recommends --fix-missing \
+    build-essential \
+    cmake \
+    g++ \
+    gcc \
+    git \
+    ${PYTHON}-dev && \
+    apt-get clean && \
+    rm -rf /var/lib/apt/lists/*
+
+RUN python -m pip install --no-cache-dir horovod==${HOROVOD_VERSION}
+
+ARG ONECCL_VERSION
+ARG ONECCL_URL=https://developer.intel.com/ipex-whl-stable-cpu
+
+RUN python -m pip install --no-cache-dir oneccl_bind_pt==${ONECCL_VERSION} -f ${ONECCL_URL}
+
+COPY . /tmp/intel-transfer-learning
+
+WORKDIR /tmp/intel-transfer-learning
+
+FROM tlt-mpi as tlt-dist-prod
+
+# Note: ARG values are not inherited across build stages, so use an explicit
+# Python version here; ${PYTHON} would expand to an empty string in this stage.
+COPY --from=tlt-dist-devel /usr/local/lib/python3.10/dist-packages /usr/local/lib/python3.10/dist-packages
+COPY --from=tlt-dist-devel /usr/local/bin /usr/local/bin
diff --git a/docker/README.md b/docker/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..cdd8121774c788d3798dbdc3d4ab5b5a3a577a10
--- /dev/null
+++ b/docker/README.md
@@ -0,0 +1,73 @@
+# Docker
+Follow these instructions to set up and run our provided Docker image.
+
+## Set Up Docker Engine and Docker Compose
+You'll need to install Docker Engine on your development system. Note that while **Docker Engine** is free to use, **Docker Desktop** may require you to purchase a license. See the [Docker Engine Server installation instructions](https://docs.docker.com/engine/install/#server) for details.
+
+To build and run this workload inside a Docker container, ensure you have Docker Compose installed on your machine. If you don't have this tool installed, consult the official [Docker Compose installation documentation](https://docs.docker.com/compose/install/linux/#install-the-plugin-manually). For example, to install the Compose plugin manually:
+
+```bash
+DOCKER_CONFIG=${DOCKER_CONFIG:-$HOME/.docker}
+mkdir -p $DOCKER_CONFIG/cli-plugins
+curl -SL https://github.com/docker/compose/releases/download/v2.7.0/docker-compose-linux-x86_64 -o $DOCKER_CONFIG/cli-plugins/docker-compose
+chmod +x $DOCKER_CONFIG/cli-plugins/docker-compose
+docker compose version
+```
+
+## Set Up Docker Image
+Build or pull the provided Docker images.
+
+```bash
+cd docker
+docker compose build
+```
+OR
+```bash
+docker pull intel/ai-tools:tlt-0.5.0
+docker pull intel/ai-tools:tlt-devel-0.5.0
+docker pull intel/ai-tools:tlt-dist-0.5.0
+docker pull intel/ai-tools:tlt-dist-devel-0.5.0
+```
+
+## Use Docker Image
+Use the TLT CLI without installing it by running the provided Docker image with Docker Compose.
+
+```bash
+docker compose run tlt-prod
+# OR
+docker compose run tlt-prod tlt --help
+```
+
+## Kubernetes
+### 1. Install Helm
+- Install [Helm](https://helm.sh/docs/intro/install/)
+```bash
+curl -fsSL -o get_helm.sh https://raw.githubusercontent.com/helm/helm/main/scripts/get-helm-3 && \
+chmod 700 get_helm.sh && \
+./get_helm.sh
+```
+### 2. Set Up the Training Operator
+Install the standalone operator from GitHub or use a pre-existing Kubeflow configuration.
+```bash
+kubectl apply -k "github.com/kubeflow/training-operator/manifests/overlays/standalone"
+```
+OR
+```bash
+helm repo add cowboysysop https://cowboysysop.github.io/charts/
+helm install training-operator cowboysysop/training-operator
+```
+### 3. Deploy the TLT Distributed Job
+For more customization information, see the chart [README](./chart/README.md).
+```bash
+export NAMESPACE=kubeflow
+helm install --namespace ${NAMESPACE} --set ... tlt-distributed ./docker/chart
+```
+### 4. View Progress
+To view your workflow's progress:
+```bash
+kubectl get -o yaml mpijob tf-tlt-distributed -n ${NAMESPACE}
+```
+OR
+```bash
+kubectl logs tf-tlt-distributed-launcher -n ${NAMESPACE}
+```
diff --git a/docker/chart/.helmignore b/docker/chart/.helmignore
new file mode 100644
index 0000000000000000000000000000000000000000..0e8a0eb36f4ca2c939201c0d54b5d82a1ea34778
--- /dev/null
+++ b/docker/chart/.helmignore
@@ -0,0 +1,23 @@
+# Patterns to ignore when building packages.
+# This supports shell glob matching, relative path matching, and
+# negation (prefixed with !). Only one pattern per line.
+.DS_Store
+# Common VCS dirs
+.git/
+.gitignore
+.bzr/
+.bzrignore
+.hg/
+.hgignore
+.svn/
+# Common backup files
+*.swp
+*.bak
+*.tmp
+*.orig
+*~
+# Various IDEs
+.project
+.idea/
+*.tmproj
+.vscode/
diff --git a/docker/chart/Chart.yaml b/docker/chart/Chart.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..24e0665278b03ec08ee6017557057f663e2c42e6
--- /dev/null
+++ b/docker/chart/Chart.yaml
@@ -0,0 +1,24 @@
+apiVersion: v2
+# Chart names must be lowercase letters, numbers, and hyphens
+name: tlt-tf-distributed-training
+description: A Helm chart for Kubernetes
+
+# A chart can be either an 'application' or a 'library' chart.
+#
+# Application charts are a collection of templates that can be packaged into versioned archives
+# to be deployed.
+#
+# Library charts provide useful utilities or functions for the chart developer. They're included as
+# a dependency of application charts to inject those utilities and functions into the rendering
+# pipeline. Library charts do not define any templates and therefore cannot be deployed.
+type: application
+
+# This is the chart version. This version number should be incremented each time you make changes
+# to the chart and its templates, including the app version.
+# Versions are expected to follow Semantic Versioning (https://semver.org/)
+version: 0.2.0
+
+# This is the version number of the application being deployed. This version number should be
+# incremented each time you make changes to the application. Versions are not expected to
+# follow Semantic Versioning. They should reflect the version the application is using.
+# It is recommended to use it with quotes.
+appVersion: "1.16.0"
diff --git a/docker/chart/README.md b/docker/chart/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..c2ca7a49409fcac9867154c1bf47a5d8bd00174b
--- /dev/null
+++ b/docker/chart/README.md
@@ -0,0 +1,31 @@
+# TLT TF Distributed Training
+
+![Version: 0.2.0](https://img.shields.io/badge/Version-0.2.0-informational?style=flat-square) ![Type: application](https://img.shields.io/badge/Type-application-informational?style=flat-square) ![AppVersion: 1.16.0](https://img.shields.io/badge/AppVersion-1.16.0-informational?style=flat-square)
+
+A Helm chart for Kubernetes
+
+## Values
+
+| Key | Type | Default | Description |
+|-----|------|---------|-------------|
+| batchDenom | int | `1` | Batch denominator used to divide the global batch size |
+| batchSize | int | `128` | Global batch size to distribute across processes |
+| datasetName | string | `"cifar10"` | Dataset name to load from tfds |
+| epochs | int | `1` | Total epochs to train the model |
+| imageName | string | `"intel/ai-tools"` |  |
+| imageTag | string | `"0.5.0-dist-devel"` |  |
+| metadata.name | string | `"tlt-distributed"` |  |
+| metadata.namespace | string | `"kubeflow"` |  |
+| modelName | string | `"https://tfhub.dev/google/efficientnet/b1/feature-vector/1"` | TF Hub or Hugging Face model URL |
+| pvcName | string | `"tlt"` |  |
+| pvcResources.data | string | `"2Gi"` | Amount of storage for the dataset |
+| pvcResources.output | string | `"1Gi"` | Amount of storage for the output directory |
+| pvcScn | string | `"nil"` | PVC `StorageClassName` |
+| resources.cpu | int | `2` | Number of CPUs for the launcher |
+| resources.memory | string | `"4Gi"` | Amount of memory for the launcher |
+| scaling | string | `"strong"` | For `weak` scaling, `lr` is scaled by a factor of `sqrt(batch_size/batch_denom)` and every process uses the global batch size. For `strong` scaling, `lr` is scaled by the world size and the global batch size is divided by the world size |
+| slotsPerWorker | int | `1` | Number of processes per worker |
+| useCase | string | `"image_classification"` | Use case (`image_classification` \| `text_classification`) |
+| workerResources.cpu | int | `4` | Number of CPUs per worker |
+| workerResources.memory | string | `"8Gi"` | Amount of memory per worker |
+| workers | int | `4` | Number of workers |
diff --git a/docker/chart/templates/mpijob.yaml b/docker/chart/templates/mpijob.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..5e54854b497bc52ba8ae09c21938d23a946d3df9
--- /dev/null
+++ b/docker/chart/templates/mpijob.yaml
@@ -0,0 +1,92 @@
+apiVersion: kubeflow.org/v1
+kind: MPIJob
+metadata:
+  name: tf-{{ .Values.metadata.name }}
+  namespace: {{ .Values.metadata.namespace }}
+spec:
+  slotsPerWorker: {{ .Values.slotsPerWorker }}
+  runPolicy:
+    cleanPodPolicy: None
+  mpiReplicaSpecs:
+    Launcher:
+      replicas: 1
+      template:
+        spec:
+          hostIPC: true
+          containers:
+          - image: "{{ .Values.imageName }}:{{ .Values.imageTag }}"
+            name: mpi
+            command:
+            - horovodrun
+            args:
+            - --verbose
+            - -np
+            - "{{ .Values.workers }}"
+            - --hostfile
+            - /etc/mpi/hostfile
+            - python
+            - /tmp/intel-transfer-learning/tlt/distributed/tensorflow/run_train_tf.py
+            - --batch_denom
+            - "{{ .Values.batchDenom }}"
+            - --batch_size
+            - "{{ .Values.batchSize }}"
+            - --dataset-dir
+            - /tmp/data
+            - --dataset-name
+            - {{ .Values.datasetName }}
+            - --epochs
+            - "{{ .Values.epochs }}"
+            - --model-name
+            - {{ .Values.modelName }}
+            - --output-dir
+            - /tmp/output
+            - --scaling
+            - "{{ .Values.scaling }}"
+            - --shuffle
+            - --use-case
+            - {{ .Values.useCase }}
+            resources:
+              limits:
+                cpu: {{ .Values.resources.cpu }}
+                memory: {{ .Values.resources.memory }}
+            volumeMounts:
+            - name: dataset-dir
+              mountPath: /tmp/data
+            - name: output-dir
+              mountPath: /tmp/output
+          volumes:
+          - name: dshm
+            emptyDir:
+              medium: Memory
+          - name: dataset-dir
+            persistentVolumeClaim:
+              claimName: "{{ .Values.pvcName }}-data"
+          - name: output-dir
+            persistentVolumeClaim:
+              claimName: "{{ .Values.pvcName }}-output"
+    Worker:
+      replicas: {{ .Values.workers }}
+      template:
+        spec:
+          containers:
+          - image: "{{ .Values.imageName }}:{{ .Values.imageTag }}"
+            name: mpi
+            resources:
+              limits:
+                cpu: {{ .Values.workerResources.cpu }}
+                memory: {{ .Values.workerResources.memory }}
+            volumeMounts:
+            - name: dataset-dir
+              mountPath: /tmp/data
+            - name: output-dir
+              mountPath: /tmp/output
+          volumes:
+          - name: dshm
+            emptyDir:
+              medium: Memory
+          - name: dataset-dir
+            persistentVolumeClaim:
+              claimName: "{{ .Values.pvcName }}-data"
+          - name: output-dir
+            persistentVolumeClaim:
+              claimName: "{{ .Values.pvcName }}-output"
diff --git a/docker/chart/templates/pvc.yaml b/docker/chart/templates/pvc.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..dcafcf6817374812ef72a7abbbcec9a0a81da9c6
--- /dev/null
+++ b/docker/chart/templates/pvc.yaml
@@ -0,0 +1,25 @@
+apiVersion: v1
+kind: PersistentVolumeClaim
+metadata:
+  name: {{ .Values.pvcName }}-data
+  namespace: {{ .Values.metadata.namespace }}
+spec:
+  storageClassName: {{ .Values.pvcScn }}
+  accessModes:
+    - "ReadWriteOnce"
+  resources:
+    requests:
+      storage: {{ .Values.pvcResources.data }}
+---
+apiVersion: v1
+kind: PersistentVolumeClaim
+metadata:
+  name: {{ .Values.pvcName }}-output
+  namespace: {{ .Values.metadata.namespace }}
+spec:
+  storageClassName: {{ .Values.pvcScn }}
+  accessModes:
+    - "ReadWriteOnce"
+  resources:
+    requests:
+      storage: {{ .Values.pvcResources.output }}
diff --git a/docker/chart/values.yaml b/docker/chart/values.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..45fe27ae6639b5d25dd2c8261f0a8cedd55cf838
--- /dev/null
+++ b/docker/chart/values.yaml
@@ -0,0 +1,28 @@
+metadata:
+  name: tlt-distributed
+  namespace: kubeflow
+
+imageName: intel/ai-tools
+imageTag: 0.5.0-dist-devel
+
+batchDenom: 1
+batchSize: 128
+datasetName: cifar10
+epochs: 1
+modelName: https://tfhub.dev/google/efficientnet/b1/feature-vector/1
+scaling: strong
+slotsPerWorker: 1
+useCase: image_classification
+workers: 4
+
+pvcName: tlt
+pvcScn: nil
+pvcResources:
+  data: 2Gi
+  output: 1Gi
+resources:
+  cpu: 2
+  memory: 4Gi
+workerResources:
+  cpu: 4
+  memory: 8Gi
diff --git a/docker/docker-compose.yml b/docker/docker-compose.yml
new file mode 100644
index 0000000000000000000000000000000000000000..4c1cbc805c5fca455f91a42b809ff6dbb75a0329
--- /dev/null
+++ b/docker/docker-compose.yml
@@ -0,0 +1,54 @@
+version: "3"
+services:
+  tlt-devel:
+    build:
+      args:
+        http_proxy: ${http_proxy}
+        https_proxy: ${https_proxy}
+        no_proxy: ""
+        IMAGE_NAME: ubuntu
+        IMAGE_TAG: 22.04
+        PYTHON: python3.10 # Version must be specified for prod
+      context: ../
+      dockerfile: ./docker/Dockerfile
+      target: tlt-devel
+    image: intel/ai-tools:tlt-devel-latest
+    pull_policy: always
+  tlt-prod:
+    extends:
+      service: tlt-devel
+    build:
+      args:
+        DATASET_DIR: /tmp/data
+        OUTPUT_DIR: /tmp/output
+      target: tlt-prod
+    image: intel/ai-tools:tlt-prod-latest
+    volumes:
+      - /${DATASET_DIR:-$PWD/../data}:/tmp/data
+      - /${OUTPUT_DIR:-$PWD/../output}:/tmp/output
+  tlt-dist-devel:
+    extends:
+      service: tlt-prod
+    build:
+      args:
+        HOROVOD_VERSION: 0.28.0
+        ONECCL_VERSION: 2.0.0
+        ONECCL_URL: https://developer.intel.com/ipex-whl-stable-cpu
+      target: tlt-dist-devel
+    image: intel/ai-tools:tlt-dist-devel-latest
+  tlt-dist-prod:
+    extends:
+      service: tlt-dist-devel
+    build:
+      target: tlt-dist-prod
+    command: |
+      tlt train -f tensorflow
+      --dataset-name cifar10
+      --model-name resnet_v1_50
+      --dataset-dir /tmp/data
+      --output-dir /tmp/output
+    environment:
+      http_proxy: ${http_proxy}
+      https_proxy: ${https_proxy}
+      no_proxy: ${no_proxy}
+    image: intel/ai-tools:tlt-dist-prod-latest
diff --git a/docs/.gitignore b/docs/.gitignore
new file mode 100644
index 0000000000000000000000000000000000000000..0918c9768895c23af5ecf35282391d7b12ed301a
--- /dev/null
+++ b/docs/.gitignore
@@ -0,0 +1 @@
+markdown
diff --git a/docs/DATASETS.rst b/docs/DATASETS.rst
new file mode 100644
index 0000000000000000000000000000000000000000..fa73e6f958343ccf1184ac8ad4e2585b1f38c08e
--- /dev/null
+++ b/docs/DATASETS.rst
@@ -0,0 +1,4 @@
+:orphan:
+
+.. include:: ../DATASETS.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/GetStarted.rst b/docs/GetStarted.rst
new file mode 100644
index 0000000000000000000000000000000000000000..a30052eb3269c69d8db37ca27f2b931ac15d0419
--- /dev/null
+++ b/docs/GetStarted.rst
@@ -0,0 +1,2 @@
+.. include:: ../GetStarted.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/Legal.rst b/docs/Legal.rst
new file mode 100644
index 0000000000000000000000000000000000000000..0bdc11ee5a7620a867da960c92dbf5add75e38a6
--- /dev/null
+++ b/docs/Legal.rst
@@ -0,0 +1,2 @@
+.. include:: ../Legal.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/Makefile b/docs/Makefile
new file mode 100644
index 0000000000000000000000000000000000000000..88499e06e60ee5449598e8a558b2388459051ad2
--- /dev/null
+++ b/docs/Makefile
@@ -0,0 +1,43 @@
+#
+# Copyright (c) 2022 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# SPDX-License-Identifier: Apache-2.0
+#
+
+# Minimal makefile for Sphinx documentation
+#
+
+# You can set these variables from the command line, and also
+# from the environment for the first two.
+SPHINXOPTS    ?=
+SPHINXBUILD   ?= sphinx-build
+SOURCEDIR     = .
+BUILDDIR      = _build
+
+# Put it first so that "make" without argument is like "make help".
+help:
+	@$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O)
+
+.PHONY: help Makefile
+
+# Catch-all target: route all unknown targets to Sphinx using the new
+# "make mode" option. $(O) is meant as a shortcut for $(SPHINXOPTS).
+%: Makefile
+	@$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O)
+
+LISTEN_IP ?= 127.0.0.1
+LISTEN_PORT ?= 9999
+serve:
+	@python -m http.server --directory ./_build/html ${LISTEN_PORT} --bind ${LISTEN_IP}
diff --git a/docs/Models.rst b/docs/Models.rst
new file mode 100644
index 0000000000000000000000000000000000000000..0a55d827ec140a4fe6282719bc9b6b50f749e251
--- /dev/null
+++ b/docs/Models.rst
@@ -0,0 +1,2 @@
+.. include:: ../Models.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/README.md b/docs/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..88fe2cdb5e81816cbd796fb0a80a084378d343e7
--- /dev/null
+++ b/docs/README.md
@@ -0,0 +1,58 @@
+# Building Documentation
+
+## Sphinx Documentation
+
+Install `tlt` and its dependencies for developers as described in the [Get Started](/GetStarted) guide.
+```bash
+# Run these commands from the root of the project
+python3 -m virtualenv tlt_dev_venv
+source tlt_dev_venv/bin/activate
+python -m pip install --editable .
+```
+
+Install Pandoc, Sphinx, and a few other tools required to build the docs:
+```bash
+sudo apt-get install pandoc
+pip install -r docs/requirements-docs.txt
+```
+
+Navigate to the `docs` directory and run the doctests to ensure all tests pass:
+```bash
+# run this command from within the docs directory
+make doctest
+```
+
+This should produce output similar to:
+```bash
+Doctest summary
+===============
+    6 tests
+    0 failures in tests
+    0 failures in setup code
+    0 failures in cleanup code
+build succeeded.
+```
+
+Finally, generate the HTML docs (from within the `docs` directory):
+```bash
+make clean html
+```
+
+The output HTML files will be located in `transfer-learning/docs/_build/html`.
+
+To start a local HTTP server and view the docs locally, try:
+```bash
+make serve
+Serving HTTP on 127.0.1.1 port 9999 (http://127.0.1.1:9999/) ...
+```
+
+If you need to view the docs from another machine, try either port forwarding or
+providing appropriate values for the `LISTEN_IP`/`LISTEN_PORT` arguments.
+For example:
+```bash
+LISTEN_IP=0.0.0.0 make serve
+Serving HTTP on 0.0.0.0 port 9999 (http://0.0.0.0:9999/) ...
+```
+
+This runs the docs server on the host while listening on all network interfaces.
+Now you can navigate to `HOSTNAME:9999` to view the docs.
diff --git a/docs/_static/tlt-custom.css b/docs/_static/tlt-custom.css
new file mode 100644
index 0000000000000000000000000000000000000000..f0e1c0f33567cde2cdfc83606bc93653b20b2a23
--- /dev/null
+++ b/docs/_static/tlt-custom.css
@@ -0,0 +1,43 @@
+/* allow the page to use more of the window width */
+.wy-nav-content {
+  max-width: 1100px;
+}
+
+/* allow text wrapping in a table to avoid table horizontal scrolling */
+.wy-table-responsive table td, .wy-table-responsive table th {
+  white-space: normal !important;
+}
+
+/* center all images */
+.rst-content img {
+  margin-left: auto;
+  margin-right: auto;
+  display: block;
+}
+
+/* add an underline to title headings and wrap long API headings
+ * Note: we use JavaScript to add a zero-width space after the dot
+ * in really long H1 titles created automatically from the code */
+.rst-content h1,h2,h3,h4,h5 {
+  text-decoration: underline;
+  word-wrap: break-word;
+}
+
+/* add link color to module xref generated by autodoc */
+.rst-content a.internal code.xref span.pre {
+  color: #2980b9;
+}
+
+/* change red text color to dark gray in code literals */
+.rst-content code.literal, .rst-content tt.literal {
+  color: #404040;
+}
+
+/* change background color of search area/site title to increase contrast */
+.wy-side-nav-search {
+  background-color: #2f71b2;
+}
+/* change href link color to increase contrast */
+a {
+  color: #2f71b2;
+}
diff --git a/docs/_static/tlt-custom.js b/docs/_static/tlt-custom.js
new file mode 100644
index 0000000000000000000000000000000000000000..70536ffcf42ec180326244f9ca47648e65cdbc69
--- /dev/null
+++ b/docs/_static/tlt-custom.js
@@ -0,0 +1,19 @@
+/* Extra tlt-specific javascript */
+
+$(document).ready(function(){
+
+    /* open external links in a new tab */
+    $('a[class*=external]').attr({target: '_blank', rel: 'noopener'});
+
+    /* add word break points (zero-width space) after a period in really long titles */
+    $('h1').html(function(index, html){
+        return html.replace(/\./g, '.\u200B');
+    });
+
+    /* copy image alt tags to title so the browser shows hover tool tip text
+     * (Looks like the myst-parser isn't passing the title tag through to Sphinx,
+     * but is passing the alt tag) */
+    $("img[alt]").each(function(){
+        $(this).attr('title', $(this).attr('alt'));
+    });
+});
diff --git a/docs/_templates/footer.html b/docs/_templates/footer.html
new file mode 100644
index 0000000000000000000000000000000000000000..c159a811f98dd8201f2ed2045c4556a7089fe697
--- /dev/null
+++ b/docs/_templates/footer.html
@@ -0,0 +1,5 @@
+{% extends '!footer.html' %}
+{% block extrafooter %}
+*Other names and brands may be claimed as the property of others.
+Trademarks
+{% endblock %}
diff --git a/docs/api.rst b/docs/api.rst
new file mode 100644
index 0000000000000000000000000000000000000000..97694e119ea1a132a1bbc3f6035fdba2e762886a
--- /dev/null
+++ b/docs/api.rst
@@ -0,0 +1,132 @@
+API Reference
+=============
+
+Datasets
+--------
+
+.. currentmodule:: tlt.datasets
+
+The simplest way to create datasets is with the dataset factory methods :meth:`load_dataset`, for using a
+custom dataset, and :meth:`get_dataset`, for downloading and using a third-party dataset from a catalog such as TensorFlow
+Datasets or Torchvision.
+
+Factory Methods
+***************
+
+.. automodule:: tlt.datasets.dataset_factory
+   :members: load_dataset, get_dataset
+
+Class Reference
+***************
+
+Image Classification
+^^^^^^^^^^^^^^^^^^^^
+
+.. currentmodule:: tlt.datasets.image_classification
+
+.. autosummary::
+   :toctree: _autosummary
+   :nosignatures:
+
+   tfds_image_classification_dataset.TFDSImageClassificationDataset
+   torchvision_image_classification_dataset.TorchvisionImageClassificationDataset
+   tf_custom_image_classification_dataset.TFCustomImageClassificationDataset
+   pytorch_custom_image_classification_dataset.PyTorchCustomImageClassificationDataset
+   image_classification_dataset.ImageClassificationDataset
+
+Text Classification
+^^^^^^^^^^^^^^^^^^^
+
+.. currentmodule:: tlt.datasets.text_classification
+
+.. autosummary::
+   :toctree: _autosummary
+   :nosignatures:
+
+   tfds_text_classification_dataset.TFDSTextClassificationDataset
+   hf_text_classification_dataset.HFTextClassificationDataset
+   tf_custom_text_classification_dataset.TFCustomTextClassificationDataset
+   hf_custom_text_classification_dataset.HFCustomTextClassificationDataset
+   text_classification_dataset.TextClassificationDataset
+
+Base Classes
+^^^^^^^^^^^^
+
+.. note:: Users should rarely need to interact directly with these.
+
+.. currentmodule:: tlt.datasets
+
+.. autosummary::
+   :toctree: _autosummary
+   :nosignatures:
+
+   pytorch_dataset.PyTorchDataset
+   tf_dataset.TFDataset
+   hf_dataset.HFDataset
+   dataset.BaseDataset
+
+Models
+------
+
+.. currentmodule:: tlt.models
+
+Discover and work with available models by using model factory methods. The :meth:`get_model` function will download
+third-party models, while the :meth:`load_model` function will load a custom model, from either a path location or a
+model object in memory. The model discovery and inspection methods are :meth:`get_supported_models` and
+:meth:`print_supported_models`.
+
+Factory Methods
+***************
+
+.. automodule:: tlt.models.model_factory
+   :members: get_model, load_model, get_supported_models, print_supported_models
+
+Class Reference
+***************
+
+Image Classification
+^^^^^^^^^^^^^^^^^^^^
+
+.. currentmodule:: tlt.models.image_classification
+
+.. autosummary::
+   :toctree: _autosummary
+   :nosignatures:
+
+   tfhub_image_classification_model.TFHubImageClassificationModel
+   tf_image_classification_model.TFImageClassificationModel
+   keras_image_classification_model.KerasImageClassificationModel
+   torchvision_image_classification_model.TorchvisionImageClassificationModel
+   pytorch_image_classification_model.PyTorchImageClassificationModel
+   pytorch_hub_image_classification_model.PyTorchHubImageClassificationModel
+   image_classification_model.ImageClassificationModel
+
+Text Classification
+^^^^^^^^^^^^^^^^^^^
+
+.. currentmodule:: tlt.models.text_classification
+
+.. autosummary::
+   :toctree: _autosummary
+   :nosignatures:
+
+   tf_text_classification_model.TFTextClassificationModel
+   pytorch_hf_text_classification_model.PyTorchHFTextClassificationModel
+   tf_hf_text_classification_model.TFHFTextClassificationModel
+   text_classification_model.TextClassificationModel
+
+Base Classes
+^^^^^^^^^^^^
+
+.. note:: Users should rarely need to interact directly with these.
+
+.. currentmodule:: tlt.models
+
+.. autosummary::
+   :toctree: _autosummary
+   :nosignatures:
+
+   pytorch_model.PyTorchModel
+   tf_model.TFModel
+   hf_model.HFModel
+   model.BaseModel
diff --git a/docs/cli.rst b/docs/cli.rst
new file mode 100644
index 0000000000000000000000000000000000000000..28bf6f03c819283b41b9ed45e75260423ffa1fd5
--- /dev/null
+++ b/docs/cli.rst
@@ -0,0 +1,7 @@
+CLI Reference
+=============
+
+.. click:: tlt.tools.cli.main:cli_group
+   :prog: tlt
+   :nested: full
+
diff --git a/docs/conf.py b/docs/conf.py
new file mode 100644
index 0000000000000000000000000000000000000000..6bae572f39e2a843b0945d7333017d4480c5e040
--- /dev/null
+++ b/docs/conf.py
@@ -0,0 +1,111 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+#
+# Copyright (c) 2022 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# SPDX-License-Identifier: Apache-2.0
+#
+
+# Configuration file for the Sphinx documentation builder.
+#
+# This file only contains a selection of the most common options. For a full
+# list see the documentation:
+# https://www.sphinx-doc.org/en/master/usage/configuration.html
+
+# -- Path setup --------------------------------------------------------------
+
+# If extensions (or modules to document with autodoc) are in another directory,
+# add these directories to sys.path here. If the directory is relative to the
+# documentation root, use os.path.abspath to make it absolute, like shown here.
+#
+import os
+import sys
+import shutil
+import glob
+sys.path.insert(0, os.path.abspath('../..'))
+sys.setrecursionlimit(1500)
+import sphinx_rtd_theme
+from datetime import datetime
+
+# -- Project information -----------------------------------------------------
+
+project = 'Intel® Transfer Learning Tool'
+author = 'Intel Corporation'
+copyright = '2022-' + str(datetime.now().year) + u', ' + author
+
+# The full version, including alpha/beta/rc tags
+release = '0.2.0'
+
+
+# -- General configuration ---------------------------------------------------
+
+# Add any Sphinx extension module names here, as strings. They can be
+# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom
+# ones.
+extensions = [
+    'myst_parser',
+    'nbsphinx',
+    'nbsphinx_link',
+    'sphinx.ext.autodoc',
+    'sphinx.ext.autosummary',
+    'sphinx.ext.doctest',
+    'sphinx.ext.intersphinx',
+    'sphinx.ext.napoleon',
+    'sphinx.ext.todo',
+    'sphinx.ext.viewcode',
+    'sphinx_click',
+]
+
+# Add any paths that contain templates here, relative to this directory.
+templates_path = ['_templates']
+
+# List of patterns, relative to source directory, that match files and
+# directories to ignore when looking for source files.
+# This pattern also affects html_static_path and html_extra_path.
+exclude_patterns = ['_build', 'Thumbs.db', '.DS_Store', '.venv3', 'README.md']
+
+# -- Options for HTML output -------------------------------------------------
+
+# The theme to use for HTML and HTML Help pages. See the documentation for
+# a list of builtin themes.
+#
+html_theme = 'sphinx_rtd_theme'
+html_theme_path = [sphinx_rtd_theme.get_html_theme_path()]
+
+html_last_updated_fmt = '%b %d, %Y'
+html_show_sphinx = False
+html_favicon = 'images/favicon-intel-32x32.png'
+
+# Add any paths that contain custom static files (such as style sheets) here,
+# relative to this directory. They are copied after the builtin static files,
+# so a file named "default.css" will overwrite the builtin "default.css".
+html_static_path = ['_static']
+templates_path = ['_templates']
+
+def setup(app):
+    app.add_css_file("tlt-custom.css")
+    app.add_js_file("tlt-custom.js")
+
+autodoc_member_order = 'bysource'
+nbsphinx_execute = 'never'
+nbsphinx_prolog = """
+:orphan:
+
+"""
+myst_heading_anchors = 2
+suppress_warnings = ["myst.xref_missing", "myst.header"]
+
+# Ask the myst parser to process <img> tags so Sphinx can handle them properly
+myst_enable_extensions = [ "html_image" ]
diff --git a/docs/distributed.rst b/docs/distributed.rst
new file mode 100644
index 0000000000000000000000000000000000000000..5a4e5389e4b37d1be3a43f1cdc3d35c578c1e532
--- /dev/null
+++ b/docs/distributed.rst
@@ -0,0 +1,4 @@
+:orphan:
+
+.. include:: ../tlt/distributed/README.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/docbuild.rst b/docs/docbuild.rst
new file mode 100644
index 0000000000000000000000000000000000000000..ee5e314b1ed114aa0a25f3c6041713625e80cced
--- /dev/null
+++ b/docs/docbuild.rst
@@ -0,0 +1,4 @@
+:orphan:
+
+.. include:: README.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/examples/README.rst b/docs/examples/README.rst
new file mode 100644
index 0000000000000000000000000000000000000000..8d2a38cb8c00e6bf2508262549d2195aca99c36f
--- /dev/null
+++ b/docs/examples/README.rst
@@ -0,0 +1,4 @@
+:orphan:
+
+.. include:: ../../examples/README.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/examples/cli/README.rst b/docs/examples/cli/README.rst
new file mode 100644
index 0000000000000000000000000000000000000000..d2a98679730db87110ccaee80e4a670232a5cffc
--- /dev/null
+++ b/docs/examples/cli/README.rst
@@ -0,0 +1,4 @@
+:orphan:
+
+.. include:: ../../../examples/cli/README.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/examples/cli/image_classification.rst b/docs/examples/cli/image_classification.rst
new file mode 100644
index 0000000000000000000000000000000000000000..601104ca62b44a68cfd0e0e8e104e97275a544f0
--- /dev/null
+++ b/docs/examples/cli/image_classification.rst
@@ -0,0 +1,2 @@
+.. include:: ../../../examples/cli/image_classification.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/examples/cli/text_classification.rst b/docs/examples/cli/text_classification.rst
new file mode 100644
index 0000000000000000000000000000000000000000..fbb183aa596c9019033322ec858f88e8f401ee13
--- /dev/null
+++ b/docs/examples/cli/text_classification.rst
@@ -0,0 +1,2 @@
+.. include:: ../../../examples/cli/text_classification.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/examples/examples.rst b/docs/examples/examples.rst
new file mode 100644
index 0000000000000000000000000000000000000000..65b30408f03f6739631782a45278fc04e50a2ee4
--- /dev/null
+++ b/docs/examples/examples.rst
@@ -0,0 +1,16 @@
+Examples
+########
+
+.. include:: ../../examples/README.md
+   :parser: myst_parser.sphinx_
+   :start-after: # Examples
+
+.. toctree::
+   :maxdepth: 1
+   :hidden:
+
+   cli/README
+   Image Classification CLI Example <cli/image_classification>
+   Text Classification CLI Example <cli/text_classification>
+   Jupyter Notebook API Examples <../notebooks/README>
+
diff --git a/docs/index.rst b/docs/index.rst
new file mode 100644
index 0000000000000000000000000000000000000000..c892c319c3d47025f10bbba15dfb947d2189164c
--- /dev/null
+++ b/docs/index.rst
@@ -0,0 +1,23 @@
+.. include:: ../README.md
+   :parser: myst_parser.sphinx_
+   :start-after:
+   :end-before:
+
+.. include:: ../README.md
+   :parser: myst_parser.sphinx_
+   :start-after:
+
+.. toctree::
+   :maxdepth: 1
+   :hidden:
+
+   Documentation Home
+   GetStarted
+   examples/examples
+   cli
+   api
+   Supported Models <Models>
+   Legal
+   genindex
+   GitHub Repository <https://github.com/IntelAI/transfer-learning>
+
diff --git a/docs/make.bat b/docs/make.bat
new file mode 100644
index 0000000000000000000000000000000000000000..32bb24529f92346af26219baed295b7488b77534
--- /dev/null
+++ b/docs/make.bat
@@ -0,0 +1,35 @@
+@ECHO OFF
+
+pushd %~dp0
+
+REM Command file for Sphinx documentation
+
+if "%SPHINXBUILD%" == "" (
+	set SPHINXBUILD=sphinx-build
+)
+set SOURCEDIR=.
+set BUILDDIR=_build
+
+%SPHINXBUILD% >NUL 2>NUL
+if errorlevel 9009 (
+	echo.
+	echo.The 'sphinx-build' command was not found. Make sure you have Sphinx
+	echo.installed, then set the SPHINXBUILD environment variable to point
+	echo.to the full path of the 'sphinx-build' executable. Alternatively you
+	echo.may add the Sphinx directory to PATH.
+	echo.
+	echo.If you don't have Sphinx installed, grab it from
+	echo.https://www.sphinx-doc.org/
+	exit /b 1
+)
+
+if "%1" == "" goto help
+
+%SPHINXBUILD% -M %1 %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% %O%
+goto end
+
+:help
+%SPHINXBUILD% -M help %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% %O%
+
+:end
+popd
diff --git a/docs/methods.rst b/docs/methods.rst
new file mode 100644
index 0000000000000000000000000000000000000000..151c82716d45273a1c4f67c239fb2c8bfc3cdfd3
--- /dev/null
+++ b/docs/methods.rst
@@ -0,0 +1,68 @@
+:orphan:
+
+Image Classification Methods
+^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+.. currentmodule:: tlt.models.image_classification
+
+.. autosummary::
+   :toctree: _autosummary
+   :nosignatures:
+
+   tfhub_image_classification_model.TFHubImageClassificationModel.train
+   tfhub_image_classification_model.TFHubImageClassificationModel.quantize
+   tfhub_image_classification_model.TFHubImageClassificationModel.optimize_graph
+   tfhub_image_classification_model.TFHubImageClassificationModel.benchmark
+
+   tf_image_classification_model.TFImageClassificationModel.train
+   tf_image_classification_model.TFImageClassificationModel.quantize
+   tf_image_classification_model.TFImageClassificationModel.optimize_graph
+   tf_image_classification_model.TFImageClassificationModel.benchmark
+
+   keras_image_classification_model.KerasImageClassificationModel.train
+   keras_image_classification_model.KerasImageClassificationModel.quantize
+   keras_image_classification_model.KerasImageClassificationModel.optimize_graph
+   keras_image_classification_model.KerasImageClassificationModel.benchmark
+
+   torchvision_image_classification_model.TorchvisionImageClassificationModel.train
+   torchvision_image_classification_model.TorchvisionImageClassificationModel.quantize
+   torchvision_image_classification_model.TorchvisionImageClassificationModel.benchmark
+
+   pytorch_image_classification_model.PyTorchImageClassificationModel.train
+   pytorch_image_classification_model.PyTorchImageClassificationModel.quantize
+   pytorch_image_classification_model.PyTorchImageClassificationModel.benchmark
+
+   pytorch_hub_image_classification_model.PyTorchHubImageClassificationModel.train
+   pytorch_hub_image_classification_model.PyTorchHubImageClassificationModel.quantize
+   pytorch_hub_image_classification_model.PyTorchHubImageClassificationModel.benchmark
+
+   image_classification_model.ImageClassificationModel.train
+   image_classification_model.ImageClassificationModel.quantize
+   image_classification_model.ImageClassificationModel.benchmark
+
+Text Classification Methods
+^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+
+.. currentmodule:: tlt.models.text_classification
+
+.. autosummary::
+   :toctree: _autosummary
+   :nosignatures:
+   :recursive:
+
+   tf_text_classification_model.TFTextClassificationModel.train
+   tf_text_classification_model.TFTextClassificationModel.quantize
+   tf_text_classification_model.TFTextClassificationModel.optimize_graph
+   tf_text_classification_model.TFTextClassificationModel.benchmark
+
+   pytorch_hf_text_classification_model.PyTorchHFTextClassificationModel.train
+   pytorch_hf_text_classification_model.PyTorchHFTextClassificationModel.quantize
+   pytorch_hf_text_classification_model.PyTorchHFTextClassificationModel.benchmark
+
+   tf_hf_text_classification_model.TFHFTextClassificationModel.train
+   tf_hf_text_classification_model.TFHFTextClassificationModel.quantize
+   tf_hf_text_classification_model.TFHFTextClassificationModel.optimize_graph
+   tf_hf_text_classification_model.TFHFTextClassificationModel.benchmark
+
+   text_classification_model.TextClassificationModel.train
+   text_classification_model.TextClassificationModel.quantize
+   text_classification_model.TextClassificationModel.benchmark
diff --git a/docs/notebooks/Medical_Imaging_Classification.nblink b/docs/notebooks/Medical_Imaging_Classification.nblink
new file mode 100644
index 0000000000000000000000000000000000000000..cfcc35b0d445825a4b4e2821e55c3af1f6ed8292
--- /dev/null
+++ b/docs/notebooks/Medical_Imaging_Classification.nblink
@@ -0,0 +1,3 @@
+{
+    "path": "../../notebooks/e2e_workflows/Medical_Imaging_Classification.ipynb"
+}
diff --git a/docs/notebooks/README.rst b/docs/notebooks/README.rst
new file mode 100644
index 0000000000000000000000000000000000000000..0bf4ee834d47f58a4a017dc408aaedda9dfba726
--- /dev/null
+++ b/docs/notebooks/README.rst
@@ -0,0 +1,96 @@
+Intel® Transfer Learning Tool API Notebook Examples
+===================================================
+
+.. toctree::
+   :maxdepth: 1
+   :hidden:
+
+   setup
+
+API examples are demonstrated using Jupyter notebooks.
+
+Prerequisites
+*************
+
+Before running these Jupyter notebook examples, use these :doc:`notebook setup instructions <setup>` to install required dependencies.
+
+
+Intel Transfer Learning Tool API Tutorial Notebooks
+***************************************************
+
+.. |imageClassPyTorch| image:: /images/Jupyter_logo.svg
+   :alt: Jupyter notebook .ipynb file
+   :height: 35
+.. _imageClassPyTorch: https://github.com/IntelAI/transfer-learning/blob/main/notebooks/image_classification/tlt_api_pyt_image_classification/TLT_PyTorch_Image_Classification_Transfer_Learning.ipynb
+
+.. |imageClassTensorFlow| image:: /images/Jupyter_logo.svg
+   :alt: Jupyter notebook .ipynb file
+   :height: 35
+.. _imageClassTensorflow: https://github.com/IntelAI/transfer-learning/blob/main/notebooks/image_classification/tlt_api_tf_image_classification/TLT_TF_Image_Classification_Transfer_Learning.ipynb
+
+.. |textClassPyTorch| image:: /images/Jupyter_logo.svg
+   :alt: Jupyter notebook .ipynb file
+   :height: 35
+.. _textClassPyTorch: https://github.com/IntelAI/transfer-learning/blob/main/notebooks/text_classification/tlt_api_pyt_text_classification/TLT_PYT_Text_Classification.ipynb
+
+.. |textClassTensorFlow| image:: /images/Jupyter_logo.svg
+   :alt: Jupyter notebook .ipynb file
+   :height: 35
+.. _textClassTensorflow: https://github.com/IntelAI/transfer-learning/blob/main/notebooks/text_classification/tlt_api_tf_text_classification/TLT_TF_Text_Classification.ipynb
+
+.. |imageAnomalyPyTorch| image:: /images/Jupyter_logo.svg
+   :alt: Jupyter notebook .ipynb file
+   :height: 35
+.. _imageAnomalyPyTorch: https://github.com/IntelAI/transfer-learning/blob/main/notebooks/image_anomaly_detection/tlt_api_pyt_anomaly_detection/Anomaly_Detection.ipynb
+
+.. csv-table::
+   :header: "Notebook Title", ".ipynb Link", "Use Case", "Framework"
+   :widths: 30, 10, 20, 20
+
+   :doc:`Image Classification with PyTorch <TLT_PyTorch_Image_Classification_Transfer_Learning>`, |imageClassPyTorch|_ , Image Classification, PyTorch & Intel Transfer Learning Tool
+   :doc:`Image Classification with TensorFlow <TLT_TF_Image_Classification_Transfer_Learning>`, |imageClassTensorFlow|_ , Image Classification, TensorFlow & Intel Transfer Learning Tool
+   :doc:`Text Classification with PyTorch <TLT_PyTorch_Text_Classification_Transfer_Learning>`, |textClassPyTorch|_ , Text Classification, PyTorch & Intel Transfer Learning Tool
+   :doc:`Text Classification with TensorFlow <TLT_TF_Text_Classification_Transfer_Learning>`, |textClassTensorflow|_ , Text Classification, TensorFlow & Intel Transfer Learning Tool
+   :doc:`Anomaly Detection using PyTorch <TLT_PyTorch_Anomly_Detection>`, |imageAnomalyPyTorch|_, Image Anomaly Detection, PyTorch & Intel Transfer Learning Tool
+
+Intel Transfer Learning Tool API End-to-End Pipelines
+*****************************************************
+
+.. |imageClassMedical| image:: /images/Jupyter_logo.svg
+   :alt: Jupyter notebook .ipynb file
+   :height: 35
+.. _imageClassMedical: https://github.com/IntelAI/transfer-learning/blob/main/notebooks/e2e_workflows/Medical_Imaging_Classification.ipynb
+
+.. |imageClassRemote| image:: /images/Jupyter_logo.svg
+   :alt: Jupyter notebook .ipynb file
+   :height: 35
+.. _imageClassRemote: https://github.com/IntelAI/transfer-learning/blob/main/notebooks/e2e_workflows/Remote_Sensing_Image_Scene_Classification.ipynb
+
+
+.. csv-table::
+   :header: "Notebook Title", ".ipynb Link", "Use Case", "Framework"
+   :widths: 30, 10, 20, 20
+
+   :doc:`Medical Imaging Classification (Colorectal histology) using TensorFlow <Medical_Imaging_Classification>`, |imageClassMedical|_ , Image Classification, TensorFlow & Intel Transfer Learning Tool
+   :doc:`Remote Sensing Image Scene Classification (Resisc) using TensorFlow <Remote_Sensing_Image_Scene_Classification>`, |imageClassRemote|_ , Image Classification, TensorFlow & Intel Transfer Learning Tool
+
+Intel Transfer Learning Tool Performance Comparison
+*****************************************************
+
+.. |imageClassTFPerf| image:: /images/Jupyter_logo.svg
+   :alt: Jupyter notebook .ipynb file
+   :height: 35
+.. _imageClassTFPerf: https://github.com/IntelAI/transfer-learning/blob/main/notebooks/performance/tf_image_classification_performance.ipynb
+
+.. |textClassHFPerf| image:: /images/Jupyter_logo.svg
+   :alt: Jupyter notebook .ipynb file
+   :height: 35
+.. _textClassHFPerf: https://github.com/IntelAI/transfer-learning/blob/main/notebooks/performance/hf_text_classification_performance.ipynb
+
+.. csv-table::
+   :header: "Notebook Title", ".ipynb Link", "Use Case", "Framework"
+   :widths: 30, 10, 20, 20
+
+   :doc:`Performance Comparison: Image Classification with TensorFlow <TLT_TF_Image_Classification_Performance>`, |imageClassTFPerf|_ , Image Classification, TensorFlow & Intel Transfer Learning Tool
+   :doc:`Performance Comparison: Text Classification with Hugging Face <TLT_HF_Text_Classification_Performance>`, |textClassHFPerf|_ , Text Classification, "Hugging Face, PyTorch & Intel Transfer Learning Tool"
diff --git a/docs/notebooks/Remote_Sensing_Image_Scene_Classification.nblink b/docs/notebooks/Remote_Sensing_Image_Scene_Classification.nblink
new file mode 100644
index 0000000000000000000000000000000000000000..049a7432c5a4bec934bca5b158f04f36a2c49b17
--- /dev/null
+++ b/docs/notebooks/Remote_Sensing_Image_Scene_Classification.nblink
@@ -0,0 +1,3 @@
+{
+    "path": "../../notebooks/e2e_workflows/Remote_Sensing_Image_Scene_Classification.ipynb"
+}
diff --git a/docs/notebooks/TLT_HF_Text_Classification_Performance.nblink b/docs/notebooks/TLT_HF_Text_Classification_Performance.nblink
new file mode 100644
index 0000000000000000000000000000000000000000..16675ab76dfdfbc554343cd9e26484e6f347374c
--- /dev/null
+++ b/docs/notebooks/TLT_HF_Text_Classification_Performance.nblink
@@ -0,0 +1,3 @@
+{
+    "path": "../../notebooks/performance/hf_text_classification_performance.ipynb"
+}
diff --git a/docs/notebooks/TLT_PyTorch_Anomly_Detection.nblink b/docs/notebooks/TLT_PyTorch_Anomly_Detection.nblink
new file mode 100644
index 0000000000000000000000000000000000000000..991c14663d63c2ce9324e1a4400ae61413c5815d
--- /dev/null
+++ b/docs/notebooks/TLT_PyTorch_Anomly_Detection.nblink
@@ -0,0 +1,3 @@
+{
+    "path": "../../notebooks/image_anomaly_detection/tlt_api_pyt_anomaly_detection/Anomaly_Detection.ipynb"
+}
diff --git a/docs/notebooks/TLT_PyTorch_Image_Classification_Transfer_Learning.nblink b/docs/notebooks/TLT_PyTorch_Image_Classification_Transfer_Learning.nblink
new file mode 100644
index 0000000000000000000000000000000000000000..5c4860d1590528aa461ea97df59b148bccac173c
--- /dev/null
+++ b/docs/notebooks/TLT_PyTorch_Image_Classification_Transfer_Learning.nblink
@@ -0,0 +1,3 @@
+{
+    "path": "../../notebooks/image_classification/tlt_api_pyt_image_classification/TLT_PyTorch_Image_Classification_Transfer_Learning.ipynb"
+}
diff --git a/docs/notebooks/TLT_PyTorch_Text_Classification_Transfer_Learning.nblink b/docs/notebooks/TLT_PyTorch_Text_Classification_Transfer_Learning.nblink
new file mode 100644
index 0000000000000000000000000000000000000000..35799bb73ee5e94fbc2a0628471972451aef80c7
--- /dev/null
+++ b/docs/notebooks/TLT_PyTorch_Text_Classification_Transfer_Learning.nblink
@@ -0,0 +1,3 @@
+{
+    "path": "../../notebooks/text_classification/tlt_api_pyt_text_classification/TLT_PYT_Text_Classification.ipynb"
+}
diff --git a/docs/notebooks/TLT_TF_Image_Classification_Performance.nblink b/docs/notebooks/TLT_TF_Image_Classification_Performance.nblink
new file mode 100644
index 0000000000000000000000000000000000000000..20e7f8f8ff391aaf9f096c952d1bb26ba0f309e1
--- /dev/null
+++ b/docs/notebooks/TLT_TF_Image_Classification_Performance.nblink
@@ -0,0 +1,3 @@
+{
+    "path": "../../notebooks/performance/tf_image_classification_performance.ipynb"
+}
diff --git a/docs/notebooks/TLT_TF_Image_Classification_Transfer_Learning.nblink b/docs/notebooks/TLT_TF_Image_Classification_Transfer_Learning.nblink
new file mode 100644
index 0000000000000000000000000000000000000000..7cef52ca9f36d4fe330639f0fb6456611abef3fd
--- /dev/null
+++ b/docs/notebooks/TLT_TF_Image_Classification_Transfer_Learning.nblink
@@ -0,0 +1,3 @@
+{
+    "path": "../../notebooks/image_classification/tlt_api_tf_image_classification/TLT_TF_Image_Classification_Transfer_Learning.ipynb"
+}
diff --git a/docs/notebooks/TLT_TF_Text_Classification_Transfer_Learning.nblink b/docs/notebooks/TLT_TF_Text_Classification_Transfer_Learning.nblink
new file mode 100644
index 0000000000000000000000000000000000000000..bf4a8a38a7dcccb986d047ebd01b24d2855a1a3a
--- /dev/null
+++ b/docs/notebooks/TLT_TF_Text_Classification_Transfer_Learning.nblink
@@ -0,0 +1,3 @@
+{
+    "path": "../../notebooks/text_classification/tlt_api_tf_text_classification/TLT_TF_Text_Classification.ipynb"
+}
diff --git a/docs/notebooks/setup.rst b/docs/notebooks/setup.rst
new file mode 100644
index 0000000000000000000000000000000000000000..a0e63106ebf3367f8014cd4f41c6b6fe7786dc09
--- /dev/null
+++ b/docs/notebooks/setup.rst
@@ -0,0 +1,4 @@
+:orphan:
+
+.. include:: ../../notebooks/setup.md
+   :parser: myst_parser.sphinx_
diff --git a/docs/requirements-docs.txt b/docs/requirements-docs.txt
new file mode 100644
index 0000000000000000000000000000000000000000..f3de818d0c8f1ccd68e97836531445220595e9f9
--- /dev/null
+++ b/docs/requirements-docs.txt
@@ -0,0 +1,8 @@
+docutils~=0.17.1
+ipykernel~=6.23.0
+myst-parser~=0.18.1
+nbsphinx~=0.9.1
+nbsphinx-link~=1.3.0
+sphinx~=5.2.0
+sphinx_click~=4.4.0
+sphinx_rtd_theme~=1.2.0
diff --git a/docs/tlt/distributed/README.rst b/docs/tlt/distributed/README.rst
new file mode 100644
index 0000000000000000000000000000000000000000..147065b960eb20ae04045c2f3569c3b93630242f
--- /dev/null
+++ b/docs/tlt/distributed/README.rst
@@ -0,0 +1,4 @@
+:orphan:
+
+.. include:: ../../../tlt/distributed/README.md
+   :parser: myst_parser.sphinx_
diff --git a/downloader/README.md b/downloader/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..1a47f58169aa44a94b5b258af5e6f78553d42e69
--- /dev/null
+++ b/downloader/README.md
@@ -0,0 +1,71 @@
+# Downloader
+
+An easy-to-use, unified tool for downloading and managing AI datasets and models.
+
+## Datasets
+
+### Supported Catalogs & File Types
+
+| Source | Info |
+|----------|-----------|
+| TensorFlow Datasets | [https://www.tensorflow.org/datasets](https://www.tensorflow.org/datasets) |
+| Torchvision | [https://pytorch.org/vision/stable/datasets.html](https://pytorch.org/vision/stable/datasets.html) |
+| Hugging Face | [https://huggingface.co/docs/datasets/index](https://huggingface.co/docs/datasets/index) |
+| Generic Web URL | Publicly downloadable files: `.zip`, `.gz`, `.bz2`, `.txt`, `.csv`, `.png`, `.jpg`, etc. |
+
+### Usage
+
+Dataset catalog example:
+```
+from downloader.datasets import DataDownloader
+
+downloader = DataDownloader('tf_flowers', dataset_dir='/home/user/datasets', catalog='tensorflow_datasets')
+downloader.download(split='train')
+```
+
+URL example (substitute a real, publicly downloadable URL for the placeholder):
+```
+from downloader.datasets import DataDownloader
+
+downloader = DataDownloader('my_dataset', dataset_dir='/home/user/datasets', url='http://<web_site>/<filename>.zip')
+downloader.download()
+```
+
+## Models
+
+### Supported Model Hubs
+
+| Source | Info |
+|----------|-----------|
+| TensorFlow Hub | [https://www.tensorflow.org/hub](https://www.tensorflow.org/hub) |
+| Torchvision | [https://pytorch.org/vision/stable/models.html](https://pytorch.org/vision/stable/models.html) |
+| Hugging Face | [https://huggingface.co/models](https://huggingface.co/models) (AutoModelForSequenceClassification or TFBertModel types) |
+
+### Usage
+
+Example:
+```
+from downloader.models import ModelDownloader
+
+# Hugging Face
+downloader = ModelDownloader('bert-large-uncased', hub='hugging_face', num_labels=2)
+downloader.download()
+
+# Torchvision
+downloader = ModelDownloader('resnet34', hub='torchvision')
+downloader.download()
+```
+
+## Build and Install
+
+To install the downloader, follow [the setup instructions for the Intel Transfer Learning Tool](/README.md#build-and-install). The downloader is currently
+packaged alongside the Intel Transfer Learning Tool and uses its requirements.txt files, but the tools may be separated in the future. The
+downloader's dependencies are tracked in [requirements.txt](requirements.txt).
+
+## Testing
+With an activated environment that has the downloader's dependencies and `pytest` installed, run this command from
+the repository root:
+
+```
+py.test -s downloader/tests
+```
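+
+For example, a minimal test sketch for the URL-based downloader might look like the
+following (illustrative only; the URL is a placeholder and this test is not part of
+the existing suite):
+
+```python
+# Illustrative pytest sketch for DataDownloader (placeholder URL).
+from downloader.datasets import DataDownloader
+
+def test_generic_url_download(tmp_path):
+    downloader = DataDownloader('my_dataset', dataset_dir=str(tmp_path),
+                                url='http://<web_site>/<filename>.zip')
+    # For an archive, download() extracts it and returns the extracted path(s)
+    result = downloader.download()
+    assert result
+```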
diff --git a/downloader/__init__.py b/downloader/__init__.py
new file mode 100644
index 0000000000000000000000000000000000000000..c754cd09acd3651e1431bb4997d7a37b861c32d6
--- /dev/null
+++ b/downloader/__init__.py
@@ -0,0 +1,23 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+#
+# Copyright (c) 2023 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# SPDX-License-Identifier: Apache-2.0
+#
+
+import os
+
+BASE_DIR = os.path.dirname(__file__)
diff --git a/downloader/datasets.py b/downloader/datasets.py
new file mode 100644
index 0000000000000000000000000000000000000000..16bfb8d62cdab75f9363e01aacd6dea32686c37c
--- /dev/null
+++ b/downloader/datasets.py
@@ -0,0 +1,129 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+#
+# Copyright (c) 2023 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# SPDX-License-Identifier: Apache-2.0
+#
+
+import os
+from pydoc import locate
+import tarfile
+import zipfile
+import inspect
+
+from downloader.types import DatasetType
+from downloader import utils
+
+
+class DataDownloader():
+    """
+    A unified dataset downloader class.
+
+    Can download from TensorFlow Datasets, Torchvision, Hugging Face, and generic web URLs. If initialized for a
+    dataset catalog, the download method will return a dataset object of type tensorflow.data.Dataset,
+    torch.utils.data.Dataset, or datasets.arrow_dataset.Dataset. If initialized for a web URL that is a zipfile or a
+    tarfile, the file will be extracted and the path, or list of paths, to the extracted contents will be returned.
+    """
+    def __init__(self, dataset_name, dataset_dir, catalog=None, url=None, **kwargs):
+        """
+        Class constructor for a DataDownloader.
+
+        Args:
+            dataset_name (str): Name of the dataset
+            dataset_dir (str): Local destination directory of the dataset
+            catalog (str, optional): The catalog to download the dataset from; options are 'tensorflow_datasets',
+                'torchvision', 'hugging_face', and None, which will result in a GENERIC type dataset that expects
+                an accompanying url input
+            url (str, optional): If downloading from the web, provide the URL location
+            kwargs (optional): Some catalogs accept additional keyword arguments when downloading
+
+        Raises:
+            ValueError: if both catalog and url are omitted, or if both are provided
+
+        """
+        if catalog is None and url is None:
+            raise ValueError("Must provide either a catalog or url as the source.")
+        if catalog is not None and url is not None:
+            raise ValueError("Only one of catalog or url should be provided. Found {} and {}.".format(catalog, url))
+
+        if not os.path.isdir(dataset_dir):
+            os.makedirs(dataset_dir)
+
+        self._dataset_name = dataset_name
+        self._dataset_dir = dataset_dir
+        self._type = DatasetType.from_str(catalog)
+        self._url = url
+        self._args = kwargs
+
+    def download(self, split='train'):
+        """
+        Download the dataset.
+
+        Args:
+            split (str, optional): desired split
+
+        Returns:
+            tensorflow.data.Dataset, torch.utils.data.Dataset, datasets.arrow_dataset.Dataset, str, or list[str]
+
+        """
+        if self._type == DatasetType.TENSORFLOW_DATASETS:
+            import tensorflow_datasets as tfds
+            if isinstance(split, str):
+                split = [split]
+            os.environ['NO_GCE_CHECK'] = 'true'
+            return tfds.load(self._dataset_name,
+                             data_dir=self._dataset_dir,
+                             split=split,
+                             **self._args)
+
+        elif self._type == DatasetType.TORCHVISION:
+            from torchvision.datasets import __all__ as torchvision_datasets
+            dataset_class = locate('torchvision.datasets.{}'.format(self._dataset_name))
+            if dataset_class:
+                # Only pass the kwargs that this dataset's constructor accepts
+                params = inspect.signature(dataset_class).parameters
+                kwargs = dict(download=True, split=split, train=split == 'train')
+                kwargs = dict([(k, v) for k, v in kwargs.items() if k in params])
+                return dataset_class(self._dataset_dir, **kwargs)
+            else:
+                raise ValueError("Torchvision dataset {} not found in following: {}"
+                                 .format(self._dataset_name, torchvision_datasets))
+
+        elif self._type == DatasetType.HUGGING_FACE:
+            from datasets import load_dataset
+            if 'subset' in self._args:
+                return load_dataset(self._dataset_name, self._args['subset'], split=split, cache_dir=self._dataset_dir)
+            else:
+                return load_dataset(self._dataset_name, split=split, cache_dir=self._dataset_dir)
+
+        elif self._type == DatasetType.GENERIC:
+            file_path = utils.download_file(self._url, self._dataset_dir)
+            if os.path.isfile(file_path):
+                if tarfile.is_tarfile(file_path):
+                    contents = utils.extract_tar_file(file_path, self._dataset_dir)
+                elif zipfile.is_zipfile(file_path):
+                    contents = utils.extract_zip_file(file_path, self._dataset_dir)
+                else:
+                    return file_path
+
+                # Contents are a list of top-level extracted members
+                # Convert to absolute paths and return a single string if length is 1
+                if len(contents) > 1:
+                    return [os.path.join(self._dataset_dir, i) for i in contents]
+                else:
+                    return os.path.join(self._dataset_dir, contents[0])
+
+            else:
+                raise FileNotFoundError("Unable to find the downloaded file at:", file_path)
+
+    Can download models from TF Hub, Torchvision, PyTorch Hub, Hugging Face, and Keras Applications.
+    """
+    def __init__(self, model_name, hub, model_dir=None, **kwargs):
+        """
+        Class constructor for a ModelDownloader.
+
+        Args:
+            model_name (str): Name of the model
+            hub (str): The model hub to download the model from; options are 'tf_hub',
+                'torchvision', 'pytorch_hub', 'hugging_face', 'keras', and 'tf_bert_huggingface'
+            model_dir (str, optional): Local destination directory of the model; if None, the model hub's default cache
+                directory will be used
+            kwargs (optional): Some model hubs accept additional keyword arguments when downloading
+
+        """
+        if model_dir is not None and not os.path.isdir(model_dir):
+            os.makedirs(model_dir)
+
+        self._model_name = model_name
+        self._model_dir = model_dir
+        self._type = ModelType.from_str(hub)
+        self._args = kwargs
+
+    def download(self):
+        """
+        Download the model
+
+        Returns:
+            A torch.nn.Module, keras.engine.functional.Functional, or tensorflow_hub.keras_layer.KerasLayer object
+
+        """
+        if self._type == ModelType.TF_HUB:
+            from tensorflow_hub import KerasLayer
+            if self._model_dir is not None:
+                os.environ['TFHUB_CACHE_DIR'] = self._model_dir
+
+            return KerasLayer(self._model_name, **self._args)
+
+        elif self._type == ModelType.TORCHVISION:
+            if self._model_dir is not None:
+                os.environ['TORCH_HOME'] = self._model_dir
+            pretrained_model_class = locate('torchvision.models.{}'.format(self._model_name))
+
+            return pretrained_model_class(**self._args)
+
+        elif self._type == ModelType.PYTORCH_HUB:
+            from tlt.utils.file_utils import read_json_file
+            from tlt import TLT_BASE_DIR
+            import torch
+
+            if self._model_dir is not None:
+                os.environ['TORCH_HOME'] = self._model_dir
+
+            config_file = os.path.join(TLT_BASE_DIR, "models/configs/pytorch_hub_image_classification_models.json")
+            pytorch_hub_model_map = read_json_file(config_file)
+            self._repo = pytorch_hub_model_map[self._model_name]["repo"]
+
+            # Some models default to pretrained=True, and error out if pretrained is also passed to load()
+            if pytorch_hub_model_map[self._model_name]["pretrained_default"] == "True":
+                return torch.hub.load(self._repo, self._model_name)
+            else:
+                return torch.hub.load(self._repo, self._model_name, pretrained=True)
+
+        elif self._type == ModelType.HUGGING_FACE:
+            if self._model_dir is not None:
+                os.environ['TRANSFORMERS_CACHE'] = self._model_dir
+            # AutoModelForSequenceClassification is currently the only supported model type
+            from transformers import AutoModelForSequenceClassification
+
+            return AutoModelForSequenceClassification.from_pretrained(self._model_name, **self._args)
+
+        elif self._type == ModelType.KERAS_APPLICATIONS:
+            if self._model_dir is not None:
+                os.environ['KERAS_HOME'] = self._model_dir
+            try:
+                pretrained_model_class = locate('keras.applications.{}'.format(self._model_name))
+            except TypeError:
+                pretrained_model_class = locate('keras.applications.{}.{}'.format(self._model_name.lower(),
+                                                                                  self._model_name))
+
+            return pretrained_model_class(**self._args)
+
+        elif self._type == ModelType.TF_BERT_HUGGINGFACE:
+            if self._model_dir is not None:
+                os.environ['TRANSFORMERS_CACHE'] = self._model_dir
+            from transformers import BertConfig, TFBertModel
+
+            config = BertConfig.from_pretrained(self._model_name, output_hidden_states=True)
+            return TFBertModel.from_pretrained(self._model_name, config=config, from_pt=True, **self._args)
diff --git a/downloader/tests/__init__.py b/downloader/tests/__init__.py
new file mode 100644
index 0000000000000000000000000000000000000000..55899ddaa2b193dbc3b2d314ec2712c6378dd375
---
/dev/null +++ b/downloader/tests/__init__.py @@ -0,0 +1,19 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# +# Copyright (c) 2023 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# +# SPDX-License-Identifier: Apache-2.0 +# diff --git a/downloader/tests/test_dataset_download.py b/downloader/tests/test_dataset_download.py new file mode 100644 index 0000000000000000000000000000000000000000..c24d1596160ca962faf066f9367310abba8ef7cb --- /dev/null +++ b/downloader/tests/test_dataset_download.py @@ -0,0 +1,116 @@ +import os +import pytest +import shutil +import tempfile + +try: + from datasets.arrow_dataset import Dataset as HF_Dataset +except ModuleNotFoundError: + print("WARNING: datasets may not be installed") + +try: + from torch.utils.data import Dataset as TV_Dataset +except ModuleNotFoundError: + print("WARNING: torch may not be installed") + +try: + from tensorflow.data import Dataset as TF_Dataset +except ModuleNotFoundError: + print("WARNING: tensorflow may not be installed") + +from downloader import datasets +from downloader.types import DatasetType + + +@pytest.mark.parametrize('dataset_name,catalog,url', + [['foo', 'tfds', 'https:...'], + ['bar', 'bar', None], + ['baz', None, None]]) +def test_bad_download(dataset_name, catalog, url): + """ + Tests downloader throws ValueError for bad inputs + """ + with pytest.raises(ValueError): + datasets.DataDownloader(dataset_name, dataset_dir='/tmp/data', catalog=catalog, url=url) + + +class TestDatasetDownload: + """ + Tests the dataset downloader with a temp download directory that is initialized and cleaned up + """ + URLS = {'sms_spam_collection': + 'https://archive.ics.uci.edu/static/public/228/sms+spam+collection.zip', + 'flowers': + 'https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz', + 'imagenet_labels': + 'https://storage.googleapis.com/download.tensorflow.org/data/ImageNetLabels.txt', + 'peacock': + 'https://c8.staticflickr.com/8/7095/7210797228_c7fe51c3cb_z.jpg', + 'pennfudan': + 'https://www.cis.upenn.edu/~jshi/ped_html/PennFudanPed.zip'} + + @classmethod + def setup_class(cls): + cls._dataset_dir = tempfile.mkdtemp() + + @classmethod + def teardown_class(cls): + if os.path.exists(cls._dataset_dir): + print("Deleting test directory:", cls._dataset_dir) + shutil.rmtree(cls._dataset_dir) + + @pytest.mark.integration + @pytest.mark.parametrize('dataset_name,catalog,split,kwargs,size', + [['tf_flowers', 'tfds', 'train', {}, 3670], + ['CIFAR10', 'torchvision', 'train', {}, 50000], + ['CIFAR10', 'torchvision', 'val', {}, 10000], + ['imdb', 'huggingface', 'train', {}, 25000], + ['glue', 'huggingface', 'test', {'subset': 'sst2'}, 1821]]) + def test_catalog_download(self, dataset_name, catalog, split, kwargs, size): + """ + Tests downloader for different dataset catalog types and splits + """ + downloader = datasets.DataDownloader(dataset_name, dataset_dir=self._dataset_dir, catalog=catalog, **kwargs) + data = downloader.download(split=split) + + # Check the type of the downloader and 
returned object
+        if catalog == 'tfds':
+            data = data[0]  # TFDS returns a list with the dataset in it
+            assert downloader._type == DatasetType.TENSORFLOW_DATASETS
+            assert isinstance(data, TF_Dataset)
+        elif catalog == 'torchvision':
+            assert downloader._type == DatasetType.TORCHVISION
+            assert isinstance(data, TV_Dataset)
+        elif catalog == 'huggingface':
+            assert downloader._type == DatasetType.HUGGING_FACE
+            assert isinstance(data, HF_Dataset)
+
+        # Verify the split size
+        assert len(data) == size
+
+        # Check that the directory is not empty
+        assert os.listdir(self._dataset_dir)
+
+    @pytest.mark.parametrize('dataset_name,url,num_contents',
+                             [['sms_spam_collection', URLS['sms_spam_collection'], 2],
+                              ['flowers', URLS['flowers'], 1],
+                              ['imagenet_labels', URLS['imagenet_labels'], 1],
+                              ['peacock', URLS['peacock'], 1],
+                              ['pennfudan', URLS['pennfudan'], 1]])
+    def test_generic_download(self, dataset_name, url, num_contents):
+        """
+        Tests downloader for different web URLs and file types
+        """
+        downloader = datasets.DataDownloader(dataset_name, dataset_dir=self._dataset_dir, url=url)
+        data_path = downloader.download()
+
+        assert downloader._type == DatasetType.GENERIC
+
+        # Test that the returned object is the expected type and length
+        if num_contents == 1:
+            assert isinstance(data_path, str)
+            assert os.path.exists(data_path)
+        else:
+            assert isinstance(data_path, list)
+            for path in data_path:
+                assert os.path.exists(path)
diff --git a/downloader/tests/test_model_download.py b/downloader/tests/test_model_download.py
new file mode 100644
index 0000000000000000000000000000000000000000..d79068c11f3ba16b9db56e3ac60748f13e5bf3f7
--- /dev/null
+++ b/downloader/tests/test_model_download.py
@@ -0,0 +1,91 @@
+import os
+import pytest
+import shutil
+import tempfile
+
+try:
+    from torch.nn import Module
+except ModuleNotFoundError:
+    print("WARNING: Unable to import torch. Torch may not be installed")
+
+try:
+    from tensorflow_hub.keras_layer import KerasLayer
+except ModuleNotFoundError:
+    print("WARNING: Unable to import KerasLayer. Tensorflow Hub may not be installed")
+
+try:
+    from tensorflow.keras import Model
+except ModuleNotFoundError:
+    print("WARNING: Unable to import Keras Model. Tensorflow may not be installed")
+
+from downloader import models
+from downloader.types import ModelType
+
+
+@pytest.mark.parametrize('hub',
+                         ['foo',
+                          'bar',
+                          'baz'])
+def test_bad_hub(hub):
+    """
+    Tests downloader throws ValueError for bad inputs
+    """
+    model_name = 'model'
+    with pytest.raises(ValueError):
+        models.ModelDownloader(model_name, hub)
+
+
+class TestModelDownload:
+    """
+    Tests the model downloader with a temp download directory that is initialized and cleaned up
+    """
+    @classmethod
+    def setup_class(cls):
+        cls._model_dir = tempfile.mkdtemp()
+
+    @classmethod
+    def teardown_class(cls):
+        if os.path.exists(cls._model_dir):
+            print("Deleting test directory:", cls._model_dir)
+            shutil.rmtree(cls._model_dir)
+
+    # Has previously been skipped due to HTTP Error 403: rate limit exceeded
+    @pytest.mark.parametrize('model_name,hub,kwargs',
+                             [['https://tfhub.dev/google/efficientnet/b0/feature-vector/1', 'tf_hub', {}],
+                              ['https://tfhub.dev/tensorflow/bert_en_uncased_L-12_H-768_A-12/3', 'tfhub',
+                               {'name': 'encoder', 'trainable': True}],
+                              ['resnet34', 'torchvision', {}],
+                              ['mobilenet_v2', 'torchvision', {}],
+                              ['resnet18_ssl', 'pytorch_hub', {}],
+                              ['resnet50_swsl', 'pytorch_hub', {}],
+                              ['distilbert-base-uncased', 'huggingface', {}],
+                              ['bert-base-cased', 'hugging_face', {}],
+                              ['Xception', 'keras_applications', {}],
+                              ['ResNet50', 'keras', {'weights': 'imagenet', 'include_top': False}],
+                              ['google/bert_uncased_L-2_H-128_A-2', 'tf_bert_huggingface', {}],
+                              ['bert-base-uncased', 'tf_bert_hugging_face', {}]])
+    def test_hub_download(self, model_name, hub, kwargs):
+        """
+        Tests downloader for different model hubs
+        """
+        downloader = models.ModelDownloader(model_name, hub, model_dir=self._model_dir, **kwargs)
+        model = downloader.download()
+
+        # Check the type of the downloader and returned object
+        if downloader._type == ModelType.TF_HUB:
+            assert isinstance(model, KerasLayer)
+        elif downloader._type == ModelType.TORCHVISION:
+            assert isinstance(model, Module)
+        elif downloader._type == ModelType.PYTORCH_HUB:
+            assert isinstance(model, Module)
+        elif downloader._type == ModelType.HUGGING_FACE:
+            assert isinstance(model, Module)
+        elif downloader._type == ModelType.KERAS_APPLICATIONS:
+            assert isinstance(model, Model)
+        elif downloader._type == ModelType.TF_BERT_HUGGINGFACE:
+            assert isinstance(model, Model)
+        else:
+            assert False
+
+        # Check that the directory is not empty
+        assert os.listdir(self._model_dir)
diff --git a/downloader/types.py b/downloader/types.py
new file mode 100644
index 0000000000000000000000000000000000000000..a935fef8288e617e58d5b9b36ac5e393d987bdea
--- /dev/null
+++ b/downloader/types.py
@@ -0,0 +1,91 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+#
+# Copyright (c) 2023 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# +# SPDX-License-Identifier: Apache-2.0 +# + +from enum import Enum, auto + + +class DatasetType(Enum): + TENSORFLOW_DATASETS = auto() + TORCHVISION = auto() + HUGGING_FACE = auto() + GENERIC = auto() + + def __str__(self): + return self.name.lower() + + @staticmethod + def from_str(dataset_str): + if dataset_str is None: + return DatasetType.GENERIC + + dataset_str = dataset_str.lower() + + if dataset_str in ["tfds", "tensorflow", "tensorflow_datasets", "tensorflow datasets", "tensorflow_dataset", + "tensorflow dataset"]: + return DatasetType.TENSORFLOW_DATASETS + elif dataset_str in ["torchvision"]: + return DatasetType.TORCHVISION + elif dataset_str in ["huggingface", "hugging_face", "hugging face"]: + return DatasetType.HUGGING_FACE + elif dataset_str in ["generic"]: + return DatasetType.GENERIC + else: + options = [e.name for e in DatasetType] + raise ValueError("Unsupported dataset type: {} (Select from: {})".format( + dataset_str, options)) + + +class ModelType(Enum): + TF_HUB = auto() + TORCHVISION = auto() + PYTORCH_HUB = auto() + HUGGING_FACE = auto() + KERAS_APPLICATIONS = auto() + TF_BERT_HUGGINGFACE = auto() + GENERIC = auto() + + def __str__(self): + return self.name.lower() + + @staticmethod + def from_str(model_str): + if model_str is None: + return ModelType.GENERIC + + model_str = model_str.lower() + + if model_str in ["tfhub", "tf_hub", "tf hub", "tensorflow_hub", "tensorflow hub"]: + return ModelType.TF_HUB + elif model_str in ["torchvision"]: + return ModelType.TORCHVISION + elif model_str in ["pytorch_hub", "pyt_hub", "torch_hub", "torch hub", "pytorch hub"]: + return ModelType.PYTORCH_HUB + elif model_str in ["huggingface", "hugging_face", "hugging face"]: + return ModelType.HUGGING_FACE + elif model_str in ["keras", "keras_applications", "keras applications"]: + return ModelType.KERAS_APPLICATIONS + elif model_str in ["tf_bert_huggingface", "tf bert huggingface", "tf_bert_hugging_face", + "tf bert hugging face"]: + return ModelType.TF_BERT_HUGGINGFACE + elif model_str in ["generic"]: + return ModelType.GENERIC + else: + options = [e.name for e in ModelType] + raise ValueError("Unsupported model type: {} (Select from: {})".format(model_str, options)) diff --git a/downloader/utils.py b/downloader/utils.py new file mode 100644 index 0000000000000000000000000000000000000000..0ae94b4d6a29926326fbe67827bc70f2ce1f8486 --- /dev/null +++ b/downloader/utils.py @@ -0,0 +1,73 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# +# Copyright (c) 2023 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# +# SPDX-License-Identifier: Apache-2.0 +# + +import os +import tarfile +import requests +import shutil +import zipfile + + +def download_file(download_url, destination_directory): + """ + Downloads a file using the specified url to the destination directory. Returns the + path to the downloaded file. 
+ """ + if not os.path.isdir(destination_directory): + os.makedirs(destination_directory) + + destination_file_path = os.path.join(destination_directory, os.path.basename(download_url)) + + print("Downloading {} to {}".format(download_url, destination_directory)) + response = requests.get(download_url, stream=True, timeout=30) + with open(destination_file_path, 'wb') as out_file: + shutil.copyfileobj(response.raw, out_file) + + return destination_file_path + + +def extract_tar_file(tar_file_path, destination_directory): + """ + Extracts a tar file on the local file system to the destination directory. Returns a list + of top-level contents (files and folders) of the extracted archive. + """ + if not os.path.isdir(destination_directory): + os.makedirs(destination_directory) + + print("Extracting {} to {}".format(tar_file_path, destination_directory)) + with tarfile.open(tar_file_path) as t: + t.extractall(path=destination_directory) + contents = {i.split('/')[0] for i in t.getnames()} + return list(contents) + + +def extract_zip_file(zip_file_path, destination_directory): + """ + Extracts a zip file on the local file system to the destination directory. Returns a list + of top-level contents (files and folders) of the extracted archive. + """ + if not os.path.isdir(destination_directory): + os.makedirs(destination_directory) + + print("Extracting {} to {}".format(zip_file_path, destination_directory)) + with zipfile.ZipFile(zip_file_path, "r") as z: + z.extractall(path=destination_directory) + contents = {i.split('/')[0] for i in z.namelist()} + return list(contents) diff --git a/examples/README.md b/examples/README.md new file mode 100644 index 0000000000000000000000000000000000000000..951bf606e5acefae844735dc1024abcf6160bd08 --- /dev/null +++ b/examples/README.md @@ -0,0 +1,11 @@ +# Examples + +Here are some examples using no-code bash commands: + +* [Beyond Get Started CLI Example](cli/README.md) +* [Text Classification Intel® Transfer Learning Tool CLI Example](cli/text_classification.md) +* [Image Classification Intel® Transfer Learning Tool CLI Example](cli/image_classification.md) + +Here are Jupyter notebook examples using low-code Python\* API calls: + +* [Intel® Transfer Learning Tool API Examples](../notebooks/README.md) diff --git a/examples/cli/README.md b/examples/cli/README.md new file mode 100644 index 0000000000000000000000000000000000000000..f0dc6d3c2217fd95972d177a7e0a7741e87ce0bb --- /dev/null +++ b/examples/cli/README.md @@ -0,0 +1,227 @@ +# Beyond Get Started CLI Example + +If you already walked through the [Get Started Guide](/GetStarted.md), this +example begins with the same training steps and then continues with more examples of +using CLI commands to work with that trained model. + +The following example walks through a full workflow using the Intel Transfer Learning +Tool CLI to train a model, and then benchmark, quantize, and optimize the +trained model. It uses a TensorFlow image classification model, but the +same commands and concepts can be applied when working with other frameworks +and use cases. + +Use `tlt --help` to see the list of CLI commands. More detailed information on +each command can be found using `tlt --help` (such as `tlt train --help`). + +## List the Available Models + +Use the `tlt list` command to see a list of available models for each framework. +Use the `--use-case` flag to limit the list to models for a particular use case. 
+```
+tlt list models --use-case image_classification
+```
+```
+------------------------------
+IMAGE CLASSIFICATION
+------------------------------
+alexnet (pytorch)
+convnext_base (pytorch)
+convnext_large (pytorch)
+convnext_small (pytorch)
+convnext_tiny (pytorch)
+densenet121 (pytorch)
+densenet161 (pytorch)
+densenet169 (pytorch)
+densenet201 (pytorch)
+efficientnet_b0 (pytorch)
+efficientnet_b0 (tensorflow)
+efficientnet_b1 (pytorch)
+efficientnet_b1 (tensorflow)
+efficientnet_b2 (pytorch)
+efficientnet_b2 (tensorflow)
+efficientnet_b3 (pytorch)
+efficientnet_b3 (tensorflow)
+efficientnet_b4 (pytorch)
+efficientnet_b4 (tensorflow)
+...
+```
+
+## Train a Model
+
+For this example, we use the TensorFlow flowers dataset. Download and extract
+the dataset by following this example:
+```
+# Create a directory for the dataset to be downloaded
+DATASET_DIR=/tmp/dataset
+mkdir -p ${DATASET_DIR}
+
+# Download and extract the dataset
+wget -P ${DATASET_DIR} https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz
+tar -xzf ${DATASET_DIR}/flower_photos.tgz -C ${DATASET_DIR}
+
+# Set the DATASET_DIR to the extracted images folder
+DATASET_DIR=${DATASET_DIR}/flower_photos
+
+# Suppress debug information from TensorFlow 2.12 (exported so it reaches the tlt process)
+export TF_CPP_MIN_LOG_LEVEL=2
+```
+
+After the dataset directory is ready, use the `tlt train` command to train one of the models from
+`tlt list`. In this example, we use the TensorFlow ResNet50v1.5 model. Make sure to specify
+your own file path for the `output-dir`. The `dataset-dir` should point to the extracted dataset folder.
+```
+tlt train -f tensorflow --model-name resnet_v1_50 --dataset-dir ${DATASET_DIR} --output-dir /tmp/output
+```
+```
+Model name: resnet_v1_50
+Framework: tensorflow
+Training epochs: 1
+Dataset dir: /tmp/dataset/flower_photos
+Output directory: /tmp/output
+Found 3670 files belonging to 5 classes.
+...
+Model: "sequential"
+_________________________________________________________________
+Layer (type)                 Output Shape              Param #
+=================================================================
+keras_layer (KerasLayer)     (None, 2048)              23561152
+dense (Dense)                (None, 5)                 10245
+=================================================================
+Total params: 23,571,397
+Trainable params: 10,245
+Non-trainable params: 23,561,152
+_________________________________________________________________
+Checkpoint directory: /tmp/output/resnet_v1_50_checkpoints
+86/86 [==============================] - 24s 248ms/step - loss: 0.4600 - acc: 0.8438
+Saved model directory: /tmp/output/resnet_v1_50/1
+```
+
+The `tlt train` command evaluates the model after training completes. The loss and
+accuracy values are printed toward the end of the console output, along with the
+location where the trained model has been saved (including a new numbered folder for
+each run).
+
+A trained model can also be evaluated using the `tlt eval` command:
+```
+tlt eval --model-dir /tmp/output/resnet_v1_50/1 --dataset-dir ${DATASET_DIR}
+```
+
+## Benchmark the Trained Model
+
+Benchmark the performance of the trained model using `tlt benchmark`. Make sure
+to specify your own file paths for `model-dir` (including the numbered folder).
+The `dataset-dir` should point to the extracted dataset folder.
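+
+Before benchmarking, you can optionally confirm that the exported SavedModel loads outside of TLT. This is only a sanity-check sketch; it assumes TensorFlow is installed in the same environment, and the numbered folder from your own training run may differ:
+```
+python -c "import tensorflow as tf; m = tf.saved_model.load('/tmp/output/resnet_v1_50/1'); print(list(m.signatures))"
+```
+Once the model loads cleanly, run the benchmark: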
+```
+tlt benchmark --model-dir /tmp/output/resnet_v1_50/1 --dataset-dir ${DATASET_DIR} --batch-size 512
+```
+```
+Model directory: /tmp/output/resnet_v1_50/1
+Dataset directory: /tmp/dataset/flower_photos
+Batch size: 512
+Model name: resnet_v1_50
+Framework: tensorflow
+...
+performance mode benchmark result:
+2022-06-28 10:22:10 [INFO] Batch size = 512
+2022-06-28 10:22:10 [INFO] Latency: 3.031 ms
+2022-06-28 10:22:10 [INFO] Throughput: 329.878 images/sec
+```
+
+## Quantize the Model
+
+Perform post-training quantization with the [Intel® Neural
+Compressor](https://intel.github.io/neural-compressor) using the `tlt quantize`
+command. Make sure to specify your own file paths for `model-dir` (including the
+numbered folder), `dataset-dir`, and `output-dir`. The quantized model will be
+saved to the output directory.
+```
+tlt quantize --model-dir /tmp/output/resnet_v1_50/1 --dataset-dir ${DATASET_DIR} --batch-size 512 \
+--accuracy-criterion 0.01 --output-dir /tmp/output
+```
+```
+Model directory: /tmp/output/resnet_v1_50/1
+Dataset directory: /tmp/dataset/flower_photos
+Accuracy criterion: 0.01
+Exit policy timeout: 0
+Exit policy max trials: 50
+Batch size: 512
+Output directory: /tmp/output
+...
+2022-06-28 10:25:58 [INFO] |******Mixed Precision Statistics*****|
+2022-06-28 10:25:58 [INFO] +-----------------+----------+--------+
+2022-06-28 10:25:58 [INFO] | Op Type         | Total    | INT8   |
+2022-06-28 10:25:58 [INFO] +-----------------+----------+--------+
+2022-06-28 10:25:58 [INFO] | Conv2D          | 53       | 53     |
+2022-06-28 10:25:58 [INFO] | MatMul          | 1        | 1      |
+2022-06-28 10:25:58 [INFO] | MaxPool         | 4        | 4      |
+2022-06-28 10:25:58 [INFO] | QuantizeV2      | 5        | 5      |
+2022-06-28 10:25:58 [INFO] | Dequantize      | 4        | 4      |
+2022-06-28 10:25:58 [INFO] +-----------------+----------+--------+
+2022-06-28 10:25:58 [INFO] Pass quantize model elapsed time: 32164.27 ms
+2022-06-28 10:25:58 [INFO] Start to evaluate the TensorFlow model.
+2022-06-28 10:26:12 [INFO] Model inference elapsed time: 13921.64 ms
+2022-06-28 10:26:12 [INFO] Tune 1 result is: [Accuracy (int8|fp32): 0.9008|0.9022, Duration (seconds) (int8|fp32): 13.9226|17.3321], Best tune result is: [Accuracy: 0.9008, Duration (seconds): 13.9226]
+2022-06-28 10:26:12 [INFO] |**********************Tune Result Statistics**********************|
+2022-06-28 10:26:12 [INFO] +--------------------+----------+---------------+------------------+
+2022-06-28 10:26:12 [INFO] |     Info Type      | Baseline | Tune 1 result | Best tune result |
+2022-06-28 10:26:12 [INFO] +--------------------+----------+---------------+------------------+
+2022-06-28 10:26:12 [INFO] |      Accuracy      | 0.9022   |    0.9008     |     0.9008       |
+2022-06-28 10:26:12 [INFO] | Duration (seconds) | 17.3321  |   13.9226     |    13.9226       |
+2022-06-28 10:26:12 [INFO] +--------------------+----------+---------------+------------------+
+2022-06-28 10:26:12 [INFO] Save tuning history to /tmp/output/nc_workspace/./history.snapshot.
+2022-06-28 10:26:12 [INFO] Specified timeout or max trials is reached! Found a quantized model which meet accuracy goal. Exit.
+..
+INFO:tensorflow:SavedModel written to: /tmp/output/quantized/resnet_v1_50/1/saved_model.pb
+2022-06-28 10:26:13 [INFO] SavedModel written to: /tmp/output/quantized/resnet_v1_50/1/saved_model.pb
+2022-06-28 10:26:13 [INFO] Save quantized model to /tmp/output/quantized/resnet_v1_50/1
+```
+
+## Benchmark the Quantized Model
+
+The `tlt benchmark` command is used again, but this time the `model-dir` should point
+to the quantized model directory. Make sure to specify your own file paths for `model-dir` and `dataset-dir`.
+You can then compare the performance of the full precision model to the quantized model.
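+
+Quantization typically also shrinks the model on disk. As a quick check before re-running the benchmark (a simple sketch; the paths assume the example locations used above), compare the sizes of the two SavedModel folders:
+```
+du -sh /tmp/output/resnet_v1_50/1 /tmp/output/quantized/resnet_v1_50/1
+```
+Then rerun the benchmark, pointing `model-dir` at the quantized folder: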
+```
+tlt benchmark --model-dir /tmp/output/quantized/resnet_v1_50/1 --dataset-dir ${DATASET_DIR} --batch-size 512
+```
+```
+Model directory: /tmp/output/quantized/resnet_v1_50/1
+Dataset directory: /tmp/dataset/flower_photos
+Benchmarking mode: performance
+Batch size: 512
+Model name: resnet_v1_50
+Framework: tensorflow
+...
+performance mode benchmark result:
+2022-06-28 10:28:33 [INFO] Batch size = 512
+2022-06-28 10:28:33 [INFO] Latency: 0.946 ms
+2022-06-28 10:28:33 [INFO] Throughput: 1056.940 images/sec
+```
+
+## Perform Graph Optimization on the Trained Model
+
+Alternatively, the [Intel Neural Compressor](https://intel.github.io/neural-compressor) can be used to optimize
+the full precision graph. Make sure to specify your own file paths for `model-dir` and `output-dir`.
+Note that graph optimization is also done as part of the quantization flow, so there is no need to call
+`tlt optimize` on a quantized model.
+```
+tlt optimize --model-dir /tmp/output/resnet_v1_50/1 --output-dir /tmp/output
+```
+```
+Model directory: /tmp/output/resnet_v1_50/1
+Model name: resnet_v1_50
+Output directory: /tmp/output
+Framework: tensorflow
+Starting graph optimization
+...
+2022-06-28 13:50:01 [INFO] Graph optimization is done.
+...
+2022-06-28 13:51:21 [INFO] SavedModel written to: /tmp/output/optimized/resnet_v1_50/1/saved_model.pb
+```
+
+## Additional CLI Examples
+
+More CLI examples can be found here:
+* [Image classification examples](/examples/cli/image_classification.md)
+* [Text classification examples](/examples/cli/text_classification.md)
diff --git a/examples/cli/image_classification.md b/examples/cli/image_classification.md
new file mode 100644
index 0000000000000000000000000000000000000000..86d6cbb1e8888725bb9f647cfc4f30e4f4bfaaa2
--- /dev/null
+++ b/examples/cli/image_classification.md
@@ -0,0 +1,84 @@
+# Image Classification Intel® Transfer Learning Tool CLI Example
+
+## Transfer Learning Using Your Own Dataset
+
+The example below shows how the Intel Transfer Learning Tool CLI can be used for image classification transfer learning
+using your own dataset. The dataset is expected to be organized with subfolders for each image
+class. Each subfolder should contain .jpg images for the class. The name of the subfolder will
+be used as the class label.
+
+This example downloads a flower photos dataset from TensorFlow, which has images of
+flowers belonging to 5 classes: daisy, dandelion, roses, sunflowers, and tulips. The extracted
+dataset is already arranged in the expected format, with subfolders for each class.
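+
+For reference, the extracted archive has the layout described above, with one subfolder per class (the archive also includes a license file):
+```
+flower_photos
+  └── daisy
+  └── dandelion
+  └── roses
+  └── sunflowers
+  └── tulips
+```
+The commands below download and extract the dataset, train a model, and evaluate it: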
+```bash
+# Create dataset and output directories
+DATASET_DIR=/tmp/data
+OUTPUT_DIR=/tmp/output
+mkdir -p ${DATASET_DIR}
+mkdir -p ${OUTPUT_DIR}
+
+# Download and extract the dataset
+wget -P ${DATASET_DIR} https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz
+tar -xzf ${DATASET_DIR}/flower_photos.tgz -C ${DATASET_DIR}
+
+# Set the DATASET_DIR to the extracted images folder
+DATASET_DIR=${DATASET_DIR}/flower_photos
+
+# Train resnet_v1_50 using the flower photos directory
+tlt train \
+    -f tensorflow \
+    --model-name resnet_v1_50 \
+    --dataset-dir ${DATASET_DIR} \
+    --output-dir ${OUTPUT_DIR} \
+    --epochs 2
+
+# Evaluate the model exported after training
+# Note that your --model-dir path may vary, since each training run creates a new directory
+tlt eval \
+    --model-dir /tmp/output/resnet_v1_50/1 \
+    --dataset-dir ${DATASET_DIR}
+```
+
+## Transfer Learning Using a Dataset from the TFDS Catalog
+
+This example shows the Intel Transfer Learning Tool CLI being used for image classification transfer learning
+using the `tf_flowers` dataset from the
+[TensorFlow Datasets (TFDS) catalog](https://www.tensorflow.org/datasets/catalog/overview).
+
+```bash
+# Create dataset and output directories
+DATASET_DIR=/tmp/data
+OUTPUT_DIR=/tmp/output
+mkdir -p ${DATASET_DIR}
+mkdir -p ${OUTPUT_DIR}
+
+# Name of the dataset to use
+DATASET_NAME=tf_flowers
+
+# Train resnet_v1_50 using the TFDS catalog dataset
+tlt train \
+    -f tensorflow \
+    --model-name resnet_v1_50 \
+    --dataset-name ${DATASET_NAME} \
+    --dataset-dir ${DATASET_DIR} \
+    --output-dir ${OUTPUT_DIR} \
+    --epochs 2
+
+# Evaluate the model exported after training
+# Note that your --model-dir path may vary, since each training run creates a new directory
+tlt eval \
+    --model-dir ${OUTPUT_DIR}/resnet_v1_50/1 \
+    --dataset-name ${DATASET_NAME} \
+    --dataset-dir ${DATASET_DIR}
+```
+
+## Citations
+
+```
+@ONLINE {tfflowers,
+author = "The TensorFlow Team",
+title = "Flowers",
+month = "jan",
+year = "2019",
+url = "http://download.tensorflow.org/example_images/flower_photos.tgz" }
+```
diff --git a/examples/cli/text_classification.md b/examples/cli/text_classification.md
new file mode 100644
index 0000000000000000000000000000000000000000..cdd417b4e21e72c104e8d79220377c383c125b70
--- /dev/null
+++ b/examples/cli/text_classification.md
@@ -0,0 +1,183 @@
+# Text Classification Intel® Transfer Learning Tool CLI Example
+
+## Fine Tuning Using Your Own Dataset
+
+The example below shows how to fine tune a TensorFlow text classification model using your own
+dataset in the .csv format. The .csv file is expected to have 2 columns: a numerical class label
+and the text/sentence to classify. Note that although the TLT API is more flexible and allows for
+providing map functions to translate string class names to numerical values and filtering which
+columns are being used, the CLI only allows using .csv files in the expected format.
+
+The `--dataset-dir` argument is the path to the directory where your dataset is located, and the
+`--dataset-file` is the name of the .csv file to load from that directory. Use the `--class-names`
+argument to specify a list of the classes and the `--delimiter` to specify the character that
+separates the two columns. If no `--delimiter` is specified, the CLI defaults to a comma (`,`).
+
+This example downloads the [SMS Spam Collection](https://archive.ics.uci.edu/dataset/228/sms+spam+collection)
+dataset, which provides a tab-separated values file inside the .zip archive. This dataset has SMS text
+messages that are labeled as either `ham` or `spam`. The first column in the data file has
+the label (`ham` or `spam`) and the second column is the text of the SMS message. The string class
+labels are replaced with numerical values before training.
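+
+For context, each line of the extracted `SMSSpamCollection` file holds a label and a message separated by a tab. The rows below are illustrative stand-ins, not actual dataset contents:
+```
+ham	Are we still meeting for lunch today?
+spam	WINNER!! You have been selected for a cash prize, reply to claim
+```
+The commands below download the data, convert the labels to numerical values, and run training and evaluation: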
+```bash
+# Create dataset and output directories
+DATASET_DIR=/tmp/data
+OUTPUT_DIR=/tmp/output
+mkdir -p ${DATASET_DIR}
+mkdir -p ${OUTPUT_DIR}
+
+# Download the dataset and extract it into the dataset directory
+wget -P ${DATASET_DIR} https://archive.ics.uci.edu/static/public/228/sms+spam+collection.zip
+unzip ${DATASET_DIR}/sms+spam+collection.zip -d ${DATASET_DIR}
+
+# Make a copy of the .csv file with 'numerical' in the file name
+DATASET_FILE=SMSSpamCollection_numerical.csv
+cp ${DATASET_DIR}/SMSSpamCollection ${DATASET_DIR}/${DATASET_FILE}
+
+# Replace string class labels with numerical values in the .csv file
+# The list of numerical class labels is passed as --class-names during training and evaluation
+sed -i 's/ham/0/g' ${DATASET_DIR}/${DATASET_FILE}
+sed -i 's/spam/1/g' ${DATASET_DIR}/${DATASET_FILE}
+
+# Train google/bert_uncased_L-10_H-256_A-4 using our dataset file, which has tab delimiters
+tlt train \
+    -f tensorflow \
+    --model-name google/bert_uncased_L-10_H-256_A-4 \
+    --output-dir ${OUTPUT_DIR} \
+    --dataset-dir ${DATASET_DIR} \
+    --dataset-file ${DATASET_FILE} \
+    --epochs 2 \
+    --class-names 0,1 \
+    --delimiter $'\t'
+
+# Evaluate the model exported after training
+# Note that your --model-dir path may vary, since each training run creates a new directory
+tlt eval \
+    --model-dir ${OUTPUT_DIR}/google_bert_uncased_L-10_H-256_A-4/1 \
+    --model-name google/bert_uncased_L-10_H-256_A-4 \
+    --dataset-dir ${DATASET_DIR} \
+    --dataset-file ${DATASET_FILE} \
+    --class-names 0,1 \
+    --delimiter $'\t'
+```
+
+## Fine Tuning Using a Dataset from the TFDS Catalog
+
+This example demonstrates using the Intel Transfer Learning Tool CLI to fine tune a text classification model using a
+dataset from the [TensorFlow Datasets (TFDS) catalog](https://www.tensorflow.org/datasets/catalog/overview).
+Intel Transfer Learning Tool supports the following text classification datasets from TFDS:
+[imdb_reviews](https://www.tensorflow.org/datasets/catalog/imdb_reviews),
+[glue/sst2](https://www.tensorflow.org/datasets/catalog/glue),
+and [glue/cola](https://www.tensorflow.org/datasets/catalog/glue#gluecola_default_config).
+
+```bash
+# Create dataset and output directories
+DATASET_DIR=/tmp/data
+OUTPUT_DIR=/tmp/output
+mkdir -p ${DATASET_DIR}
+mkdir -p ${OUTPUT_DIR}
+
+# Name of the dataset to use
+DATASET_NAME=imdb_reviews
+
+# Train google/bert_uncased_L-10_H-256_A-4 using the TFDS dataset
+tlt train \
+    -f tensorflow \
+    --model-name google/bert_uncased_L-10_H-256_A-4 \
+    --output-dir ${OUTPUT_DIR} \
+    --dataset-dir ${DATASET_DIR} \
+    --dataset-name ${DATASET_NAME} \
+    --epochs 2
+
+# Evaluate the model exported after training
+# Note that your --model-dir path may vary, since each training run creates a new directory
+tlt eval \
+    --model-dir ${OUTPUT_DIR}/google_bert_uncased_L-10_H-256_A-4/2 \
+    --model-name google/bert_uncased_L-10_H-256_A-4 \
+    --dataset-dir ${DATASET_DIR} \
+    --dataset-name ${DATASET_NAME}
+```
+
+## Distributed Transfer Learning Using a Dataset from Hugging Face
+This example runs a distributed PyTorch training job using the TLT CLI. It fine tunes a text classification model
+for document-level sentiment analysis using a dataset from the [Hugging Face catalog](https://huggingface.co/datasets).
+Intel Transfer Learning Tool supports the following text classification datasets from Hugging Face: +* [imdb](https://huggingface.co/datasets/imdb) +* [tweet_eval](https://huggingface.co/datasets/tweet_eval) +* [rotten_tomatoes](https://huggingface.co/datasets/rotten_tomatoes) +* [ag_news](https://huggingface.co/datasets/ag_news) +* [sst2](https://huggingface.co/datasets/sst2) + +Follow [these instructions](/tlt/distributed/README.md) to set up your machines for distributed training with PyTorch. This will +ensure your environment has the right prerequisites, package dependencies, and hostfile configuration. When +you have successfully run the sanity check, the following commands will fine-tune `bert-large-uncased` with sst2 for +one epoch using 2 nodes and 2 processes per node. + +```bash +# Create dataset and output directories +DATASET_DIR=/tmp/data +OUTPUT_DIR=/tmp/output +mkdir -p ${DATASET_DIR} +mkdir -p ${OUTPUT_DIR} + +# Name of the dataset to use +DATASET_NAME=sst2 + +# Train bert-large-uncased using the Hugging Face dataset sst2 +tlt train \ + -f pytorch \ + --model_name bert-large-uncased \ + --dataset_name sst2 \ + --output_dir $OUTPUT_DIR \ + --dataset_dir $DATASET_DIR \ + --distributed \ + --hostfile hostfile \ + --nnodes 2 \ + --nproc_per_node 2 +``` + +## Citations +``` +@InProceedings{maas-EtAl:2011:ACL-HLT2011, + author = {Maas, Andrew L. and Daly, Raymond E. and Pham, Peter T. and Huang, Dan and Ng, Andrew Y. and Potts, Christopher}, + title = {Learning Word Vectors for Sentiment Analysis}, + booktitle = {Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies}, + month = {June}, + year = {2011}, + address = {Portland, Oregon, USA}, + publisher = {Association for Computational Linguistics}, + pages = {142--150}, + url = {http://www.aclweb.org/anthology/P11-1015} +} + +@inproceedings{wang2019glue, + title={{GLUE}: A Multi-Task Benchmark and Analysis Platform for Natural Language Understanding}, + author={Wang, Alex and Singh, Amanpreet and Michael, Julian and Hill, Felix and Levy, Omer and Bowman, Samuel R.}, + note={In the Proceedings of ICLR.}, + year={2019} +} + +@misc{misc_sms_spam_collection_228, + author = {Almeida, Tiago}, + title = {{SMS Spam Collection}}, + year = {2012}, + howpublished = {UCI Machine Learning Repository} +} + +@inproceedings{socher-etal-2013-recursive, + title = "Recursive Deep Models for Semantic Compositionality Over a Sentiment Treebank", + author = "Socher, Richard and + Perelygin, Alex and + Wu, Jean and + Chuang, Jason and + Manning, Christopher D. 
and
+              Ng, Andrew and
+              Potts, Christopher",
+    booktitle = "Proceedings of the 2013 Conference on Empirical Methods in Natural Language Processing",
+    month = oct,
+    year = "2013",
+    address = "Seattle, Washington, USA",
+    publisher = "Association for Computational Linguistics",
+    url = "https://www.aclweb.org/anthology/D13-1170",
+    pages = "1631--1642",
+}
+```
diff --git a/images/Jupyter_logo.svg b/images/Jupyter_logo.svg
new file mode 100644
index 0000000000000000000000000000000000000000..ab255087431725b5ae37c0fe279a6572f1064252
--- /dev/null
+++ b/images/Jupyter_logo.svg
@@ -0,0 +1,90 @@
+[SVG markup not preserved in this view: the Jupyter logo ("Group.svg", created using Figma 0.90)]
diff --git a/images/TLT-GSG_flow.svg b/images/TLT-GSG_flow.svg
new file mode 100644
index 0000000000000000000000000000000000000000..070d7d7596ab20e75ade5b678b28ffdc1d739ef8
--- /dev/null
+++ b/images/TLT-GSG_flow.svg
@@ -0,0 +1,59 @@
+[SVG markup not preserved in this view: Get Started flow diagram with steps 1) Check system requirements, 2) Install the Intel Transfer Learning Tool, 3) Choose how to run the Intel Transfer Learning Tool: a) Run using No-Code CLI, b) Run using Low-Code API]
diff --git a/images/TLT-tool_flow.svg b/images/TLT-tool_flow.svg
new file mode 100644
index 0000000000000000000000000000000000000000..7f67c1da2b77cddfc2c26ef454dd0f0ab0e8bbb1
--- /dev/null
+++ b/images/TLT-tool_flow.svg
@@ -0,0 +1,89 @@
+[SVG markup not preserved in this view: tool flow diagram with steps: Select Framework, Use Case, Dataset & Model (Framework: TensorFlow, PyTorch; Use Case: Image Classification, Text Classification; Dataset: public catalog (TF Hub, Torchvision, Hugging Face) or custom; Model: EfficientNet, InceptionV3, MobileNetV2, ResNet, BERT...); Pre-Process & Split Dataset (Resize, Batch, Split Train/Val, Augmentation); Train (Num Epochs, Initial Checkpoint, Distributed...); Evaluate & Predict (Evaluation, Prediction, Benchmarking); Optimize (Quantization or FP32 Graph Optimization); Export Model. Includes an "Optimizations for Intel" badge and note A: Retraining not possible once optimized]
diff --git a/images/favicon-intel-32x32.png b/images/favicon-intel-32x32.png
new file mode 100644
index 0000000000000000000000000000000000000000..5a6b7816762e4d5a558c24986fe539c6a6c3e3b8
Binary files /dev/null and b/images/favicon-intel-32x32.png differ
diff --git a/notebooks/README.md b/notebooks/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..dcb95e2203e270b2cb07883a0ddd15ec60c2e929
--- /dev/null
+++ b/notebooks/README.md
@@ -0,0 +1,48 @@
+# Transfer Learning Notebooks
+
+## Environment setup and running the notebooks
+
+Use the [setup instructions](setup.md) to install the dependencies required to run the notebooks.
+
+This directory has Jupyter notebooks that demonstrate transfer learning with
+and without Intel® Transfer Learning Tool. All of the notebooks use models from public model repositories
+and leverage the optimized libraries [Intel-optimized TensorFlow](https://pypi.org/project/intel-tensorflow/)
+and [Intel Extension for PyTorch](https://github.com/intel/intel-extension-for-pytorch).
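+
+Before launching Jupyter, it can help to confirm that the optimized frameworks are importable in your environment. These quick checks are only a sketch; each one is optional depending on which notebooks you plan to run:
+```
+python -c "import tensorflow as tf; print('TensorFlow', tf.__version__)"
+python -c "import intel_extension_for_pytorch as ipex; print('Intel Extension for PyTorch', ipex.__version__)"
+```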
+
+## Intel® Transfer Learning Tool Tutorial Notebooks
+
+| Notebook | Domain: Use Case | Framework | Description |
+| ---------| ---------|----------|-------------|
+| [BERT Text Classification with TensorFlow using the Intel® Transfer Learning Tool](/notebooks/text_classification/tlt_api_tf_text_classification) | NLP: Text Classification | TensorFlow and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to fine tune a BERT model from Hugging Face using text classification datasets. |
+| [BERT Text Classification with PyTorch using the Intel® Transfer Learning Tool](/notebooks/text_classification/tlt_api_pyt_text_classification) | NLP: Text Classification | PyTorch and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to fine tune a BERT model from Hugging Face using text classification datasets. |
+| [Image Classification with TensorFlow using Intel® Transfer Learning Tool](/notebooks/image_classification/tlt_api_tf_image_classification) | CV: Image Classification | TensorFlow and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to do transfer learning for image classification using a TensorFlow model. |
+| [Image Classification with TensorFlow using Graph Optimization and Intel® Transfer Learning Tool](/notebooks/image_classification/tlt_api_tf_image_classification) | CV: Image Classification | TensorFlow and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to do transfer learning with graph optimization that increases throughput for image classification using a TensorFlow model. |
+| [Image Classification with PyTorch using Intel® Transfer Learning Tool](/notebooks/image_classification/tlt_api_pyt_image_classification) | CV: Image Classification | PyTorch and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to do transfer learning for image classification using a PyTorch model. |
+| [Image Anomaly Detection with PyTorch using Intel® Transfer Learning Tool](/notebooks/image_anomaly_detection/tlt_api_pyt_anomaly_detection) | CV: Image Anomaly Detection | PyTorch and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to do feature extraction and PCA analysis using a single function for image anomaly detection using a Torchvision model. |
+
+## Native Framework Transfer Learning Notebooks
+
+| Notebook | Domain: Use Case | Framework | Description |
+| ---------| ---------|----------|-------------|
+| [BERT SQuAD fine tuning with TF Hub](/notebooks/question_answering/tfhub_question_answering) | NLP: Question Answering | TensorFlow | Demonstrates BERT fine tuning using scripts from the [TensorFlow Model Garden](https://github.com/tensorflow/models) and the [SQuAD dataset](https://rajpurkar.github.io/SQuAD-explorer/). The notebook allows for selecting a BERT large or BERT base model from [TF Hub](https://tfhub.dev). The fine tuned model is evaluated and exported as a saved model.
| +| [BERT Text Classification with TF Hub](/notebooks/text_classification/tfhub_text_classification) | NLP: Text Classification | TensorFlow | Demonstrates BERT binary text classification fine tuning using the [IMDb movie review dataset](https://www.tensorflow.org/datasets/catalog/imdb_reviews) and multiclass text classification fine tuning using the [AG News datasets](https://www.tensorflow.org/datasets/catalog/ag_news_subset) from [TensorFlow Datasets](https://www.tensorflow.org/datasets) or a custom dataset (for binary classification). The notebook allows for selecting a BERT encoder (BERT large, BERT base, or small BERT) to use along with a preprocessor from [TF Hub](https://tfhub.dev). The fine tuned model is evaluated and exported as a saved model. | +| [Text Classifier fine tuning with PyTorch & Hugging Face](/notebooks/text_classification/pytorch_text_classification) | NLP: Text Classification | PyTorch |Demonstrates fine tuning [Hugging Face models](https://huggingface.co/models) to do sentiment analysis using the [IMDb movie review dataset from Hugging Face Datasets](https://huggingface.co/datasets/imdb) or a custom dataset with [Intel® Extension for PyTorch*](https://github.com/intel/intel-extension-for-pytorch) | +| [Image Classification with TF Hub](/notebooks/image_classification/tf_image_classification) | CV: Image Classification | TensorFlow | Demonstrates transfer learning with multiple [TF Hub](https://tfhub.dev) image classifiers, TF datasets, and custom image datasets | +| [Image Classification with PyTorch & Torchvision](/notebooks/image_classification/pytorch_image_classification) | CV: Image Classification | PyTorch | Demonstrates transfer learning with multiple [Torchvision](https://pytorch.org/vision/stable/index.html) image classification models, Torchvision datasets, and custom datasets | + +## Transfer Learning Tool End-to-End Pipelines + +| Notebook | Domain: Use Case | Framework| Description | +| ---------| ---------|----------|-------------| +| [Document-Level Sentiment Analysis (SST2) using PyTorch and the Intel® Transfer Learning Tool API](/notebooks/e2e_workflows/Document_Level_Sentiment_Analysis.ipynb) | NLP: Text Classification | PyTorch and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to do transfer learning for text classification using a PyTorch model from Hugging Face for a document-level sentiment analysis workflow. | +| [Medical Imaging Classification (Colorectal histology) using TensorFlow and the Intel® Transfer Learning Tool API](/notebooks/e2e_workflows/Medical_Imaging_Classification.ipynb) | CV: Image Classification | TensorFlow and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to do transfer learning for image classification using a TensorFlow model for a medical imaging classification application. | +| [Remote Sensing Image Scene Classification (Resisc) using TensorFlow and the Intel® Transfer Learning Tool API](/notebooks/e2e_workflows/Remote_Sensing_Image_Scene_Classification.ipynb) | CV: Image Classification | TensorFlow and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to do transfer learning for image classification using a TensorFlow model for a remote sensing image scene classification application. 
|
+| [Multimodal Cancer Detection using TensorFlow, PyTorch, and the Intel® Transfer Learning Tool API](/notebooks/e2e_workflows/Multimodal_Cancer_Detection.ipynb) | CV: Image Classification<br>NLP: Text Classification | TensorFlow, PyTorch, and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to do transfer learning for a late fusion multimodal ensemble application using both NLP and computer vision models from PyTorch and TensorFlow, respectively. |
+| [Anomaly Detection with PyTorch using Intel® Transfer Learning Tool](/notebooks/e2e_workflows/Anomaly_Detection_MVTec.ipynb) | CV: Image Anomaly Detection | PyTorch and the Intel Transfer Learning Tool API | Demonstrates how to use the Intel Transfer Learning Tool API to do feature extraction and PCA analysis using dedicated function calls for image anomaly detection using a Torchvision model. |
+
+## Performance Comparison Notebooks
+
+| Notebook | Domain: Use Case | Framework | Description |
+| ---------| -----------------|----------|-------------|
+| [Performance Comparison: Image Classification Transfer Learning with TensorFlow and the Intel Transfer Learning Tool](/notebooks/performance/tf_image_classification_performance.ipynb) | CV: Image Classification | TensorFlow and the Intel Transfer Learning Tool API | Compares training and evaluation metrics and performance for image classification transfer learning using TensorFlow libraries and the Intel Transfer Learning Tool. |
+| [Performance Comparison: Text Classification Transfer Learning with Hugging Face and the Intel Transfer Learning Tool](/notebooks/performance/hf_text_classification_performance.ipynb) | NLP: Text Classification | Hugging Face, PyTorch, and the Intel Transfer Learning Tool API | Compares training and evaluation metrics for text classification transfer learning using the Hugging Face Trainer and the Intel Transfer Learning Tool. |
diff --git a/notebooks/e2e_workflows/Anomaly_Detection_MVTec.ipynb b/notebooks/e2e_workflows/Anomaly_Detection_MVTec.ipynb
new file mode 100644
index 0000000000000000000000000000000000000000..186def4bc2204297b7e8735a15dfb8ca1a038356
--- /dev/null
+++ b/notebooks/e2e_workflows/Anomaly_Detection_MVTec.ipynb
@@ -0,0 +1,603 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "3405d28d",
+   "metadata": {},
+   "source": [
+    "# Image Anomaly Detection with PyTorch using Intel® Transfer Learning Tool\n",
Intel® Transfer Learning Tool\n", + "\n", + "This notebook demonstrates anomaly detection using the Intel Transfer Learning Toolkit. It performs defect analysis with the MVTec dataset using PyTorch. The workflow uses a pretrained ResNet50 v1.5 model from torchvision." + ] + }, + { + "cell_type": "markdown", + "id": "1d61b7ac", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions to setup a PyTorch environment with all the dependencies required to run the notebook." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a0bf9fd0", + "metadata": {}, + "outputs": [], + "source": [ + "import matplotlib.pyplot as plt\n", + "import numpy as np\n", + "import os\n", + "import pandas as pd\n", + "import PIL.Image as Image\n", + "import torch, torchvision\n", + "from torchvision.transforms.functional import InterpolationMode\n", + "import requests\n", + "from io import BytesIO\n", + "\n", + "# tlt imports\n", + "from tlt.datasets import dataset_factory\n", + "from tlt.models import model_factory\n", + "from tlt.utils.file_utils import download_and_extract_tar_file, download_file\n", + "\n", + "# Specify a directory for the dataset to be downloaded\n", + "dataset_dir = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + " \n", + "# Specify a directory for output\n", + "output_dir = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "print(\"Dataset directory:\", dataset_dir)\n", + "print(\"Output directory:\", output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "8f1fc78c", + "metadata": {}, + "source": [ + "## 2. Get or load the model\n", + "\n", + "In this step, we use the model factory to get the desired model. The `get_model` function returns a pretrained model object from a public model hub, while the `load_model` function loads a pretrained model from a checkpoint on your local disk or in memory.\n", + "\n", + "Here we are getting the pretrained `resnet50` model from Torchvision:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ad4aeafd", + "metadata": {}, + "outputs": [], + "source": [ + "model = model_factory.get_model(model_name=\"resnet50\", framework=\"pytorch\", use_case='anomaly_detection')" + ] + }, + { + "cell_type": "markdown", + "id": "9d087ee7", + "metadata": {}, + "source": [ + "To load a previously trained model from a file, use this:\n", + "```\n", + "model = model_factory.load_model(model_name=\"resnet50\", model=, framework=\"pytorch\", \n", + " use_case='anomaly_detection')\n", + "```" + ] + }, + { + "cell_type": "markdown", + "id": "dabd4183", + "metadata": {}, + "source": [ + "## 3. Get the dataset" + ] + }, + { + "cell_type": "markdown", + "id": "2d314ba0", + "metadata": {}, + "source": [ + "To use [MVTec](https://www.mvtec.com/company/research/datasets/mvtec-ad) or your own image dataset for anomaly detection, your image files (`.jpg` or `.png`) should be arranged in one of two ways. 
\n",
+    "\n",
+    "### Method 1: Category Folders\n",
+    "\n",
+    "Arrange them in folders in the root dataset directory like this:\n",
+    "\n",
+    "```\n",
+    "hazelnut\n",
+    "  └── crack\n",
+    "  └── cut\n",
+    "  └── good\n",
+    "  └── hole\n",
+    "  └── print\n",
+    "```\n",
+    "\n",
+    "IMPORTANT: There must be a subfolder named `good` and at least one other folder of defective examples. It does not matter what the names of the other folders are or how many there are, as long as there is at least one. This would also be an acceptable Method 1 layout:\n",
+    "\n",
+    "```\n",
+    "toothbrush\n",
+    "  └── defective\n",
+    "  └── good\n",
+    "```\n",
+    "\n",
+    "TLT will encode all of the non-good images as \"bad\", use the \"good\" images in the training set, and use a mix of good and bad images in the validation set.\n",
+    "\n",
+    "### Method 2: Train & Test Folders with Category Subfolders\n",
+    "\n",
+    "Arrange them in folders in the root dataset directory like this:\n",
+    "\n",
+    "```\n",
+    "hazelnut\n",
+    "  └── train\n",
+    "      └── good\n",
+    "  └── test\n",
+    "      └── crack\n",
+    "      └── cut\n",
+    "      └── good\n",
+    "      └── hole\n",
+    "      └── print\n",
+    "```\n",
+    "\n",
+    "When using this layout, TLT will use the exact defined split for the train and validation subsets, unless you use the `shuffle_split` method to re-shuffle and split up the \"good\" images with the given percentages."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "64b24c5b-9b48-4041-a6a2-7c438ca3a0c5",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "img_dir = os.path.join(dataset_dir, 'hazelnut')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "357f3dfd",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Select the subdirectory in dataset_dir to use\n",
+    "dataset = dataset_factory.load_dataset(img_dir,\n",
+    "                                       use_case='image_anomaly_detection', \n",
+    "                                       framework=\"pytorch\")\n",
+    "\n",
+    "print(dataset._dataset)\n",
+    "print(\"Class names:\", str(dataset.class_names))\n",
+    "print(\"Defect names:\", dataset.defect_names)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "2200ef4e",
+   "metadata": {},
+   "source": [
+    "Note: The `defects` argument can be used to filter the validation set to use only a subset of defect types. For example:\n",
+    "```\n",
+    "dataset = dataset_factory.load_dataset(img_dir, \n",
+    "                                       use_case='image_anomaly_detection', \n",
+    "                                       framework=\"pytorch\",\n",
+    "                                       defects=['crack', 'hole'])\n",
+    "```"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "99f23249",
+   "metadata": {},
+   "source": [
+    "## 4. Prepare the dataset\n",
+    "Once you have your dataset, use the following cells to split and preprocess the data. We split it into training and test subsets, resize the images to match the selected model, and then batch the images. Pass in optional arguments to customize the [Resize](https://pytorch.org/vision/main/generated/torchvision.transforms.Resize.html) or [Normalize](https://pytorch.org/vision/main/generated/torchvision.transforms.Normalize.html) transforms.\n",
+    "Data augmentation can be applied to the training set by specifying the augmentations to be applied in the `add_aug` parameter. Supported augmentations are given below:\n",
+    "1. hflip - RandomHorizontalFlip\n",
+    "2. 
rotate - RandomRotate"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "dd91fbcf",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# If using Method 1 layout, split the dataset into training and test subsets.\n",
+    "if dataset._validation_type is None:\n",
+    "    dataset.shuffle_split(train_pct=.75, val_pct=0.0, test_pct=0.25)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "4fbe27a3-1b1e-4add-9725-28bceb62c474",
+   "metadata": {},
+   "source": [
+    "For the __cutpaste__ feature extractor, `cutpaste_type` can be specified in the `dataset.preprocess()` method as follows. The available options are _normal_, _scar_, _3way_, and _union_. The default is _normal_.\n",
+    "```\n",
+    "dataset.preprocess(224, batch_size=batch_size, interpolation=InterpolationMode.LANCZOS, cutpaste_type='normal')\n",
+    "```"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "e7c95a70",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Preprocess with an image size that matches the model, the desired batch size,\n",
+    "# and the desired interpolation method\n",
+    "batch_size = 64\n",
+    "cutpaste_type = 'normal'\n",
+    "dataset.preprocess(224, batch_size=batch_size, interpolation=InterpolationMode.LANCZOS, cutpaste_type=cutpaste_type)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "3704772b",
+   "metadata": {},
+   "source": [
+    "## 5. Visualize samples from the dataset\n",
+    "\n",
+    "We get a single batch from our training and test subsets and visualize the images as a sanity check."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cd6782b0",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def plot_images(images, labels, sup_title, predictions=None):\n",
+    "    plt.figure(figsize=(18,14))\n",
+    "    plt.subplots_adjust(hspace=0.5)\n",
+    "    for n in range(min(batch_size, 30)):\n",
+    "        plt.subplot(6,5,n+1)\n",
+    "        inp = images[n]\n",
+    "        inp = inp.numpy().transpose((1, 2, 0))\n",
+    "        # Undo the ImageNet normalization so the image displays correctly\n",
+    "        mean = np.array([0.485, 0.456, 0.406])\n",
+    "        std = np.array([0.229, 0.224, 0.225])\n",
+    "        inp = std * inp + mean\n",
+    "        inp = np.clip(inp, 0, 1)\n",
+    "        plt.imshow(inp)\n",
+    "        if predictions:\n",
+    "            # Color the title by whether the prediction matches the label\n",
+    "            correct_prediction = labels[n] == predictions[n]\n",
+    "            color = \"darkgreen\" if correct_prediction else \"crimson\"\n",
+    "            title = \"{}\".format(predictions[n])\n",
+    "        else:\n",
+    "            good_sample = labels[n] == 'good'\n",
+    "            color = \"darkgreen\" if good_sample else (\"crimson\" if labels[n] == 'bad' else \"black\")\n",
+    "            title = labels[n]\n",
+    "        plt.title(title, fontsize=14, color=color)\n",
+    "        plt.axis('off')\n",
+    "    _ = plt.suptitle(sup_title, fontsize=20)\n",
+    "    plt.show()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "ffcd2071",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Plot some images from the training set\n",
+    "images, labels = dataset.get_batch()\n",
+    "labels = [dataset.class_names[id] for id in labels]\n",
+    "plot_images(images, labels, 'Training Samples')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "d37b808f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Plot some images from the test set\n",
+    "test_images, test_labels = dataset.get_batch(subset='test')\n",
+    "test_labels = [dataset.class_names[id] for id in test_labels]\n",
+    "plot_images(test_images, test_labels, 'Test Samples')"
+   ]
+  },
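+  {
+   "cell_type": "markdown",
+   "id": "aa11bb22",
+   "metadata": {},
+   "source": [
+    "Note: if you also want augmentation applied to the training set, the `add_aug` options listed in step 4 can be passed to the same preprocessing call. This is a hypothetical variant of the call above, shown for illustration only (choose the augmentations before preprocessing rather than preprocessing twice):\n",
+    "```\n",
+    "dataset.preprocess(224, batch_size=batch_size, interpolation=InterpolationMode.LANCZOS,\n",
+    "                   cutpaste_type=cutpaste_type, add_aug=['hflip', 'rotate'])\n",
+    "```"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "a49ec7b7",
+   "metadata": {},
+   "source": [
+    "## 6. 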
Training and Evaluation\n",
+    "\n",
+    "This step calls the model's train function with the dataset that was just prepared. The training function will get the torchvision feature extractor for the user's desired layer and extract features from the training set. The extracted features are used to perform a [principal component analysis](https://scikit-learn.org/stable/modules/generated/sklearn.decomposition.PCA.html). The model's evaluate function returns the AUROC metric ([area under](https://scikit-learn.org/stable/modules/generated/sklearn.metrics.auc.html) the [ROC curve](https://scikit-learn.org/stable/modules/generated/sklearn.metrics.roc_curve.html)) calculated from the dataset's test subset."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "ab510f51",
+   "metadata": {},
+   "source": [
+    "### Train Arguments\n",
+    "\n",
+    "#### Required\n",
+    "- **dataset** (ImageAnomalyDetectionDataset, required): Dataset to use when training the model\n",
+    "- **output_dir** (str): Path to a writeable directory\n",
+    "\n",
+    "#### Optional\n",
+    "- **generate_checkpoints** (bool): Whether to save/preserve the best weights during SimSiam training (default: True)\n",
+    "- **initial_checkpoints** (str): The path to a starting weights file\n",
+    "- **layer_name** (str): The layer name whose output is desired for the extracted features\n",
+    "- **pooling** (str): Pooling to be applied on the extracted layer ('avg' or 'max') (default: 'avg')\n",
+    "- **kernel_size** (int): Kernel size in the pooling layer (default: 2)\n",
+    "- **pca_threshold** (float): Threshold to apply to the PCA model (default: 0.99)\n",
+    "\n",
+    "Note: refer to the release documentation for an up-to-date list of train arguments and their current descriptions"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "8cd9420d",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Examine the model's layers and decide which to use for feature extraction\n",
+    "model.list_layers(verbose=False)\n",
+    "layer = 'layer3'"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "b19be956-e3c6-4d9d-847d-779c1c35da38",
+   "metadata": {},
+   "source": [
+    "## Feature Extraction\n",
+    "There are three feature extractor options available within the `model.train()` function.\n",
+    "1. __No fine-tuning__ - To use a pretrained ResNet50/ResNet18 model for feature extraction, simply call `model.load_pretrained_model()`\n",
+    "2. [__SimSiam__](https://arxiv.org/abs/2011.10566) - A self-supervised neural network based on Siamese networks. It learns a meaningful representation of the dataset without using any labels. If selected, SimSiam generates quality features that can help differentiate between regular and anomalous images in a given context. SimSiam produces two different augmented images from one underlying image. The end goal is to train the network to produce the same features for both images. It takes a ResNet model as the backbone and fine-tunes the model on the augmented dataset to get a better feature embedding. To use this feature extractor, download the SimSiam weights based on ResNet50 - https://dl.fbaipublicfiles.com/simsiam/models/100ep-256bs/pretrain/checkpoint_0099.pth.tar - and set `initial_checkpoints` to the path of the downloaded checkpoints in the `model.train_simsiam()` function.\n",
+    "3. [__Cut-paste__](https://arxiv.org/abs/2104.04015#) - A self-supervised method for Anomaly Detection and Localization that takes a ResNet50/ResNet18 model as the backbone and fine-tunes the model on a custom dataset to get a better feature embedding. It uses a data augmentation strategy that cuts an image patch and pastes it at a random location in a larger image. To use this feature extractor, call the `model.train_cutpaste()` function. A toy sketch of the cut-paste idea is shown at the end of this section.\n",
+    "\n",
+    "\n",
+    "### Optional: The SimSiam TwoCropTransform\n",
+    "To train a SimSiam model, it is required to apply a TwoCropTransform augmentation technique on the dataset used for training. You can preview this augmentation on a sample batch after preprocessing by using `get_batch(simsiam=True)` and then use them for SimSiam training in `model.train_simsiam()`."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "6b49522f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Get a batch of training data with the simsiam transform applied to it\n",
+    "simsiam_images, _ = dataset.get_batch(simsiam=True)\n",
+    "\n",
+    "# Plot the \"A\" samples showing the first set of augmented images\n",
+    "plot_images(simsiam_images[0], ['{}A'.format(i) for i in range(batch_size)], 'SimSiam \"A\" Samples')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "a5da06df",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Now plot the \"B\" samples showing the second set of augmented images based on the same underlying originals\n",
+    "plot_images(simsiam_images[1], ['{}B'.format(i) for i in range(batch_size)], 'SimSiam \"B\" Samples')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "ace7d296-74d9-47c1-aeaf-386433bac411",
+   "metadata": {},
+   "source": [
+    "### Optional: The Cut-paste Transforms\n",
+    "To train a model with Cut-paste, it is required to apply one of the four augmentations - __CutPasteNormal, CutPasteScar, CutPaste3Way, CutPasteUnion__ - on the dataset used for training. You can preview this augmentation on a sample batch after preprocessing by using `get_batch(cutpaste=True)` and then use them for cutpaste training in `model.train_cutpaste()`."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "21cbadd5-8387-4130-b5b4-e016d4ea4e5e",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Get a batch of training data with the cutpaste transform applied to it\n",
+    "cutpaste_images, _ = dataset.get_batch(cutpaste=True)\n",
+    "\n",
+    "# Plot the \"A\" samples showing the first set of augmented images\n",
+    "plot_images(cutpaste_images[1], ['{}A'.format(i) for i in range(batch_size)], 'CutPaste \"A\" Samples')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "750bc599-80e4-4e70-8aaf-5f63082b9198",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "if cutpaste_type == '3way':\n",
+    "    # Now plot the \"B\" samples showing the second set of augmented images based on the same underlying originals\n",
+    "    plot_images(cutpaste_images[2], ['{}B'.format(i) for i in range(batch_size)], 'CutPaste \"B\" Samples')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "73ecdb31-4105-40fa-a1b1-89c1a9b08108",
+   "metadata": {},
+   "source": [
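+    "The cell below is a toy NumPy sketch of the core cut-paste idea mentioned above (copy a random patch and paste it elsewhere in the same image). It is for intuition only and is not the TLT implementation:\n",
+    "```\n",
+    "import numpy as np\n",
+    "\n",
+    "def toy_cut_paste(img, patch_frac=0.15, rng=None):\n",
+    "    # img: HxWxC array; returns an augmented copy with one patch relocated\n",
+    "    rng = np.random.default_rng() if rng is None else rng\n",
+    "    h, w = img.shape[:2]\n",
+    "    ph, pw = max(1, int(h * patch_frac)), max(1, int(w * patch_frac))\n",
+    "    top, left = rng.integers(0, h - ph + 1), rng.integers(0, w - pw + 1)\n",
+    "    patch = img[top:top + ph, left:left + pw].copy()\n",
+    "    dst_top, dst_left = rng.integers(0, h - ph + 1), rng.integers(0, w - pw + 1)\n",
+    "    out = img.copy()\n",
+    "    out[dst_top:dst_top + ph, dst_left:dst_left + pw] = patch\n",
+    "    return out\n",
+    "```\n",
+    "\n",
+    "To use a ResNet50 model for feature extraction, run the below command."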
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5663a407-44d7-447d-aa75-a05ae8355716", + "metadata": {}, + "outputs": [], + "source": [ + "extract_model = model.load_pretrained_model()" + ] + }, + { + "cell_type": "markdown", + "id": "275002cd-4708-4b19-a0bc-3e4a74af9ee2", + "metadata": {}, + "source": [ + "There is no fine-tuning being demonstrated here, but you can use `simsiam` or `cutpaste` if desired.\n", + "\n", + "To use simsiam, pass the checkpoint file in `initial_checkpoints` to `model.train_simsiam()` as follows\n", + "```\n", + "components = model.train_simsiam(dataset, output_dir, epochs=2, feature_dim=1000,\n", + " pred_dim=250, initial_checkpoints=,\n", + " generate_checkpoints=False, precision='float32')\n", + "```" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "392f7546-0ae5-4b6b-bba7-fbcf6220d0f0", + "metadata": {}, + "outputs": [], + "source": [ + "extract_model = model.train_simsiam(dataset, output_dir, epochs=2, feature_dim=1000, \n", + " pred_dim=250, initial_checkpoints=None,\n", + " generate_checkpoints=False, precision='float32')" + ] + }, + { + "cell_type": "markdown", + "id": "bd5c4fb9-0f81-4753-b990-c9a721dc95e0", + "metadata": {}, + "source": [ + "To use cutpaste, run `model.train_cutpaste` as given below. Optionally, to load a pretrained checkpoint pass the checkpoint file in `initial_checkpoints` to `model.train_cutpaste()` as follows.\n", + "```\n", + "components = model.train_cutpaste(dataset, output_dir, optim='sgd', epochs=2, freeze_resnet=20,\n", + " head_layer=2, cutpaste_type='normal', initial_checkpoints=,\n", + " generate_checkpoints=False, precision='float32')\n", + "```" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1b34e029-5235-4593-ab0b-12d27e672461", + "metadata": {}, + "outputs": [], + "source": [ + "extract_model = model.train_cutpaste(dataset, output_dir, optim='sgd', epochs=2, freeze_resnet=20, head_layer=2, cutpaste_type='normal',\n", + " generate_checkpoints=False, precision='float32')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "30fc18dd-7d78-4b77-b29b-8895e249cd34", + "metadata": {}, + "outputs": [], + "source": [ + "from tqdm import tqdm\n", + "from tlt.models.image_anomaly_detection.pytorch_image_anomaly_detection_model import extract_features, pca, get_feature_extraction_model\n", + "\n", + "layer_name = layer\n", + "pool = 'avg'\n", + "kernel_size = 2\n", + "dataset._dataset.transform = dataset._train_transform\n", + "images, labels = dataset.get_batch()\n", + "extract_model = get_feature_extraction_model(extract_model, layer_name)\n", + "outputs_inner = extract_features(extract_model, images.to('cpu'), layer_name,\n", + " pooling=[pool, kernel_size])\n", + "data_mats_orig = torch.empty((outputs_inner.shape[1], len(dataset.train_subset))).to('cpu')\n", + "\n", + "# Feature extraction\n", + "with torch.no_grad():\n", + " data_idx = 0\n", + " num_ims = 0\n", + " for images, labels in tqdm(dataset._train_loader):\n", + " images, labels = images.to('cpu'), labels.to('cpu')\n", + " num_samples = len(labels)\n", + " outputs = extract_features(extract_model, images, layer_name, pooling=[pool, kernel_size])\n", + " oi = torch.squeeze(outputs)\n", + " data_mats_orig[:, data_idx:data_idx + num_samples] = oi.transpose(1, 0)\n", + " num_ims += 1\n", + " data_idx += num_samples" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "030f5e0e-b7db-41e8-9a13-bcd16d9457c2", + "metadata": {}, + "outputs": [], + "source": [ + "# 
PCA\n", + "pca_threshold = 0.99\n", + "_pca_mats = pca(data_mats_orig, pca_threshold)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "6f60192d", + "metadata": {}, + "outputs": [], + "source": [ + "threshold, auroc = model.evaluate(dataset, _pca_mats, use_test_set=True)" + ] + }, + { + "cell_type": "markdown", + "id": "0a877f33", + "metadata": {}, + "source": [ + "## 7. Export" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "abc054ff", + "metadata": {}, + "outputs": [], + "source": [ + "model.export(os.path.join(output_dir, 'anomaly'))" + ] + }, + { + "cell_type": "markdown", + "id": "0947915a", + "metadata": {}, + "source": [ + "## Dataset Citations\n", + "\n", + "Paul Bergmann, Kilian Batzner, Michael Fauser, David Sattlegger, Carsten Steger: The MVTec Anomaly Detection Dataset: A Comprehensive Real-World Dataset for Unsupervised Anomaly Detection; in: International Journal of Computer Vision 129(4):1038-1059, 2021, DOI: 10.1007/s11263-020-01400-4.\n", + "\n", + "Paul Bergmann, Michael Fauser, David Sattlegger, Carsten Steger: MVTec AD — A Comprehensive Real-World Dataset for Unsupervised Anomaly Detection; in: IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR), 9584-9592, 2019, DOI: 10.1109/CVPR.2019.00982." + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.13" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/e2e_workflows/Document_Level_Sentiment_Analysis.ipynb b/notebooks/e2e_workflows/Document_Level_Sentiment_Analysis.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..d3753e8bfa7e886e8724b6346c2c9e011f63a522 --- /dev/null +++ b/notebooks/e2e_workflows/Document_Level_Sentiment_Analysis.ipynb @@ -0,0 +1,362 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "id": "ac1059eb", + "metadata": {}, + "source": [ + "# Document-Level Sentiment Analysis using
PyTorch and the Intel® Transfer Learning Tool API\n",
+    "\n",
+    "This notebook uses the Intel® Transfer Learning Tool to fine-tune a Hugging Face pretrained BERT model for text classification. While this notebook runs on a single node, this workload can also be run in a multinode setting using the TLT CLI. Consult the project documentation and examples to run it using PyTorch distributed training."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "0bb70464",
+   "metadata": {},
+   "source": [
+    "## 1. Import dependencies and setup parameters\n",
+    "\n",
+    "This notebook assumes that you have already followed the instructions to set up a PyTorch environment with all the dependencies required to run the notebook."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "20ab9972",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import intel_extension_for_pytorch as ipex\n",
+    "import numpy as np\n",
+    "import os\n",
+    "import pandas as pd\n",
+    "\n",
+    "# tlt imports\n",
+    "from tlt.datasets import dataset_factory\n",
+    "from tlt.models import model_factory\n",
+    "from tlt.utils.file_utils import download_and_extract_zip_file\n",
+    "\n",
+    "# Specify a directory for the dataset to be downloaded\n",
+    "dataset_dir = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n",
+    "    os.path.join(os.environ[\"HOME\"], \"dataset\")\n",
+    "\n",
+    "# Specify a directory for output\n",
+    "output_dir = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n",
+    "    os.path.join(os.environ[\"HOME\"], \"output\")\n",
+    "\n",
+    "print(\"Dataset directory:\", dataset_dir)\n",
+    "print(\"Output directory:\", output_dir)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "47787deb",
+   "metadata": {},
+   "source": [
+    "## 2. Get the model\n",
+    "\n",
+    "In this step, we call the Intel Transfer Learning Tool model factory to list supported Hugging Face text classification models. This is a list of pretrained models from Hugging Face that we tested with our API. Optionally, the `verbose=True` argument can be added to the `print_supported_models()` function call to get more information about each model (such as the links to Hugging Face, the original dataset, etc.)."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "52a4af60",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# See a list of available text classification models\n",
+    "model_factory.print_supported_models(use_case='text_classification', framework='pytorch')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "7293733f",
+   "metadata": {},
+   "source": [
+    "Use the TLT model factory to get one of the models listed in the previous cell. The `get_model` function returns a model object that will later be used for training. For this example, we will use bert-large-uncased."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "050d7b0a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "model_name = \"bert-large-uncased\"\n",
+    "framework = \"pytorch\"\n",
+    "\n",
+    "model = model_factory.get_model(model_name, framework, num_classes=2)\n",
+    "\n",
+    "print(\"Model name:\", model.model_name)\n",
+    "print(\"Framework:\", model.framework)\n",
+    "print(\"Use case:\", model.use_case)"
+   ]
+  },
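+  {
+   "cell_type": "markdown",
+   "id": "bb22cc33",
+   "metadata": {},
+   "source": [
+    "As noted above, the supported-models listing can be repeated with `verbose=True` if you want the extra details (links, original dataset, etc.) before committing to a model:\n",
+    "```\n",
+    "model_factory.print_supported_models(use_case='text_classification', framework='pytorch', verbose=True)\n",
+    "```"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "37bf5a93",
+   "metadata": {},
+   "source": [
+    "## 3. 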
Get the dataset"
+   ]
+  },
+  {
+   "attachments": {},
+   "cell_type": "markdown",
+   "id": "c833ce65",
+   "metadata": {},
+   "source": [
+    "### Option A: Use the Hugging Face catalog\n",
+    "\n",
+    "Here we are using the dataset in the [Hugging Face datasets catalog](https://huggingface.co/datasets)."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cf29cc7e",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "dataset_name = \"sst2\"\n",
+    "dataset = dataset_factory.get_dataset(dataset_dir, model.use_case, model.framework, dataset_name,\n",
+    "                                      dataset_catalog=\"huggingface\", shuffle_files=True, \n",
+    "                                      split=['train', 'validation'])\n",
+    "\n",
+    "print(dataset.info)\n",
+    "print(\"\\nClass names:\", str(dataset.class_names))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "28504679",
+   "metadata": {},
+   "source": [
+    "If you are using the Hugging Face dataset from Option A, skip ahead to step [4. Preprocess the dataset](#4.-Preprocess-the-dataset). To use your own dataset instead, continue with Option B below."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "6867f79e",
+   "metadata": {},
+   "source": [
+    "### Option B: Download the SST2 dataset\n",
+    "Option B explicitly downloads the `SST-2.zip` file and extracts a tab-separated `.tsv` file of training data. The dataset factory expects custom text classification input files to have at least two columns, where one is the label and the second column is the text/sentence to classify.\n",
+    "\n",
+    "For example, the header and first three rows of the file should look similar to this:\n",
+    "```\n",
+    "sentence\tlabel\n",
+    "hide new secretions from the parental units \t0\n",
+    "contains no wit , only labored gags \t0\n",
+    "that loves its characters and communicates something rather beautiful about human nature \t1\n",
+    "```\n",
+    "\n",
+    "When using your own dataset, update the path to your dataset directory, as well as the other variables with properties of the dataset, like the .csv (or .tsv) file name, class names, delimiter, header, and the map function (if string labels need to be translated into numerical values)."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "41edc8fc",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Modify the variables below to use a different dataset or a csv file on your local system.\n",
+    "dataset_url = \"https://dl.fbaipublicfiles.com/glue/data/SST-2.zip\"\n",
+    "csv_name = \"train.tsv\"\n",
+    "delimiter = \"\\t\"\n",
+    "dataset_subdir = os.path.join(dataset_dir, 'SST-2')\n",
+    "# If we don't already have the csv file, download and extract the zip file to get it.\n",
+    "if not os.path.exists(os.path.join(dataset_subdir, csv_name)):\n",
+    "    download_and_extract_zip_file(dataset_url, dataset_dir)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "94e348c2",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "dataset = dataset_factory.load_dataset(dataset_dir=dataset_subdir, \n",
+    "                                       use_case=\"text_classification\",\n",
+    "                                       framework=\"pytorch\", csv_file_name=csv_name,\n",
+    "                                       column_names=[\"sentence\", \"label\"], \n",
+    "                                       delimiter=delimiter, header=True, label_col=1)\n",
+    "\n",
+    "print(dataset.info)\n",
+    "print(\"\\nClass names:\", str(dataset.class_names))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "6e0771e4",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Create splits for training and validation\n",
+    "dataset.shuffle_split(train_pct=0.75, val_pct=0.25)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "539d53b7",
+   "metadata": {},
+   "source": [
+    "## 4. 
Preprocess the dataset\n",
+    "\n",
+    "Once you have your dataset from Option A or Option B above, use the following cell to preprocess the dataset. The dataset subsets are tokenized and then batched."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "587d1d9e",
+   "metadata": {
+    "scrolled": false
+   },
+   "outputs": [],
+   "source": [
+    "dataset.preprocess(model_name, batch_size=32, max_length=55)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "352eda54",
+   "metadata": {},
+   "source": [
+    "## 5. Fine-tuning\n",
+    "\n",
+    "The TLT model's train function is called with the dataset that was just prepared, along with an output directory for checkpoints and the number of training epochs.\n",
+    "\n",
+    "With the do_eval parameter set to True by default, this step will also show how the model can be evaluated. The model's evaluate function returns a list of metrics calculated from the dataset's validation subset."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "492ee811",
+   "metadata": {},
+   "source": [
+    "### Arguments\n",
+    "\n",
+    "#### Required\n",
+    "- **dataset** (TextClassificationDataset, required): Dataset to use when training the model\n",
+    "- **output_dir** (str): Path to a writeable directory for checkpoint files\n",
+    "- **epochs** (int): Number of epochs to train the model (default: 1)\n",
+    "\n",
+    "#### Optional\n",
+    "- **initial_checkpoints** (str): Path to checkpoint weights to load. If the path provided is a directory, the latest checkpoint will be used.\n",
+    "- **ipex_optimize** (bool): Optimize the model using Intel® Extension for PyTorch (default: True)\n",
+    "\n",
+    "Note: refer to the release documentation for an up-to-date list of train arguments and their current descriptions"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "955a4a7e",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "history = model.train(dataset, output_dir, epochs=1, ipex_optimize=True)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "7e08a1c9",
+   "metadata": {},
+   "source": [
+    "## 6. Predict\n",
+    "\n",
+    "The model's predict function can be called with a sentence."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "6f3cbd35",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "result = model.predict(\"Terrible movie\")\n",
+    "\n",
+    "print(\"Predicted score:\", float(result))\n",
+    "print(\"Predicted label:\", dataset.get_str_label(float(result)))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "64ada826",
+   "metadata": {},
+   "source": [
+    "## 7. Export the saved model\n",
+    "\n",
+    "Lastly, we can call the model export function to generate a saved_model.pb. Each time the model is exported, a new numbered directory is created, which allows serving to pick up the latest model."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "3981b2f5",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "saved_model_dir = model.export(output_dir)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "3d0ed367",
+   "metadata": {},
+   "source": [
+    "## Citation\n",
+    "\n",
+    "```\n",
+    "@inproceedings{socher-etal-2013-recursive,\n",
+    "    title = \"Recursive Deep Models for Semantic Compositionality Over a Sentiment Treebank\",\n",
+    "    author = \"Socher, Richard  and\n",
+    "      Perelygin, Alex  and\n",
+    "      Wu, Jean  and\n",
+    "      Chuang, Jason  and\n",
+    "      Manning, Christopher D. 
and\n",
+    "      Ng, Andrew  and\n",
+    "      Potts, Christopher\",\n",
+    "    booktitle = \"Proceedings of the 2013 Conference on Empirical Methods in Natural Language Processing\",\n",
+    "    month = oct,\n",
+    "    year = \"2013\",\n",
+    "    address = \"Seattle, Washington, USA\",\n",
+    "    publisher = \"Association for Computational Linguistics\",\n",
+    "    url = \"https://www.aclweb.org/anthology/D13-1170\",\n",
+    "    pages = \"1631--1642\",\n",
+    "}\n",
+    "```"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.10"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/notebooks/e2e_workflows/Medical_Imaging_Classification.ipynb b/notebooks/e2e_workflows/Medical_Imaging_Classification.ipynb
new file mode 100644
index 0000000000000000000000000000000000000000..3045a212f73cb059f98dd25ca264985708981a03
--- /dev/null
+++ b/notebooks/e2e_workflows/Medical_Imaging_Classification.ipynb
@@ -0,0 +1,413 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "fcfb563d-3f9c-4731-be1f-9c9c4b2c9dfd",
+   "metadata": {
+    "tags": []
+   },
+   "source": [
+    "# Medical Imaging Classification (Colorectal histology) using TensorFlow and the Intel® Transfer Learning Tool API"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "353f2782-043f-4afd-9858-cc773275e6c5",
+   "metadata": {},
+   "source": [
+    "This notebook demonstrates medical imaging classification using the Intel Transfer Learning Tool. It performs multi-class texture analysis on a colorectal cancer histology dataset. The workflow uses a pretrained SOTA model (ResNet v1.5) from TF Hub and transfers the knowledge from a pretrained domain to a different custom domain, achieving the required accuracy."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "8325300b-4a75-42fb-aa14-2b089b4edea5",
+   "metadata": {},
+   "source": [
+    "## 1. Import dependencies and setup parameters"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "04e3f113-4887-49c9-aa8b-a3c2058157a4",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import numpy as np\n",
+    "import os\n",
+    "import pickle\n",
+    "import tensorflow as tf\n",
+    "from sklearn.metrics import classification_report\n",
+    "\n",
+    "# tlt imports\n",
+    "from tlt.datasets import dataset_factory\n",
+    "from tlt.models import model_factory\n",
+    "from tlt.utils.types import FrameworkType, UseCaseType\n",
+    "\n",
+    "from notebooks.plot_utils import plot_curves\n",
+    "\n",
+    "# Specify a directory for the dataset to be downloaded\n",
+    "dataset_dir = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n",
+    "    os.path.join(os.environ[\"HOME\"], \"dataset\")\n",
+    "\n",
+    "# Specify a directory for output\n",
+    "output_dir = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n",
+    "    os.path.join(os.environ[\"HOME\"], \"output\")\n",
+    "\n",
+    "print(\"Dataset directory:\", dataset_dir)\n",
+    "print(\"Output directory:\", output_dir)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "a47ea534-0661-4cbe-97ed-ca288b6203e5",
+   "metadata": {},
+   "source": [
+    "## 2. 
Get the model"
+   ]
+  },
+  {
+   "attachments": {},
+   "cell_type": "markdown",
+   "id": "c9548167-cdfd-44ad-be60-cc3d131850a3",
+   "metadata": {},
+   "source": [
+    "In this step, we call the Intel Transfer Learning Tool model factory to list supported TensorFlow image classification models. This is a list of pretrained models from TFHub that we tested with our API. Optionally, the `verbose=True` argument can be added to the `print_supported_models()` function call to get more information about each model (such as the link to TFHub, image size, the original dataset, etc.)."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "bae74045-f024-498f-9ea7-3ee8ac2ea5d3",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# See a list of available models\n",
+    "model_factory.print_supported_models(use_case='image_classification', framework='tensorflow')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "3c06b359-1054-45c5-9223-47d4e1b7772d",
+   "metadata": {},
+   "source": [
+    "#### Option A: Load a model\n",
+    "\n",
+    "Next, use the model factory to get one of the models listed in the previous cell. The `get_model` function returns a model object that will later be used for training. By default, resnet_v1_50 is used for training."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "bf842217-d992-4b6f-99bf-aef475fa13dd",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Get the model\n",
+    "model = model_factory.get_model(model_name=\"resnet_v1_50\", framework=\"tensorflow\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "afa83899-0a99-4c9e-9e3d-00b040fe3e1f",
+   "metadata": {},
+   "source": [
+    "#### Option B: Load a pretrained checkpoint\n",
+    "\n",
+    "Optionally, to continue training using a pretrained checkpoint, the user can specify the path to the folder containing __saved_model.pb__ in the __model__ parameter.\n",
+    "\n",
+    "_Note: The path is the same as saved_model_dir_"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "9b49423b-e57d-478c-87b0-7daec6401b76",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Load a pretrained checkpoint\n",
+    "model = model_factory.load_model(model_name='resnet_v1_50', \n",
+    "                                 model='/home/intel/output/resnet_v1_50/1', \n",
+    "                                 framework='tensorflow', use_case='image_classification')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "ba2e4d10-458b-4479-8d1f-8cc67304d5c2",
+   "metadata": {},
+   "source": [
+    "## 3. Get the dataset\n",
+    "Use the __colorectal_histology__ dataset from the TensorFlow Datasets catalog."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cddcfdcf-ba16-4faa-a708-61f6aa01b3b0",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "dataset = dataset_factory.get_dataset(dataset_dir=dataset_dir,\n",
+    "                                      use_case='image_classification', \n",
+    "                                      framework='tensorflow',\n",
+    "                                      dataset_name='colorectal_histology',\n",
+    "                                      dataset_catalog='tf_datasets')\n",
+    "\n",
+    "print(dataset.info)\n",
+    "\n",
+    "print(\"\\nClass names:\", str(dataset.class_names))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "8ae3d375-554c-487b-8907-e895396d20e7",
+   "metadata": {},
+   "source": [
+    "## 4. Prepare the dataset\n",
+    "\n",
+    "Once you have your dataset, use the following cells to preprocess it. We resize the images to match the selected model and batch the images, then split them into training and validation subsets. Data augmentation can be applied by specifying the augmentations to be applied in the __add_aug__ parameter. 
Supported augmentations are:\n",
+    "1. hvflip - RandomHorizontalandVerticalFlip\n",
+    "2. hflip - RandomHorizontalFlip\n",
+    "3. vflip - RandomVerticalFlip\n",
+    "4. rotate - RandomRotate\n",
+    "5. zoom - RandomZoom"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "00d529b1-fe40-482a-b3f0-3875b13ba534",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Preprocess the dataset with an image size that matches the model and a batch size of 32\n",
+    "batch_size = 32\n",
+    "dataset.preprocess(model.image_size, batch_size=batch_size, add_aug=['hvflip', 'rotate'])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "1c4af8c6-c418-45d1-b0bc-dd8c7e2625c9",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Split the dataset into training, validation and test subsets\n",
+    "dataset.shuffle_split(train_pct=.80, val_pct=.10, test_pct=0.10)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "ab02c7d0-5b63-4be3-b6a6-cdfc03e48995",
+   "metadata": {},
+   "source": [
+    "## 5. Transfer Learning"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "feeb23c9-66a0-4670-8fd0-f7950dd2832e",
+   "metadata": {},
+   "source": [
+    "This step calls the model's train function with the dataset that was just prepared. The training function will get the TFHub feature vector and add on a dense layer based on the number of classes in the dataset. The model is then compiled and trained based on the number of epochs specified in the argument. With the do_eval parameter set to True by default, this step will also show how the model can be evaluated and will return a list of metrics calculated from the dataset's validation subset.\n",
+    "### Arguments\n",
+    "#### Required\n",
+    "- **dataset** (ImageClassificationDataset, required): Dataset to use when training the model\n",
+    "- **output_dir** (str): Path to a writeable directory for checkpoint files\n",
+    "- **epochs** (int): Number of epochs to train the model (default: 1)\n",
+    "#### Optional\n",
+    "- **initial_checkpoints** (str): Path to checkpoint weights to load. If the path provided is a directory, the latest checkpoint will be used.\n",
+    "- **early_stopping** (bool): Enable early stopping if convergence is reached while training at the end of each epoch. (default: False)\n",
+    "- **lr_decay** (bool): If lr_decay is True and do_eval is True, learning rate decay on the validation loss is applied at the end of each epoch.\n",
+    "- **enable_auto_mixed_precision** (bool or None): Enable auto mixed precision for training. Mixed precision uses both 16-bit and 32-bit floating point types to make training run faster and use less memory. It is recommended to enable auto mixed precision training when running on platforms that support bfloat16 (Intel third or fourth generation Xeon processors). If it is enabled on a platform that does not support bfloat16, it can be detrimental to the training performance. If enable_auto_mixed_precision is set to None, auto mixed precision will be automatically enabled when running with Intel fourth generation Xeon processors, and disabled for other platforms.\n",
+    "- **extra_layers** (list[int]): Optionally insert additional dense layers between the base model and output layer. This can help increase accuracy when fine-tuning a TFHub model. 
The input should be a list of integers representing the number and size of the layers, for example [1024, 512] will insert two dense layers, the first with 1024 neurons and the second with 512 neurons.\n", + "\n", + "Note: refer to release documentation for an up-to-date list of train arguments and their current descriptions" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "fa477dbb-58a9-4e06-9933-047699c35797", + "metadata": {}, + "outputs": [], + "source": [ + "# Mixed precision uses both 16-bit and 32-bit floating point types to make training run faster and use less memory.\n", + "# It is recommended to enable auto mixed precision training when running on platforms that support\n", + "# bfloat16 (Intel third or fourth generation Xeon processors). If it is enabled on a platform that\n", + "# does not support bfloat16, it can be detrimental to the training performance.\n", + "# If enable_auto_mixed_precision is set to None, auto mixed precision will be automatically enabled when\n", + "# running with Intel fourth generation Xeon processors, and disabled for other platforms.\n", + "enable_auto_mixed_precision = None\n", + "\n", + "# Train the model using the dataset\n", + "history = model.train(dataset, output_dir=output_dir, epochs=50, \n", + " enable_auto_mixed_precision=None, early_stopping=True)" + ] + }, + { + "cell_type": "markdown", + "id": "40e11437-5666-49c0-9547-22e7696c0ea0", + "metadata": {}, + "source": [ + "## 6. Evaluate" + ] + }, + { + "cell_type": "markdown", + "id": "1d413b5d-ed24-4756-928d-dbb8e7bf1af2", + "metadata": {}, + "source": [ + "The next step shows how the model can be evaluated. The model's evaluate function returns a list of metrics calculated from the dataset's validation subset." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f5bfc8e8-f8c6-4b56-bfc8-51b88288fcdd", + "metadata": {}, + "outputs": [], + "source": [ + "# Evaluate model on validation subset\n", + "val_loss, val_acc = model.evaluate(dataset)\n", + "print(\"Validation Accuracy :\", val_acc)\n", + "print(\"Validation Loss :\", val_loss)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c478191f-2c0c-49d6-a295-0a3acfd183a2", + "metadata": {}, + "outputs": [], + "source": [ + "plot_curves(history, os.path.join(output_dir, \"{}_checkpoints\".format(model.model_name)))\n", + "pickle.dump(history, open(os.path.join(output_dir, \"{}_checkpoints\".format(model.model_name), 'hist.pkl'), 'wb'))" + ] + }, + { + "cell_type": "markdown", + "id": "3c6fd051-97af-4142-b039-482cb742d988", + "metadata": {}, + "source": [ + "## 7. Export" + ] + }, + { + "cell_type": "markdown", + "id": "9225921d-5340-4865-ad4b-a2c19a5210ed", + "metadata": {}, + "source": [ + "Next, we can call the model export function to generate a saved_model.pb. The model is saved in a format that is ready to use with TensorFlow Serving. Each time the model is exported, a new numbered directory is created, which allows serving to pick up the latest model." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2c4fc5f8-cb72-4ab5-989b-43d7ad315e8b", + "metadata": {}, + "outputs": [], + "source": [ + "saved_model_dir = model.export(output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "5d79f06c-39cf-4c05-93bf-b35377ec06b1", + "metadata": {}, + "source": [ + "## 8. Inference\n", + "To perform only Inference using a saved model, follow the steps below\n", + "1. Execute Step 2(b) to load a pretrained checkpoint with the appropriate model name.\n", + "2. 
Execute Steps 3 and 4 to load and prepare the dataset.\n", + "3. Continue with the steps below" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "abb2182c-6302-474b-abab-7cf16c6b0966", + "metadata": {}, + "outputs": [], + "source": [ + "history = pickle.load(open(os.path.join(output_dir, \"{}_checkpoints\".format(model.model_name), 'hist.pkl'), 'rb'))\n", + "plot_curves(history, os.path.join(output_dir, \"{}_checkpoints\".format(model.model_name)))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e5da7be1-76d9-4554-ace6-7bf6ef0f8c21", + "metadata": {}, + "outputs": [], + "source": [ + "loss, accuracy = model.evaluate(dataset, use_test_set=True)\n", + "print('Test accuracy :', accuracy)" + ] + }, + { + "cell_type": "markdown", + "id": "eb585ceb-d120-4ded-a3b2-e78a5bd3dd7b", + "metadata": {}, + "source": [ + "We get the test subset from our dataset, and use that to call predict on our model." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9e1e0450-f6b7-4abd-990c-b65b8d77e599", + "metadata": {}, + "outputs": [], + "source": [ + "actual_labels = np.concatenate([y for x, y in dataset._test_subset], axis=0)\n", + "predicted_labels = model.predict(dataset._test_subset)\n", + "report = classification_report(actual_labels, predicted_labels)\n", + "print(\"Classification report\")\n", + "print(report)" + ] + }, + { + "cell_type": "markdown", + "id": "7863e336-7996-4518-9ada-2b7fdd9672b5", + "metadata": {}, + "source": [ + "## Dataset Citations\n", + "\n", + "@article{kather2016multi,
\n", + " title={Multi-class texture analysis in colorectal cancer histology},
\n", + " author={Kather, Jakob Nikolas and Weis, Cleo-Aron and Bianconi, Francesco and Melchers, Susanne M and Schad, Lothar R and Gaiser, Timo and Marx, Alexander and Z{\"o}llner, Frank Gerrit},
\n", + " journal={Scientific reports},
\n", + " volume={6},
\n", + " pages={27988},
\n", + " year={2016},
\n", + " publisher={Nature Publishing Group}
\n", + " }\n", + " \n", + "Kather, J. N., Zöllner, F. G., Bianconi, F., Melchers, S. M., Schad, L. R., Gaiser, T., Marx, A., & Weis, C.-A. (2016). Collection of textures in colorectal cancer histology [Data set]. Zenodo. https://doi.org/10.5281/zenodo.53169" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.13" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/e2e_workflows/Multimodal_Cancer_Detection.ipynb b/notebooks/e2e_workflows/Multimodal_Cancer_Detection.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..f07eee98b5e3540917ccf914416460778ee40b5e --- /dev/null +++ b/notebooks/e2e_workflows/Multimodal_Cancer_Detection.ipynb @@ -0,0 +1,511 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "2e3e807d", + "metadata": {}, + "source": [ + "# Multimodal Cancer Detection using the Intel® Transfer Learning Tool API\n", + "\n", + "This application is a multimodal solution for predicting cancer diagnosis using categorized contrast enhanced mammography data and radiology notes. It trains two models - one for image classification and the other for text classification - which can be combined into an ensemble classifier.\n", + "\n", + "## Import Dependencies and Setup Directories" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f2a722a7", + "metadata": {}, + "outputs": [], + "source": [ + "import numpy as np\n", + "import os\n", + "import pandas as pd\n", + "import tensorflow as tf\n", + "import torch\n", + "\n", + "from transformers import EvalPrediction, TrainingArguments\n", + "\n", + "# tlt imports\n", + "from tlt.datasets import dataset_factory\n", + "from tlt.models import model_factory\n", + "\n", + "# Specify the root directory where the images and annotations are located\n", + "dataset_dir = os.path.join(os.environ[\"DATASET_DIR\"]) if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + "\n", + "# Specify a directory for output\n", + "output_dir = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "print(\"Dataset directory:\", dataset_dir)\n", + "print(\"Output directory:\", output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "bb53162b", + "metadata": {}, + "source": [ + "## Dataset\n", + "\n", + "Download the images and radiology annotations from https://wiki.cancerimagingarchive.net/pages/viewpage.action?pageId=109379611\n", + "\n", + "Image files should have the .jpg extension and be arranged in subfolders for each class. The annotation file should be a .csv. 
The data directory should look something like this:\n", + "\n", + "```\n", + "brca\n", + " ├── annotation\n", + " │ └── annotation.csv\n", + " └── vision_images\n", + " ├── Benign\n", + " │ ├── P100_L_CM_CC.jpg\n", + " │ ├── P100_L_CM_MLO.jpg\n", + " │ └── ...\n", + " ├── Malignant\n", + " │ ├── P102_R_CM_CC.jpg\n", + " │ ├── P102_R_CM_MLO.jpg\n", + " │ └── ...\n", + " └── Normal\n", + " ├── P100_R_CM_CC.jpg\n", + " ├── P100_R_CM_MLO.jpg\n", + " └── ...\n", + "```" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bd9c3ef2", + "metadata": {}, + "outputs": [], + "source": [ + "# User input needed - supply the path to the images in the dataset_dir according to your system\n", + "source_image_path = os.path.join(dataset_dir, 'brca', 'vision_images')\n", + "image_path = source_image_path\n", + "\n", + "# User input needed - supply the path and name of the annotation file in the dataset_dir\n", + "source_annotation_path = os.path.join(dataset_dir, 'brca', 'annotation', 'annotation.csv')\n", + "annotation_path = source_annotation_path\n", + "label_col = 3 # Index of the label column in the data file" + ] + }, + { + "cell_type": "markdown", + "id": "245df47c", + "metadata": {}, + "source": [ + "### Optional: Group Data by Patient ID\n", + "\n", + "This section is not required to run the workload, but it is helpful to assign all of a subject's records to be entirely in the train set or test set. This section will do a random stratification based on patient ID and save new copies of the grouped data files." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "44dbd990", + "metadata": {}, + "outputs": [], + "source": [ + "from data_utils import split_images, split_annotation\n", + "\n", + "grouped_image_path = '{}_grouped'.format(source_image_path)\n", + "\n", + "if os.path.isdir(grouped_image_path):\n", + " print(\"Grouped directory already exists and will be used: {}\".format(grouped_image_path))\n", + "else:\n", + " split_images(source_image_path, grouped_image_path)\n", + "\n", + "image_path = grouped_image_path" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0d21bdff", + "metadata": {}, + "outputs": [], + "source": [ + "file_dir, file_name = os.path.split(source_annotation_path)\n", + "grouped_annotation_path = os.path.join(file_dir, '{}_grouped.csv'.format(os.path.splitext(file_name)[0]))\n", + "\n", + "if os.path.isfile(grouped_annotation_path):\n", + " print(\"Grouped annotation already exists and will be used: {}\".format(grouped_annotation_path))\n", + "else:\n", + " train_dataset = split_annotation(file_dir, file_name, image_path)\n", + " train_dataset.to_csv(grouped_annotation_path)\n", + " print('Grouped annotation saved to: {}'.format(grouped_annotation_path))\n", + "\n", + "annotation_path = grouped_annotation_path\n", + "label_col = 1 # Index of the label column in the grouped data file" + ] + }, + { + "cell_type": "markdown", + "id": "01e9e5cf", + "metadata": {}, + "source": [ + "## Model 1: Image Classification with TensorFlow\n", + "\n", + "### Get the Model and Dataset\n", + "Call the model factory to get a pretrained model from TensorFlow Hub and the dataset factory to load the images from their location. The `get_model` function returns a model object that will later be used for training. We will use resnet_v1_50 by default." 
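+    ,"\n",
+    "If you want to browse the other supported image classification models before choosing one, you can list them first (this is the same call used in the other notebooks in this repository):\n",
+    "```\n",
+    "model_factory.print_supported_models(use_case='image_classification', framework='tensorflow')\n",
+    "```"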
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d9c93b18", + "metadata": {}, + "outputs": [], + "source": [ + "model = model_factory.get_model(model_name=\"resnet_v1_50\", framework='tensorflow')\n", + "\n", + "# Load the dataset from the custom dataset path\n", + "dataset = dataset_factory.load_dataset(dataset_dir=image_path,\n", + " use_case='image_classification',\n", + " framework='tensorflow')\n", + "\n", + "print(\"Class names:\", str(dataset.class_names))" + ] + }, + { + "cell_type": "markdown", + "id": "6472bedd", + "metadata": {}, + "source": [ + "### Data Preparation\n", + "Once you have your dataset loaded, use the following cell to preprocess the dataset. We split the images into training and validation subsets, resize them to match the model, and then batch the images." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "98dcf057", + "metadata": {}, + "outputs": [], + "source": [ + "batch_size = 16\n", + "if 'grouped' not in image_path:\n", + " # Split if not pre-defined\n", + " dataset.shuffle_split(train_pct=.80, val_pct=0.0, test_pct=0.2)\n", + "dataset.preprocess(model.image_size, batch_size=batch_size)" + ] + }, + { + "cell_type": "markdown", + "id": "f2f49c77", + "metadata": {}, + "source": [ + "### Transfer Learning\n", + "\n", + "This step calls the model's train function with the dataset that was just prepared. The training function will get the TFHub feature vector and add on a dense layer based on the number of classes in the dataset. The model is then compiled and trained based on the number of epochs specified in the argument. We also add two more dense layers using the `extra_layers` parameter.\n", + "\n", + "To optionally insert additional dense layers between the base model and output layer, `extra_layers=[1024, 512]` will insert two dense layers, the first with 1024 neurons and the second with 512 neurons." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "21a92e4e", + "metadata": {}, + "outputs": [], + "source": [ + "history = model.train(dataset, output_dir=output_dir, epochs=5, seed=10, extra_layers=[1024, 512], do_eval=False)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "45289d48", + "metadata": {}, + "outputs": [], + "source": [ + "metrics = model.evaluate(dataset, use_test_set=True)\n", + "for metric_name, metric_value in zip(model._model.metrics_names, metrics):\n", + " print(\"{}: {}\".format(metric_name, metric_value))" + ] + }, + { + "cell_type": "markdown", + "id": "bce6bafe", + "metadata": {}, + "source": [ + "### Save the Computer Vision Model" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "093905b2", + "metadata": {}, + "outputs": [], + "source": [ + "saved_model_dir = model.export(output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "5621b571", + "metadata": {}, + "source": [ + "## Model 2: Text Classification with PyTorch\n", + "\n", + "### Get the Model and Dataset\n", + "Now we will call the model factory to get a pretrained model from Hugging Face and load the annotation file using the dataset factory. We will use clinical-bert for this part." 
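+    ,"\n",
+    "As with the vision model, the supported text classification models can be listed first if you want to experiment with a different one (the same call used in the other notebooks in this repository):\n",
+    "```\n",
+    "model_factory.print_supported_models(use_case='text_classification', framework='pytorch')\n",
+    "```"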
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d18cebff", + "metadata": {}, + "outputs": [], + "source": [ + "# Set up NLP parameters\n", + "model_name = 'clinical-bert'\n", + "seq_length = 64\n", + "batch_size = 5\n", + "quantization_criterion = 0.05\n", + "quantization_max_trial = 50\n", + "epochs = 3" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d939924f", + "metadata": {}, + "outputs": [], + "source": [ + "model = model_factory.get_model(model_name=model_name, framework='pytorch')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2e9dff00", + "metadata": {}, + "outputs": [], + "source": [ + "# Create a label map function and reverse label map for the dataset\n", + "def label_map_func(label):\n", + " if label == 'Benign':\n", + " return 0\n", + " elif label == 'Malignant':\n", + " return 1\n", + " elif label == 'Normal':\n", + " return 2\n", + " \n", + "reverse_label_map = {0: 'Benign', 1: 'Malignant', 2: 'Normal'}" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "879bad74", + "metadata": {}, + "outputs": [], + "source": [ + "file_dir, file_name = os.path.split(annotation_path)\n", + "dataset = dataset_factory.load_dataset(dataset_dir=file_dir,\n", + " use_case='text_classification',\n", + " framework='pytorch',\n", + " dataset_name='brca',\n", + " csv_file_name=file_name,\n", + " label_map_func=label_map_func,\n", + " class_names=['Benign', 'Malignant', 'Normal'],\n", + " header=True,\n", + " label_col=label_col,\n", + " shuffle_files=True)" + ] + }, + { + "cell_type": "markdown", + "id": "e2b9ddba", + "metadata": {}, + "source": [ + "### Data Preparation" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "b166b757", + "metadata": {}, + "outputs": [], + "source": [ + "dataset.preprocess(model.hub_name, batch_size=batch_size, max_length=seq_length)\n", + "dataset.shuffle_split(train_pct=0.67, val_pct=0.33)" + ] + }, + { + "cell_type": "markdown", + "id": "020303ee", + "metadata": {}, + "source": [ + "### Transfer Learning\n", + "\n", + "This step calls the model's train function with the dataset that was just prepared. The training function will get the pretrained model from HuggingFace and add on a dense layer based on the number of classes in the dataset. The model is then trained using an instance of Hugging Face Trainer for the number of epochs specified. If desired, a native PyTorch loop can be invoked instead of Trainer by setting `use_trainer=False`." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "41fb0612", + "metadata": {}, + "outputs": [], + "source": [ + "history = model.train(dataset, output_dir, epochs=epochs, use_trainer=True)" + ] + }, + { + "cell_type": "markdown", + "id": "de70a029", + "metadata": {}, + "source": [ + "### Save the NLP Model" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ba08847d", + "metadata": {}, + "outputs": [], + "source": [ + "model.export(output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "45752dd6", + "metadata": {}, + "source": [ + "### Int8 Quantization\n", + "\n", + "We can use the [Intel® Extension for Transformers](https://github.com/intel/intel-extension-for-transformers) to quantize the trained model for faster inference. If you want to run this part of the notebook, make sure you have `intel-extension-for-transformers` installed in your environment." 
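+    ,"\n",
+    "A small convenience check (not part of the TLT API) to see whether the package is already present before running the `pip install` cell below:\n",
+    "```\n",
+    "import importlib.util\n",
+    "if importlib.util.find_spec('intel_extension_for_transformers') is None:\n",
+    "    print('intel-extension-for-transformers not found; run the install cell below')\n",
+    "```"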
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "44036b44", + "metadata": {}, + "outputs": [], + "source": [ + "!pip install intel-extension-for-transformers==1.0.1" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ce0687ce", + "metadata": {}, + "outputs": [], + "source": [ + "from intel_extension_for_transformers.optimization.trainer import NLPTrainer\n", + "from intel_extension_for_transformers.optimization import metrics, objectives, OptimizedModel, QuantizationConfig" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f9557a68", + "metadata": {}, + "outputs": [], + "source": [ + "# Set up quantization config\n", + "tune_metric = metrics.Metric(\n", + " name=\"eval_accuracy\",\n", + " greater_is_better=True,\n", + " is_relative=True,\n", + " criterion=quantization_criterion,\n", + " weight_ratio=None,\n", + ")\n", + "\n", + "objective = objectives.Objective(\n", + " name=\"performance\", greater_is_better=True, weight_ratio=None\n", + ")\n", + "\n", + "quantization_config = QuantizationConfig(\n", + " approach=\"PostTrainingDynamic\",\n", + " max_trials=quantization_max_trial,\n", + " metrics=[tune_metric],\n", + " objectives=[objective],\n", + ")\n", + "\n", + "# Set up metrics computation\n", + "def compute_metrics(p: EvalPrediction):\n", + " preds = p.predictions[0] if isinstance(p.predictions, tuple) else p.predictions\n", + " preds = np.argmax(preds, axis=1)\n", + " return {\"accuracy\": (preds == p.label_ids).astype(np.float32).mean().item()}" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f406d6db", + "metadata": {}, + "outputs": [], + "source": [ + "quantizer = NLPTrainer(model=model._model,\n", + " train_dataset=dataset.train_subset,\n", + " eval_dataset=dataset.validation_subset,\n", + " compute_metrics=compute_metrics,\n", + " tokenizer=dataset._tokenizer)\n", + "quantized_model = quantizer.quantize(quant_config=quantization_config)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "56e5f2f5", + "metadata": {}, + "outputs": [], + "source": [ + "results = quantizer.evaluate()\n", + "eval_acc = results.get(\"eval_accuracy\")\n", + "print(\"Final Eval Accuracy: {:.5f}\".format(eval_acc))" + ] + }, + { + "cell_type": "markdown", + "id": "b69df1a0", + "metadata": {}, + "source": [ + "## Citations\n", + "\n", + "### Data Citation\n", + "Khaled R., Helal M., Alfarghaly O., Mokhtar O., Elkorany A., El Kassas H., Fahmy A. Categorized Digital Database for Low energy and Subtracted Contrast Enhanced Spectral Mammography images [Dataset]. (2021) The Cancer Imaging Archive. DOI: [10.7937/29kw-ae92](https://doi.org/10.7937/29kw-ae92)\n", + "\n", + "### Publication Citation\n", + "Khaled, R., Helal, M., Alfarghaly, O., Mokhtar, O., Elkorany, A., El Kassas, H., & Fahmy, A. Categorized contrast enhanced mammography dataset for diagnostic and artificial intelligence research. (2022) Scientific Data, Volume 9, Issue 1. DOI: [10.1038/s41597-022-01238-0](https://doi.org/10.1038/s41597-022-01238-0)\n", + "\n", + "### TCIA Citation\n", + "Clark K, Vendt B, Smith K, Freymann J, Kirby J, Koppel P, Moore S, Phillips S, Maffitt D, Pringle M, Tarbox L, Prior F. The Cancer Imaging Archive (TCIA): Maintaining and Operating a Public Information Repository, Journal of Digital Imaging, Volume 26, Number 6, December, 2013, pp 1045-1057. 
DOI: [10.1007/s10278-013-9622-7](https://doi.org/10.1007/s10278-013-9622-7)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.10" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/e2e_workflows/Remote_Sensing_Image_Scene_Classification.ipynb b/notebooks/e2e_workflows/Remote_Sensing_Image_Scene_Classification.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..7cf0478d3b33209c0a69c4d5c8f109d6a9138e54 --- /dev/null +++ b/notebooks/e2e_workflows/Remote_Sensing_Image_Scene_Classification.ipynb @@ -0,0 +1,427 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "fcfb563d-3f9c-4731-be1f-9c9c4b2c9dfd", + "metadata": { + "tags": [] + }, + "source": [ + "# Remote Sensing Image Scene Classification (Resisc) using TensorFlow and the Intel® Transfer Learning Tool API" + ] + }, + { + "cell_type": "markdown", + "id": "353f2782-043f-4afd-9858-cc773275e6c5", + "metadata": {}, + "source": [ + "This notebook facilitates implementation of remote sensing image scene classification using Transfer Learning Toolkit. It performs Multi-class scene classification on RESISC45 dataset. The workflow uses pretrained SOTA models ( RESNET V1.5) from TF hub and transfers the knowledge from a pretrained domain to a different custom domain achieving required accuracy." + ] + }, + { + "cell_type": "markdown", + "id": "8325300b-4a75-42fb-aa14-2b089b4edea5", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "04e3f113-4887-49c9-aa8b-a3c2058157a4", + "metadata": {}, + "outputs": [], + "source": [ + "import numpy as np\n", + "import os\n", + "import pickle\n", + "import tensorflow as tf\n", + "from sklearn.metrics import classification_report\n", + "\n", + "#tlt imports\n", + "from tlt.datasets import dataset_factory\n", + "from tlt.models import model_factory\n", + "from tlt.utils.types import FrameworkType, UseCaseType\n", + "\n", + "from notebooks.plot_utils import plot_curves\n", + "\n", + "# Specify a directory for the dataset to be downloaded\n", + "dataset_dir = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + "\n", + "# Specify a directory for output\n", + "output_dir = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "print(\"Dataset directory:\", dataset_dir)\n", + "print(\"Output directory:\", output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "a47ea534-0661-4cbe-97ed-ca288b6203e5", + "metadata": {}, + "source": [ + "## 2. Get the model" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "c9548167-cdfd-44ad-be60-cc3d131850a3", + "metadata": {}, + "source": [ + "In this step, we call the Intel Transfer Learning Tool model factory to list supported TensorFlow image classification models. This is a list of pretrained models from TFHub that we tested with our API. 
Optionally, the verbose=True argument can be added to the print_supported_models function call to get more information about each model (such as the link to TFHub, image size, the original dataset, etc)." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "df3c14ab-c4d3-4aa4-bd24-5265ccd7b534", + "metadata": {}, + "outputs": [], + "source": [ + "# See a list of available models\n", + "model_factory.print_supported_models(use_case='image_classification', framework='tensorflow')" + ] + }, + { + "cell_type": "markdown", + "id": "3c06b359-1054-45c5-9223-47d4e1b7772d", + "metadata": {}, + "source": [ + "#### Option A: Load a model\n", + "\n", + "Next, use the model factory to get one of the models listed in the previous cell. The `get_model` function returns a model object that will later be used for training. By default, resnet_v1_50 is used for training." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bf842217-d992-4b6f-99bf-aef475fa13dd", + "metadata": {}, + "outputs": [], + "source": [ + "# Get the model\n", + "model = model_factory.get_model(model_name=\"resnet_v1_50\", framework=\"tensorflow\")" + ] + }, + { + "cell_type": "markdown", + "id": "afa83899-0a99-4c9e-9e3d-00b040fe3e1f", + "metadata": {}, + "source": [ + "#### Option B: Load a pretrained checkpoint\n", + "\n", + "Optionally, to continue training using a pretrained checkpoint, specify the path to the folder containing __saved_model.pb__ in the __model__ parameter.\n", + "\n", + "_Note: The path is the same as saved_model_dir_" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9b49423b-e57d-478c-87b0-7daec6401b76", + "metadata": {}, + "outputs": [], + "source": [ + "#Load a pretrained checkpoint\n", + "model = model_factory.load_model(model_name='resnet_v1_50', \n", + " model='/home/intel/output/resnet_v1_50/1', \n", + " framework='tensorflow', use_case='image_classification')" + ] + }, + { + "cell_type": "markdown", + "id": "ba2e4d10-458b-4479-8d1f-8cc67304d5c2", + "metadata": {}, + "source": [ + "## 3. Get the dataset" + ] + }, + { + "cell_type": "markdown", + "id": "0bff208b-e899-49cc-a4d5-5abab6baa4c9", + "metadata": {}, + "source": [ + "The dataset used for the remote sensing domain is resisc45. More details are available at https://www.tensorflow.org/datasets/catalog/resisc45. \n", + "To download the dataset, follow these steps:\n", + "1. Download the rar file from https://onedrive.live.com/?authkey=%21AHHNaHIlzp%5FIXjs&cid=5C5E061130630A68&id=5C5E061130630A68%21107&parId=5C5E061130630A68%21112&action=locate \n", + "2. Extract the archive\n", + "3. Set custom_dataset_path to point to the extracted resisc folder" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d1840f1a-2a32-4ef7-89b2-d32ee231463b", + "metadata": {}, + "outputs": [], + "source": [ + "# Set the custom_dataset_path to point to your dataset's directory.\n", + "custom_dataset_path = os.path.join(dataset_dir, \"resisc/\")\n", + "\n", + "# Load the dataset from the custom dataset path\n", + "dataset = dataset_factory.load_dataset(dataset_dir=custom_dataset_path,\n", + " use_case='image_classification', \n", + " framework='tensorflow')\n", + "\n", + "print(\"Class names:\", str(dataset.class_names))" + ] + }, + { + "cell_type": "markdown", + "id": "a27d6271-5afa-46b2-aed9-f543c62e1443", + "metadata": {}, + "source": [ + "## 4. 
Prepare the dataset\n", + "\n", + "Once you have your dataset from Option A or Option B above, use the following cells to preprocess the dataset. We resize the images to match the selected model and batch the images, then split them into training, validation, and test subsets. Data augmentation can be applied by specifying the desired augmentations in the __add_aug__ parameter. Supported augmentations are:\n", + "1. hvflip - RandomHorizontalandVerticalFlip\n", + "2. hflip - RandomHorizontalFlip\n", + "3. vflip - RandomVerticalFlip\n", + "4. rotate - RandomRotate\n", + "5. zoom - RandomZoom" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "00d529b1-fe40-482a-b3f0-3875b13ba534", + "metadata": {}, + "outputs": [], + "source": [ + "# Preprocess the dataset with an image size that matches the model and a batch size of 256\n", + "batch_size = 256\n", + "dataset.preprocess(model.image_size, batch_size=batch_size, add_aug=['hvflip', 'rotate', 'zoom'])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1c4af8c6-c418-45d1-b0bc-dd8c7e2625c9", + "metadata": {}, + "outputs": [], + "source": [ + "# Split the dataset into training, validation and test subsets\n", + "dataset.shuffle_split(train_pct=.80, val_pct=.10, test_pct=0.10)" + ] + }, + { + "cell_type": "markdown", + "id": "ab02c7d0-5b63-4be3-b6a6-cdfc03e48995", + "metadata": {}, + "source": [ + "## 5. Transfer Learning" + ] + }, + { + "cell_type": "markdown", + "id": "feeb23c9-66a0-4670-8fd0-f7950dd2832e", + "metadata": {}, + "source": [ + "This step calls the model's train function with the dataset that was just prepared. The training function will get the TFHub feature vector and add on a dense layer based on the number of classes in the dataset. The model is then compiled and trained for the number of epochs specified in the argument. With the do_eval parameter set to True by default, this step will also show how the model can be evaluated and will return a list of metrics calculated from the dataset's validation subset.\n", + "### Arguments\n", + "#### Required\n", + "- **dataset** (ImageClassificationDataset, required): Dataset to use when training the model\n", + "- **output_dir** (str): Path to a writeable directory for checkpoint files\n", + "- **epochs** (int): Number of epochs to train the model (default: 1)\n", + "#### Optional\n", + "- **initial_checkpoints** (str): Path to checkpoint weights to load. If the path provided is a directory, the latest checkpoint will be used.\n", + "- **early_stopping** (bool): Enable early stopping if convergence is reached while training at the end of each epoch. (default: False)\n", + "- **lr_decay** (bool): If lr_decay is True and do_eval is True, learning rate decay on the validation loss is applied at the end of each epoch.\n", + "- **enable_auto_mixed_precision** (bool or None): Enable auto mixed precision for training. Mixed precision uses both 16-bit and 32-bit floating point types to make training run faster and use less memory. It is recommended to enable auto mixed precision training when running on platforms that support bfloat16 (Intel third or fourth generation Xeon processors). If it is enabled on a platform that does not support bfloat16, it can be detrimental to the training performance. 
If enable_auto_mixed_precision is set to None, auto mixed precision will be automatically enabled when running with Intel fourth generation Xeon processors, and disabled for other platforms.\n", + "- **extra_layers** (list[int]): Optionally insert additional dense layers between the base model and output layer. This can help increase accuracy when fine-tuning a TFHub model. The input should be a list of integers representing the number and size of the layers, for example [1024, 512] will insert two dense layers, the first with 1024 neurons and the second with 512 neurons.\n", + "\n", + "Note: refer to release documentation for an up-to-date list of train arguments and their current descriptions" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "fa477dbb-58a9-4e06-9933-047699c35797", + "metadata": {}, + "outputs": [], + "source": [ + "# Mixed precision uses both 16-bit and 32-bit floating point types to make training run faster and use less memory.\n", + "# It is recommended to enable auto mixed precision training when running on platforms that support\n", + "# bfloat16 (Intel third or fourth generation Xeon processors). If it is enabled on a platform that\n", + "# does not support bfloat16, it can be detrimental to the training performance.\n", + "# If enable_auto_mixed_precision is set to None, auto mixed precision will be automatically enabled when\n", + "# running with Intel fourth generation Xeon processors, and disabled for other platforms.\n", + "enable_auto_mixed_precision = None\n", + "\n", + "# Train the model using the dataset\n", + "history = model.train(dataset, output_dir=output_dir, epochs=50, \n", + " enable_auto_mixed_precision=enable_auto_mixed_precision, extra_layers=[1024,512], early_stopping=True)" + ] + }, + { + "cell_type": "markdown", + "id": "40e11437-5666-49c0-9547-22e7696c0ea0", + "metadata": {}, + "source": [ + "## 6. Evaluate" + ] + }, + { + "cell_type": "markdown", + "id": "1d413b5d-ed24-4756-928d-dbb8e7bf1af2", + "metadata": {}, + "source": [ + "The next step shows how the model can be evaluated. The model's evaluate function returns a list of metrics calculated from the dataset's validation subset." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f5bfc8e8-f8c6-4b56-bfc8-51b88288fcdd", + "metadata": {}, + "outputs": [], + "source": [ + "# Evaluate model on validation subset\n", + "val_loss, val_acc = model.evaluate(dataset)\n", + "print(\"Validation Accuracy :\", val_acc)\n", + "print(\"Validation Loss :\", val_loss)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "685f31eb-a32a-4198-afba-782e31ed506a", + "metadata": {}, + "outputs": [], + "source": [ + "plot_curves(history, os.path.join(output_dir, \"{}_checkpoints\".format(model.model_name)))\n", + "pickle.dump(history, open(os.path.join(output_dir, \"{}_checkpoints\".format(model.model_name), 'resisc45_hist.pkl'), 'wb'))" + ] + }, + { + "cell_type": "markdown", + "id": "3c6fd051-97af-4142-b039-482cb742d988", + "metadata": {}, + "source": [ + "## 7. Export" + ] + }, + { + "cell_type": "markdown", + "id": "9225921d-5340-4865-ad4b-a2c19a5210ed", + "metadata": {}, + "source": [ + "Next, we can call the model export function to generate a saved_model.pb. The model is saved in a format that is ready to use with TensorFlow Serving. Each time the model is exported, a new numbered directory is created, which allows serving to pick up the latest model."
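As an optional sanity check on the exported artifact, the SavedModel can be reloaded with plain TensorFlow to confirm that it carries a serving signature. A minimal sketch, assuming `saved_model_dir` is the path returned by the export cell that follows:

```python
import tensorflow as tf

# Reload the exported SavedModel and list its signatures; a model that is
# ready for TensorFlow Serving typically exposes 'serving_default'
loaded = tf.saved_model.load(saved_model_dir)
print(list(loaded.signatures.keys()))
```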
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2c4fc5f8-cb72-4ab5-989b-43d7ad315e8b", + "metadata": {}, + "outputs": [], + "source": [ + "saved_model_dir = model.export(output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "bb29d2b5-31e5-4136-a9d5-9f97d556d4a8", + "metadata": {}, + "source": [ + "## 8. Inference\n", + "To perform only Inference using a saved model, follow the steps below\n", + "1. Execute Step 2(b) to load a pretrained checkpoint with the appropriate model name.\n", + "2. Execute Steps 3 and 4 to load and prepare the dataset.\n", + "3. Continue with the steps below" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ef0819f7-c9fa-4eae-be48-f83a74777002", + "metadata": {}, + "outputs": [], + "source": [ + "history = pickle.load(open(os.path.join(output_dir, \"{}_checkpoints\".format(model.model_name), 'resisc45_hist.pkl'), 'rb'))\n", + "plot_curves(history, os.path.join(output_dir, \"{}_checkpoints\".format(model.model_name)))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "39a5b54a-6781-4496-b29f-55a1ce18d8e4", + "metadata": {}, + "outputs": [], + "source": [ + "loss, accuracy = model.evaluate(dataset, use_test_set=True)\n", + "print('Test accuracy :', accuracy)" + ] + }, + { + "cell_type": "markdown", + "id": "f517d0f1-011c-4704-85fa-fd7d57f8aaa4", + "metadata": {}, + "source": [ + "We get the test subset from our dataset, and use that to call predict on our model." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "295ac0ab-accd-4433-8143-a087e7b218b5", + "metadata": {}, + "outputs": [], + "source": [ + "actual_labels = np.concatenate([y for x, y in dataset._test_subset], axis=0)\n", + "predicted_labels = model.predict(dataset._test_subset)\n", + "report = classification_report(actual_labels, predicted_labels)\n", + "print(\"Classification report\")\n", + "print(report)" + ] + }, + { + "cell_type": "markdown", + "id": "27daa00f-4e83-419c-ba75-38c03a0d2475", + "metadata": {}, + "source": [ + "## Dataset Citations\n", + "\n", + "@article{Cheng_2017,
\n", + " title={Remote Sensing Image Scene Classification: Benchmark and State of the Art},
\n", + " volume={105},
\n", + " ISSN={1558-2256},
\n", + " url={http://dx.doi.org/10.1109/JPROC.2017.2675998},
\n", + " DOI={10.1109/jproc.2017.2675998},
\n", + " number={10},
\n", + " journal={Proceedings of the IEEE},
\n", + " publisher={Institute of Electrical and Electronics Engineers (IEEE)},
\n", + " author={Cheng, Gong and Han, Junwei and Lu, Xiaoqiang},
\n", + " year={2017},
\n", + " month={Oct},
\n", + " pages={1865-1883}
\n", + "}" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.13" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/e2e_workflows/data_utils.py b/notebooks/e2e_workflows/data_utils.py new file mode 100644 index 0000000000000000000000000000000000000000..0975dc57bcc2b18bc8fc31f1fbe92449650c91a0 --- /dev/null +++ b/notebooks/e2e_workflows/data_utils.py @@ -0,0 +1,159 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# +# Copyright (c) 2022 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# +# SPDX-License-Identifier: Apache-2.0 +# + +import os +import shutil +import numpy as np +import pandas as pd +from sklearn.model_selection import train_test_split +from collections import defaultdict + + +def copy_files_src_to_tgt(samples, fns_dict, src_folder, tgt_folder): + for sample in samples: + files_to_copy = fns_dict.get(sample) + for _file in files_to_copy: + src_fn = os.path.join(src_folder, _file) + tgt_fn = os.path.join(tgt_folder, _file) + shutil.copy2(src_fn, tgt_fn) + + +def split_images(src_folder, tgt_folder): + labels = os.listdir(src_folder) + print("Number of labels = ", len(labels)) + print("Labels are: \n", labels) + for label in labels: + fns = os.listdir(os.path.join(src_folder, label)) + fns.sort() + fns_root = ['_'.join(x.split('_')[:2]) for x in fns] + # Convert list of tuples to dictionary value lists + print("\nCreating default dict for stratifying the subject in {}.".format(label)) + fns_dict = defaultdict(list) + for i, j in zip(fns_root, fns): + fns_dict[i].append(j) + train_samples, test_samples = train_test_split(list(fns_dict.keys()), test_size=0.2, random_state=100) + + src_dir = os.path.join(src_folder, label) + tgt_dir = os.path.join(tgt_folder, 'train', label) + os.makedirs(tgt_dir, exist_ok=True) + copy_files_src_to_tgt(train_samples, fns_dict, src_dir, tgt_dir) + + tgt_dir = os.path.join(tgt_folder, 'test', label) + os.makedirs(tgt_dir, exist_ok=True) + copy_files_src_to_tgt(test_samples, fns_dict, src_dir, tgt_dir) + + print("Done splitting the files for label = {}\n".format(label)) + print("Done splitting the data. 
Output data is here: ", tgt_folder) + + +def get_subject_id(image_name): + image_name = image_name.split("/")[-1] + patient_id = "".join(image_name.split("_")[:2])[1:] + return patient_id + + +def create_patient_id_list(image_data_folder, folder): + folder_pth = os.path.join(folder, image_data_folder) + patient_id_list = [] + for fldr in os.listdir(folder_pth): + for f in os.listdir(os.path.join(folder_pth, fldr)): + patient_id_list.append(get_subject_id(f)) + + return np.unique(patient_id_list) + + +def read_annotation_file( + folder, + file_name, + label_column, + data_column, + patient_id, + patient_id_list, + image_data_folder +): + df_path = os.path.join(folder, file_name) + df = pd.read_csv(df_path) + label_map, reverse_label_map = label2map(df, label_column) + + if patient_id_list is not None: + df = df[df[patient_id].isin(patient_id_list)] + else: + image_name_list = [] + for label in os.listdir(image_data_folder): + image_name_list.extend(os.listdir(os.path.join(image_data_folder, label))) + df = df[df[patient_id].isin(np.unique([get_subject_id(i) for i in image_name_list]))] + + df_new = pd.DataFrame(columns=[label_column, data_column, patient_id]) + for i in df[patient_id].unique(): + annotation = " ".join(df[df[patient_id].isin([i])][data_column].to_list()) + temp_labels = df[df[patient_id] == i][label_column].unique() + if len(temp_labels) == 1: + df_new.loc[len(df_new)] = [temp_labels[0], annotation, i] + else: + if patient_id_list is not None: + # this is the case only shows for inference + # label assigne as a place holder + df_new.loc[len(df_new)] = ["Normal", annotation, i] + else: + Warning("Conflict in labelling ....") + + return df_new, label_map, reverse_label_map + + +def label2map(df, label_column): + label_map, reverse_label_map = {}, {} + for i, v in enumerate(df[label_column].unique().tolist()): + label_map[v] = i + reverse_label_map[i] = v + + return label_map, reverse_label_map + + +def create_train_test_set(df, patient_id, patient_id_list): + train_label, test_label = train_test_split( + patient_id_list, test_size=0.33, random_state=42 + ) + + df_test = df[df[patient_id].isin(test_label)] + df_train = df[df[patient_id].isin(train_label)] + + return df_train, df_test + + +def split_annotation(folder, file_name, image_data_folder): + label_column = "label" + data_column = "symptoms" + patient_id = "Patient_ID" + patient_id_list = None + + df, label_map, reverse_label_map = read_annotation_file( + folder, + file_name, + label_column, + data_column, + patient_id, + patient_id_list, + image_data_folder + ) + + patient_id_list = create_patient_id_list(image_data_folder, folder) + df_train, df_test = create_train_test_set(df, patient_id, patient_id_list) + + return df_train diff --git a/notebooks/image_anomaly_detection/tlt_api_pyt_anomaly_detection/Anomaly_Detection.ipynb b/notebooks/image_anomaly_detection/tlt_api_pyt_anomaly_detection/Anomaly_Detection.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..f8e386ca307e05187a63cca15088285bbffd3be0 --- /dev/null +++ b/notebooks/image_anomaly_detection/tlt_api_pyt_anomaly_detection/Anomaly_Detection.ipynb @@ -0,0 +1,558 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "3405d28d", + "metadata": {}, + "source": [ + "# Image Anomaly Detection with PyTorch using
Intel® Transfer Learning Tool\n", + "\n", + "This notebook demonstrates anomaly detection using the Intel Transfer Learning Toolkit. It performs defect analysis with the MVTec dataset using PyTorch. The workflow uses a pretrained ResNet50 v1.5 model from torchvision." + ] + }, + { + "cell_type": "markdown", + "id": "1d61b7ac", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions to setup a PyTorch environment with all the dependencies required to run the notebook." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a0bf9fd0", + "metadata": {}, + "outputs": [], + "source": [ + "import matplotlib.pyplot as plt\n", + "import numpy as np\n", + "import os\n", + "import pandas as pd\n", + "import PIL.Image as Image\n", + "import torch, torchvision\n", + "from torchvision.transforms.functional import InterpolationMode\n", + "import requests\n", + "from io import BytesIO\n", + "\n", + "# tlt imports\n", + "from tlt.datasets import dataset_factory\n", + "from tlt.models import model_factory\n", + "from tlt.utils.file_utils import download_and_extract_tar_file, download_file\n", + "\n", + "# Specify a directory for the dataset to be downloaded\n", + "dataset_dir = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + " \n", + "# Specify a directory for output\n", + "output_dir = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "print(\"Dataset directory:\", dataset_dir)\n", + "print(\"Output directory:\", output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "8f1fc78c", + "metadata": {}, + "source": [ + "## 2. Get or load the model\n", + "\n", + "In this step, we use the model factory to get the desired model. The `get_model` function returns a pretrained model object from a public model hub, while the `load_model` function loads a pretrained model from a checkpoint on your local disk or in memory.\n", + "\n", + "Here we are getting the pretrained `resnet50` model from Torchvision:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ad4aeafd", + "metadata": {}, + "outputs": [], + "source": [ + "model = model_factory.get_model(model_name=\"resnet50\", framework=\"pytorch\", use_case='anomaly_detection')" + ] + }, + { + "cell_type": "markdown", + "id": "9d087ee7", + "metadata": {}, + "source": [ + "To load a previously trained model from a file, use this:\n", + "```\n", + "model = model_factory.load_model(model_name=\"resnet50\", model=, framework=\"pytorch\", \n", + " use_case='anomaly_detection')\n", + "```" + ] + }, + { + "cell_type": "markdown", + "id": "dabd4183", + "metadata": {}, + "source": [ + "## 3. Get the dataset" + ] + }, + { + "cell_type": "markdown", + "id": "2d314ba0", + "metadata": {}, + "source": [ + "To use [MVTec](https://www.mvtec.com/company/research/datasets/mvtec-ad) or your own image dataset for anomaly detection, your image files (`.jpg` or `.png`) should be arranged in one of two ways. 
\n", + "\n", + "### Method 1: Category Folders\n", + "\n", + "Arrange them in folders in the root dataset directory like this:\n", + "\n", + "```\n", + "hazelnut\n", + " └── crack\n", + " └── cut\n", + " └── good\n", + " └── hole\n", + " └── print\n", + "```\n", + "\n", + "IMPORTANT: There must be a subfolder named `good` and at least one other folder of defective examples. It does not matter what the names of the other folders are or how many there, as long as there is at least one. This would also be an acceptable Method 1 layout:\n", + "\n", + "```\n", + "toothbrush\n", + " └── defective\n", + " └── good\n", + "```\n", + "\n", + "TLT will encode all of the non-good images as \"bad\" and use the \"good\" images in the training set and a mix of good and bad images in the validation set.\n", + "\n", + "### Method 2: Train & Test Folders with Category Subfolders\n", + "\n", + "Arrange them in folders in the root dataset directory like this:\n", + "\n", + "```\n", + "hazelnut\n", + " └── train\n", + " └── good\n", + " └── test\n", + " └── crack\n", + " └── cut\n", + " └── good\n", + " └── hole\n", + " └── print\n", + "```\n", + "\n", + "When using this layout, TLT will use the exact defined split for train and validation subsets unless you use the `shuffle_split` method to re-shuffle and split up the \"good\" images with certain percentages. " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "64b24c5b-9b48-4041-a6a2-7c438ca3a0c5", + "metadata": {}, + "outputs": [], + "source": [ + "img_dir = os.path.join(dataset_dir, 'hazelnut')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "357f3dfd", + "metadata": {}, + "outputs": [], + "source": [ + "dataset = dataset_factory.load_dataset(img_dir, \n", + " use_case='image_anomaly_detection', \n", + " framework=\"pytorch\")\n", + "\n", + "print(dataset._dataset)\n", + "print(\"Class names:\", str(dataset.class_names))\n", + "print(\"Defect names:\", dataset.defect_names)" + ] + }, + { + "cell_type": "markdown", + "id": "2200ef4e", + "metadata": {}, + "source": [ + "Note: The defects argument can be used to filter the validation set to use only a subset of defect types. For example:\n", + "```\n", + "dataset = dataset_factory.load_dataset(img_dir, \n", + " use_case='image_anomaly_detection', \n", + " framework=\"pytorch\",\n", + " defects=['crack', 'hole'])\n", + "```" + ] + }, + { + "cell_type": "markdown", + "id": "99f23249", + "metadata": {}, + "source": [ + "## 4. Prepare the dataset\n", + "Once you have your dataset, use the following cells to split and preprocess the data. We split them into training and test subsets, then resize the images to match the selected model, and then batch the images. Pass in optional arguments to customize the [Resize](https://pytorch.org/vision/main/generated/torchvision.transforms.Resize.html) or [Normalize](https://pytorch.org/vision/main/generated/torchvision.transforms.Normalize.html) transforms.\n", + "Data augmentation can be applied to the training set by specifying the augmentations to be applied in the `add_aug` parameter. Supported augmentations are given below:\n", + "1. hflip - RandomHorizontalFlip\n", + "2. 
rotate - RandomRotate" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "dd91fbcf", + "metadata": {}, + "outputs": [], + "source": [ + "# If using Method 1 layout, split the dataset into training and test subsets.\n", + "if dataset._validation_type is None:\n", + " dataset.shuffle_split(train_pct=.75, val_pct=0.0, test_pct=0.25)" + ] + }, + { + "cell_type": "markdown", + "id": "4fbe27a3-1b1e-4add-9725-28bceb62c474", + "metadata": {}, + "source": [ + "For the __cutpaste__ feature extractor, cutpaste_type can be specified in the dataset.preprocess() method as follows. The options available are _normal_, _scar_, _3way_ and _union_. The default is _normal_.\n", + "```\n", + "dataset.preprocess(224, batch_size=batch_size, interpolation=InterpolationMode.LANCZOS, cutpaste_type='normal')\n", + "```" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e7c95a70", + "metadata": {}, + "outputs": [], + "source": [ + "# Preprocess with an image size that matches the model, a batch size of 64, and the desired interpolation method\n", + "batch_size = 64\n", + "cutpaste_type = 'normal'\n", + "dataset.preprocess(image_size=224, batch_size=batch_size, interpolation=InterpolationMode.LANCZOS, cutpaste_type=cutpaste_type)" + ] + }, + { + "cell_type": "markdown", + "id": "3704772b", + "metadata": {}, + "source": [ + "## 5. Visualize samples from the dataset\n", + "\n", + "We get a single batch from our training and test subsets and visualize the images as a sanity check." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cd6782b0", + "metadata": {}, + "outputs": [], + "source": [ + "def plot_images(images, labels, sup_title, predictions=None):\n", + " plt.figure(figsize=(18,14))\n", + " plt.subplots_adjust(hspace=0.5)\n", + " for n in range(min(batch_size, 30)):\n", + " plt.subplot(6,5,n+1)\n", + " inp = images[n]\n", + " inp = inp.numpy().transpose((1, 2, 0))\n", + " mean = np.array([0.485, 0.456, 0.406])\n", + " std = np.array([0.229, 0.224, 0.225])\n", + " inp = std * inp + mean\n", + " inp = np.clip(inp, 0, 1)\n", + " plt.imshow(inp)\n", + " if predictions:\n", + " correct_prediction = labels[n] == predictions[n]\n", + " color = \"darkgreen\" if correct_prediction else \"crimson\"\n", + " title = \"{}\".format(predictions[n])\n", + " else:\n", + " good_sample = labels[n] == 'good'\n", + " color = \"darkgreen\" if good_sample else (\"crimson\" if labels[n] == 'bad' else \"black\")\n", + " title = labels[n]\n", + " plt.title(title, fontsize=14, color=color)\n", + " plt.axis('off')\n", + " _ = plt.suptitle(sup_title, fontsize=20)\n", + " plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ffcd2071", + "metadata": {}, + "outputs": [], + "source": [ + "# Plot some images from the training set\n", + "images, labels = dataset.get_batch()\n", + "labels = [dataset.class_names[id] for id in labels]\n", + "plot_images(images, labels, 'Training Samples')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d37b808f", + "metadata": {}, + "outputs": [], + "source": [ + "# Plot some images from the test set\n", + "images, labels = dataset.get_batch(subset='test')\n", + "labels = [dataset.class_names[id] for id in labels]\n", + "plot_images(images, labels, 'Test Samples')" + ] + }, + { + "cell_type": "markdown", + "id": "a49ec7b7", + "metadata": {}, + "source": [ + "## 6. 
Training and Evaluation\n", + "\n", + "This step calls the model's train function with the dataset that was just prepared. The training function will get the torchvision feature extractor for the user's desired layer and extract features from the training set. The extracted features are used to perform a [principal component analysis](https://scikit-learn.org/stable/modules/generated/sklearn.decomposition.PCA.html). The model's evaluate function returns the AUROC metric ([area under](https://scikit-learn.org/stable/modules/generated/sklearn.metrics.auc.html) the [roc curve](https://scikit-learn.org/stable/modules/generated/sklearn.metrics.roc_curve.html)) calculated from the dataset's test subset." + ] + }, + { + "cell_type": "markdown", + "id": "ab510f51", + "metadata": {}, + "source": [ + "### Train Arguments\n", + "\n", + "#### Required\n", + "- **dataset** (ImageAnomalyDetectionDataset, required): Dataset to use when training the model\n", + "- **output_dir** (str): Path to a writeable directory\n", + "\n", + "#### Optional\n", + "- **generate_checkpoints** (bool): Whether to save/preserve the best weights during SimSiam training (default: True)\n", + "- **initial_checkpoints** (str): The path to a starting weights file\n", + "- **layer_name** (str): The layer name whose output is desired for the extracted features\n", + "- **pooling** (str): Pooling to be applied on the extracted layer ('avg' or 'max') (default: 'avg')\n", + "- **kernel_size** (int): Kernel size in the pooling layer (default: 2)\n", + "- **pca_threshold** (float): Threshold to apply to PCA model (default: 0.99)\n", + "\n", + "Note: refer to release documentation for an up-to-date list of train arguments and their current descriptions" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8cd9420d", + "metadata": {}, + "outputs": [], + "source": [ + "# Examine the model's layers and decide which to use for feature extraction\n", + "model.list_layers(verbose=False)\n", + "layer = 'layer3'" + ] + }, + { + "cell_type": "markdown", + "id": "b19be956-e3c6-4d9d-847d-779c1c35da38", + "metadata": {}, + "source": [ + "## Feature Extraction\n", + "There are three feature extractor options available within the `model.train()` function.\n", + "1. __No fine-tuning__ - To use a pretrained ResNet50/ResNet18 model for feature extraction, simply do not change the default `simsiam=False` input argument.\n", + "2. [__SimSiam__](https://arxiv.org/abs/2011.10566) - A self-supervised neural network based on Siamese networks. It learns a meaningful representation of dataset without using any labels. If selected, SimSiam generates quality features that can help differentiate between regular and anomaly images in a given context. SimSiam produces two different augmented images from one underlying image. The end goal is to train the network to produce the same features for both images. It takes a ResNet model as the backbone and fine-tunes the model on the augmented dataset to get a better feature embedding. To use this feature extractor, download the SimSiam weights based on ResNet50 - https://dl.fbaipublicfiles.com/simsiam/models/100ep-256bs/pretrain/checkpoint_0099.pth.tar - set `simsiam=True`, and set `initial_checkpoints` to the path of the downloaded checkpoints in the `model.train()` function.\n", + "3. 
[__Cut-paste__](https://arxiv.org/abs/2104.04015#) - A self-supervised method for anomaly detection and localization that takes a ResNet50/ResNet18 model as the backbone and fine-tunes it on the custom dataset to get a better feature embedding. It relies on a data augmentation strategy that cuts an image patch and pastes it at a random location in the image, creating synthetic defects. To use this feature extractor, set `cutpaste=True` in the `model.train()` function.\n", + "\n", + "\n", + "### Optional: The SimSiam TwoCropTransform\n", + "To train a SimSiam model, a TwoCropTransform augmentation technique must be applied to the dataset used for training. You can preview this augmentation on a sample batch after preprocessing by using `get_batch(simsiam=True)`, and then enable it during training by passing `simsiam=True` to `model.train()`." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "6b49522f", + "metadata": {}, + "outputs": [], + "source": [ + "# Get a batch of training data with the simsiam transform applied to it\n", + "simsiam_images, _ = dataset.get_batch(simsiam=True)\n", + "\n", + "# Plot the \"A\" samples showing the first set of augmented images\n", + "plot_images(simsiam_images[0], ['{}A'.format(i) for i in range(batch_size)], 'SimSiam \"A\" Samples')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a5da06df", + "metadata": {}, + "outputs": [], + "source": [ + "# Now plot the \"B\" samples showing the second set of augmented images based on the same underlying originals\n", + "plot_images(simsiam_images[1], ['{}B'.format(i) for i in range(batch_size)], 'SimSiam \"B\" Samples')" + ] + }, + { + "cell_type": "markdown", + "id": "ace7d296-74d9-47c1-aeaf-386433bac411", + "metadata": {}, + "source": [ + "### Optional: The Cut-paste Transforms\n", + "To train a model with cut-paste, one of the four augmentations - __CutPasteNormal, CutPasteScar, CutPaste3Way, CutPasteUnion__ - must be applied to the dataset used for training. You can preview this augmentation on a sample batch after preprocessing by using `get_batch(cutpaste=True)`, and then enable it during training by passing `cutpaste=True` to `model.train()`."
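For intuition about what these transforms do, the core cut-paste idea fits in a few lines of plain PIL. This is an illustrative toy only, not the tool's implementation (which follows the CutPaste paper linked above):

```python
import random
from PIL import Image

def toy_cutpaste(img: Image.Image) -> Image.Image:
    # Cut a random patch from the image and paste it back at a random
    # location, creating a synthetic "defect" for self-supervised training
    w, h = img.size
    pw = random.randint(max(1, w // 10), max(1, w // 4))
    ph = random.randint(max(1, h // 10), max(1, h // 4))
    sx, sy = random.randint(0, w - pw), random.randint(0, h - ph)  # source patch
    patch = img.crop((sx, sy, sx + pw, sy + ph))
    tx, ty = random.randint(0, w - pw), random.randint(0, h - ph)  # paste target
    out = img.copy()
    out.paste(patch, (tx, ty))
    return out
```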
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "21cbadd5-8387-4130-b5b4-e016d4ea4e5e", + "metadata": {}, + "outputs": [], + "source": [ + "# Get a batch of training data with the cutpaste transform applied to it\n", + "cutpaste_images, _ = dataset.get_batch(cutpaste=True)\n", + "\n", + "# Plot the \"A\" samples showing the first set of augmented images\n", + "plot_images(cutpaste_images[1], ['{}A'.format(i) for i in range(batch_size)], 'CutPaste \"A\" Samples')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "750bc599-80e4-4e70-8aaf-5f63082b9198", + "metadata": {}, + "outputs": [], + "source": [ + "if cutpaste_type == '3way':\n", + " # Now plot the \"B\" samples showing the third set of augmented images based on the same underlying originals\n", + " plot_images(cutpaste_images[2], ['{}B'.format(i) for i in range(batch_size)], 'CutPaste \"B\" Samples')" + ] + }, + { + "cell_type": "markdown", + "id": "a2ba878d-1b03-4f7c-8f5a-6507ee1494a9", + "metadata": {}, + "source": [ + "There is no fine-tuning being demonstrated here, but you can use `simsiam` or `cutpaste` if desired.\n", + "\n", + "To use simsiam, set `simsiam=True` and pass the checkpoint file to `model.train()` as follows\n", + "```\n", + "pca_components, trained_model = model.train(dataset, output_dir, epochs=2, feature_dim=1000,\n", + " pred_dim=250, initial_checkpoints=,\n", + " pooling='avg', kernel_size=2, pca_threshold=0.99, simsiam=True,\n", + " generate_checkpoints=False, precision='float32')\n", + "```\n", + "\n", + "To use cutpaste, set `cutpaste=True`. Optionally, to load a pretrained checkpoint pass the checkpoint file to `model.train()` as follows.\n", + "```\n", + "pca_components, trained_model = model.train(dataset, output_dir, optim='sgd', epochs=2, freeze_resnet=20,\n", + " head_layer=2, cutpaste_type='normal', initial_checkpoints=,\n", + " pooling='avg', kernel_size=2, pca_threshold=0.99, cutpaste=True,\n", + " generate_checkpoints=False, precision='float32')\n", + "```" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a2b601fc", + "metadata": {}, + "outputs": [], + "source": [ + "pca_components, trained_model = model.train(dataset, output_dir, layer_name=layer, epochs=2,\n", + " seed=None, pooling='avg', kernel_size=2, pca_threshold=0.99,\n", + " precision='float32')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "6f60192d", + "metadata": {}, + "outputs": [], + "source": [ + "threshold, auroc = model.evaluate(dataset, pca_components, use_test_set=True)" + ] + }, + { + "cell_type": "markdown", + "id": "3cb8fc62", + "metadata": {}, + "source": [ + "## 7. Predict\n", + "\n", + "Using the same batch of test samples from above, get and view the model's predictions." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1f7ffe59", + "metadata": {}, + "outputs": [], + "source": [ + "predictions = model.predict(images, pca_components, return_type='class', threshold=threshold)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a40d0670", + "metadata": {}, + "outputs": [], + "source": [ + "plot_images(images, labels, 'Predictions', predictions=predictions)\n", + "print(\"Correct predictions are shown in green\")\n", + "print(\"Incorrect predictions are shown in red\")\n", + "\n", + "accuracy = sum([1 if p==labels[i] else 0 for i, p in enumerate(predictions)])/len(predictions)\n", + "print(\"Accuracy: {}\".format(accuracy))" + ] + }, + { + "cell_type": "markdown", + "id": "0a877f33", + "metadata": {}, + "source": [ + "## 8. Export" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "abc054ff", + "metadata": {}, + "outputs": [], + "source": [ + "model.export(os.path.join(output_dir, 'anomaly'))" + ] + }, + { + "cell_type": "markdown", + "id": "0947915a", + "metadata": {}, + "source": [ + "## Dataset Citations\n", + "\n", + "Paul Bergmann, Kilian Batzner, Michael Fauser, David Sattlegger, Carsten Steger: The MVTec Anomaly Detection Dataset: A Comprehensive Real-World Dataset for Unsupervised Anomaly Detection; in: International Journal of Computer Vision 129(4):1038-1059, 2021, DOI: 10.1007/s11263-020-01400-4.\n", + "\n", + "Paul Bergmann, Michael Fauser, David Sattlegger, Carsten Steger: MVTec AD — A Comprehensive Real-World Dataset for Unsupervised Anomaly Detection; in: IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR), 9584-9592, 2019, DOI: 10.1109/CVPR.2019.00982." + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.13" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/image_classification/pytorch_image_classification/PyTorch_Image_Classification_Transfer_Learning.ipynb b/notebooks/image_classification/pytorch_image_classification/PyTorch_Image_Classification_Transfer_Learning.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..e99ec5a6b2799fe0f81bdde5bf402154882e8132 --- /dev/null +++ b/notebooks/image_classification/pytorch_image_classification/PyTorch_Image_Classification_Transfer_Learning.ipynb @@ -0,0 +1,640 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "id": "67b1e912", + "metadata": {}, + "source": [ + "# Transfer Learning for Image Classification\n", + "\n", + "This notebook uses image classification models from [Torchvision](https://pytorch.org/vision/stable/index.html) that were originally trained using [ImageNet](https://image-net.org/) and does transfer learning with a Torchvision dataset or your own raw images.\n", + "\n", + "The notebook performs the following steps:\n", + "1. [Import dependencies and setup parameters](#1.-Import-dependencies-and-setup-parameters)\n", + "2. [Prepare the dataset](#2.-Prepare-the-dataset)\n", + "3. [Predict using the original model](#3.-Predict-using-the-original-model)\n", + "4. [Transfer learning](#4.-Transfer-learning)\n", + "5. [Visualize the model output](#5.-Visualize-the-model-output)\n", + "6. 
[Export the saved model](#6.-Export-the-saved-model)" + ] + }, + { + "cell_type": "markdown", + "id": "939a7f98", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions in the [README.md](/notebooks/README.md) to set up a PyTorch environment with all the dependencies required to run the notebook." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "25f98c12", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "import time\n", + "import math\n", + "import numpy as np\n", + "import pandas as pd\n", + "import torch\n", + "import torchvision\n", + "from torchvision import datasets, models, transforms\n", + "from PIL import Image\n", + "from pydoc import locate\n", + "import warnings\n", + "\n", + "import intel_extension_for_pytorch as ipex\n", + "import matplotlib.pyplot as plt\n", + "\n", + "from tlt.utils.file_utils import download_and_extract_tar_file, download_file\n", + "from model_utils import torchvision_model_map, get_retrainable_model\n", + "\n", + "warnings.filterwarnings(\"ignore\")\n", + "\n", + "print('Supported models:')\n", + "print('\\n'.join(torchvision_model_map.keys()))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e42b6e79", + "metadata": {}, + "outputs": [], + "source": [ + "# Specify a model from the list above\n", + "model_name = \"efficientnet_b0\"\n", + "\n", + "# Specify the parent directory for the custom or Torchvision dataset\n", + "dataset_directory = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + " \n", + "# Specify a directory for output\n", + "output_directory = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "# Batch size\n", + "batch_size = 32\n", + "\n", + "print(\"Dataset directory:\", dataset_directory)\n", + "print(\"Output directory:\", output_directory)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "00f85b73", + "metadata": {}, + "outputs": [], + "source": [ + "if model_name not in torchvision_model_map.keys():\n", + " raise ValueError(\"The specified model_name ({}) is invalid. Please select from: {}\".\n", + " format(model_name, torchvision_model_map.keys()))\n", + " \n", + "print(\"Pretrained Image Classification Model:\", model_name) " + ] + }, + { + "cell_type": "markdown", + "id": "1aaecdff", + "metadata": {}, + "source": [ + "## 2. Prepare the dataset" + ] + }, + { + "cell_type": "markdown", + "id": "98db4b34", + "metadata": {}, + "source": [ + "Define transforms for data resizing and augmentation. The normalization means and standard deviations `[0.485, 0.456, 0.406], [0.229, 0.224, 0.225]` are specific to torchvision image classification models and are explained in the [documentation](https://pytorch.org/vision/stable/models.html#classification)."
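To make the normalization concrete (and to explain why the plotting cells later undo it with `std * inp + mean`), here is the per-channel arithmetic on a single example pixel; the pixel values are illustrative:

```python
import numpy as np

mean = np.array([0.485, 0.456, 0.406])
std = np.array([0.229, 0.224, 0.225])

pixel = np.array([0.6, 0.5, 0.4])     # an RGB value in [0, 1] after ToTensor
normalized = (pixel - mean) / std     # what T.Normalize computes per channel
restored = std * normalized + mean    # the inverse used when plotting images
print(normalized, restored)           # restored matches the original pixel
```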
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "429a90ea", + "metadata": {}, + "outputs": [], + "source": [ + "# Preprocessing transforms\n", + "import torchvision.transforms as T\n", + "\n", + "def get_transform(train):\n", + " transforms = []\n", + " transforms.append(T.Resize([256, 256]))\n", + " if train:\n", + " transforms.append(T.RandomHorizontalFlip())\n", + " transforms.append(T.ToTensor())\n", + " transforms.append(T.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]))\n", + " \n", + " return T.Compose(transforms)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "7cd4df40", + "metadata": {}, + "source": [ + "### Option A: Use a Torchvision dataset" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "f0b814cb", + "metadata": {}, + "source": [ + "To use a Torchvision dataset, load from the Torchvision.datasets library, applying transforms for image augmentation, normalization, and resizing. This example uses the Food101 dataset from the [Torchvision datasets for image classification](https://pytorch.org/vision/stable/datasets.html#image-classification), but you can choose from a variety of options. If the dataset is not found in the dataset directory it is downloaded. Subsequent runs will reuse the already downloaded dataset.\n", + "\n", + "Note: Some Torchvision datasets use a `train=True/False` argument and others have a `split=\"train\"/\"test\"` convention. See the Torchvision documentation to see how to specify the subset you want to use." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "537d83e1", + "metadata": {}, + "outputs": [], + "source": [ + "dataset = torchvision.datasets.Food101(dataset_directory, split='train',\n", + " transform=get_transform(True), download=True)\n", + "dataset_test = torchvision.datasets.Food101(dataset_directory, split='test',\n", + " transform=get_transform(False), download=True) \n", + "class_names = dataset.classes\n", + "\n", + "print('Training data size: {}'.format(len(dataset)))\n", + "print('Validation data size: {}'.format(len(dataset_test)))" + ] + }, + { + "cell_type": "markdown", + "id": "93bb716b", + "metadata": {}, + "source": [ + "Now skip ahead to the [Predict using the original model](#3.-Predict-using-the-original-model) section." + ] + }, + { + "cell_type": "markdown", + "id": "43f9656f", + "metadata": {}, + "source": [ + "### Option B: Use a downloaded or custom dataset" + ] + }, + { + "cell_type": "markdown", + "id": "f235fa0f", + "metadata": {}, + "source": [ + "To use your own image dataset for transfer learning with the rest of this notebook, format your images as `.jpg` files and save them in folders named after the classes that you want the model to predict. To provide a working example using the correct layout, we will download and extract a flower species dataset. After downloading and extracting, you will have the following subdirectories in your dataset directory. Each species subfolder will contain numerous `.jpg` files:\n", + "\n", + "```\n", + "dataset_directory\n", + "└── flower_photos\n", + " └── daisy\n", + " └── dandelion\n", + " └── roses\n", + " └── sunflowers\n", + " └── tulips\n", + "```\n", + "\n", + "Use this as an example to organize your own image files accordingly." 
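After the cells below have downloaded the example set and defined `dataset_subdir`, a quick per-class file count is a useful check that the layout is correct. A minimal sketch:

```python
# Run after dataset_subdir exists and is populated (see the cells below)
for class_name in sorted(os.listdir(dataset_subdir)):
    class_path = os.path.join(dataset_subdir, class_name)
    if os.path.isdir(class_path):
        print("{}: {} images".format(class_name, len(os.listdir(class_path))))
```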
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "29105a9e", + "metadata": {}, + "outputs": [], + "source": [ + "# When you have your own properly organized subdirectory of images, adjust this variable\n", + "dataset_subdir = os.path.join(dataset_directory, \"flower_photos\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "13e96b9e", + "metadata": {}, + "outputs": [], + "source": [ + "# Only run this if you want to use the example flowers dataset\n", + "if not os.path.exists(dataset_subdir):\n", + " os.makedirs(dataset_subdir)\n", + " dataset_url = \"https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz\"\n", + " \n", + " # Download and extract the tar\n", + " download_and_extract_tar_file(dataset_url, dataset_directory)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a5482b8a", + "metadata": {}, + "outputs": [], + "source": [ + "dataset = datasets.ImageFolder(dataset_subdir, get_transform(True))\n", + "dataset_test = datasets.ImageFolder(dataset_subdir, get_transform(False))\n", + "class_names = dataset.classes" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e791a208", + "metadata": {}, + "outputs": [], + "source": [ + "# Use 75% of the images for training and the remaining 25% for validation\n", + "indices = torch.randperm(len(dataset)).tolist()\n", + "num_training_samples = math.floor(len(dataset)*.75)\n", + "\n", + "# The validation subset comes from the copy with the evaluation transforms,\n", + "# and the two index ranges do not overlap\n", + "dataset_test = torch.utils.data.Subset(dataset_test, indices[num_training_samples:])\n", + "dataset = torch.utils.data.Subset(dataset, indices[:num_training_samples]) " + ] + }, + { + "cell_type": "markdown", + "id": "dbc2c043", + "metadata": {}, + "source": [ + "## 3. Predict using the original model" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a89f78d4", + "metadata": {}, + "outputs": [], + "source": [ + "# Create a data loader just for visualization\n", + "data_loader = torch.utils.data.DataLoader(dataset, batch_size=30,\n", + " shuffle=True, num_workers=4)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "be4fa7fe", + "metadata": {}, + "outputs": [], + "source": [ + "# Get the ImageNet labels for displaying with the predictions\n", + "imagenet_classes = []\n", + "labels_file_url = 'https://storage.googleapis.com/download.tensorflow.org/data/ImageNetLabels.txt'\n", + "labels_file_path = os.path.join(dataset_directory, os.path.basename(labels_file_url))\n", + "# Download the labels file if the local copy does not exist yet\n", + "if not os.path.exists(labels_file_path):\n", + " download_file(labels_file_url, dataset_directory)\n", + "\n", + "with open(labels_file_path) as f:\n", + " imagenet_labels = f.readlines()\n", + " imagenet_classes = [l.strip() for l in imagenet_labels]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7444f838", + "metadata": {}, + "outputs": [], + "source": [ + "# Get the pretrained torchvision model\n", + "pretrained_model_class = locate('torchvision.models.{}'.format(model_name))\n", + "model = pretrained_model_class(pretrained=True)\n", + "\n", + "# Get a batch of training data\n", + "inputs, classes = next(iter(data_loader))\n", + "\n", + "# Get predictions from the pretrained model\n", + "model.eval()\n", + "outputs = model(inputs)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0e893dcf", + "metadata": {}, + "outputs": [], + "source": [ + "# List of the actual labels for this batch\n", + "actual_label_batch = [class_names[int(id)] for id in classes]\n", + "\n", + "# List of the predicted labels for this batch\n", + 
"_, predicted_id = torch.max(outputs, 1)\n", + "predicted_label_batch = [imagenet_classes[id] for id in predicted_id]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bfb66dc7", + "metadata": {}, + "outputs": [], + "source": [ + "# Create a results table to list out the ImageNet class prediction vs the actual dataset label\n", + "results_table = []\n", + "for prediction, actual in zip(predicted_label_batch, actual_label_batch):\n", + " results_table.append([prediction, actual])\n", + "\n", + "pd.DataFrame(results_table, columns=[\"ImageNet Prediction\", \"Actual Label\"])" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1d9409af", + "metadata": {}, + "outputs": [], + "source": [ + "plt.figure(figsize=(10,9))\n", + "plt.subplots_adjust(hspace=0.5)\n", + "for n in range(30):\n", + " plt.subplot(6,5,n+1)\n", + " inp = inputs[n]\n", + " inp = inp.numpy().transpose((1, 2, 0))\n", + " mean = np.array([0.485, 0.456, 0.406])\n", + " std = np.array([0.229, 0.224, 0.225])\n", + " inp = std * inp + mean\n", + " inp = np.clip(inp, 0, 1)\n", + " plt.imshow(inp)\n", + " plt.title(predicted_label_batch[n].title(), fontsize=9)\n", + " plt.axis('off')\n", + "_ = plt.suptitle(\"ImageNet predictions\")\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "id": "eba7d039", + "metadata": {}, + "source": [ + "## 4. Transfer learning" + ] + }, + { + "cell_type": "markdown", + "id": "cc029ef3", + "metadata": {}, + "source": [ + "Replace the pretrained head of the network with a new layer based on the number of classes in our dataset. Train the model using the new dataset for the specified number of epochs." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "02f0eee5", + "metadata": {}, + "outputs": [], + "source": [ + "# Number of training epochs\n", + "num_epochs = 1\n", + "\n", + "# To reduce training time, the feature extractor layer can remain frozen (do_fine_tuning=False).\n", + "# Fine-tuning can be enabled to potentially get better accuracy. 
Note that enabling fine-tuning\n", + "# will increase training time.\n", + "do_fine_tuning = False" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "41c2ee68", + "metadata": {}, + "outputs": [], + "source": [ + "def main(model, criterion, optimizer, dataset, dataset_test, num_epochs=10):\n", + " since = time.time()\n", + " \n", + " device = torch.device(\"cpu\")\n", + " model = model.to(device)\n", + " best_acc = 0.0\n", + "\n", + " # Create data loaders for training and validation\n", + " data_loader = torch.utils.data.DataLoader(dataset, batch_size=batch_size,\n", + " shuffle=True, num_workers=4)\n", + " data_loader_test = torch.utils.data.DataLoader(dataset_test, batch_size=batch_size,\n", + " shuffle=False, num_workers=4)\n", + " \n", + " for epoch in range(num_epochs):\n", + " print(f'Epoch {epoch}/{num_epochs - 1}')\n", + " print('-' * 10)\n", + "\n", + " # Training phase\n", + " model.train()\n", + " running_loss = 0.0\n", + " running_corrects = 0\n", + "\n", + " # Iterate over data.\n", + " for inputs, labels in data_loader:\n", + " inputs = inputs.to(device)\n", + " labels = labels.to(device)\n", + "\n", + " # Zero the parameter gradients\n", + " optimizer.zero_grad()\n", + "\n", + " # Forward and backward pass\n", + " with torch.set_grad_enabled(True):\n", + " outputs = model(inputs)\n", + " _, preds = torch.max(outputs, 1)\n", + " loss = criterion(outputs, labels)\n", + " loss.backward()\n", + " optimizer.step()\n", + "\n", + " # Statistics\n", + " running_loss += loss.item() * inputs.size(0)\n", + " running_corrects += torch.sum(preds == labels.data)\n", + "\n", + " epoch_loss = running_loss / len(dataset)\n", + " epoch_acc = running_corrects.double() / len(dataset)\n", + "\n", + " print(f'Training Loss: {epoch_loss:.4f} Acc: {epoch_acc:.4f}')\n", + "\n", + " # Evaluation phase\n", + " model.eval()\n", + " running_loss = 0.0\n", + " running_corrects = 0\n", + " \n", + " # Iterate over data.\n", + " for inputs, labels in data_loader_test:\n", + " inputs = inputs.to(device)\n", + " labels = labels.to(device)\n", + "\n", + " # Forward pass only (no gradient updates during evaluation)\n", + " with torch.set_grad_enabled(False):\n", + " outputs = model(inputs)\n", + " _, preds = torch.max(outputs, 1)\n", + " loss = criterion(outputs, labels)\n", + " \n", + " # Statistics\n", + " running_loss += loss.item() * inputs.size(0)\n", + " running_corrects += torch.sum(preds == labels.data)\n", + " \n", + " epoch_loss = running_loss / len(dataset_test)\n", + " epoch_acc = running_corrects.double() / len(dataset_test)\n", + "\n", + " if epoch_acc > best_acc:\n", + " best_acc = epoch_acc\n", + " \n", + " print(f'Validation Loss: {epoch_loss:.4f} Acc: {epoch_acc:.4f}')\n", + " print()\n", + " \n", + "\n", + " time_elapsed = time.time() - since\n", + " print(f'Training complete in {time_elapsed // 60:.0f}m {time_elapsed % 60:.0f}s')\n", + " print(f'Best Validation Accuracy: {best_acc:.4f}')\n", + "\n", + " return model" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f8b754b4", + "metadata": {}, + "outputs": [], + "source": [ + "model = get_retrainable_model(model_name, len(class_names), do_fine_tuning)\n", + "criterion = torch.nn.CrossEntropyLoss()\n", + "\n", + "# Adam optimizer\n", + "optimizer = torch.optim.Adam(model.parameters(), lr=0.005)\n", + "\n", + "print('Trainable parameters: {}'.format(sum(p.numel() for p in model.parameters() if p.requires_grad)))" + ] + }, + { + "cell_type": "code", + "execution_count": 
null, + "id": "2a2c8e8b", + "metadata": {}, + "outputs": [], + "source": [ + "model, optimizer = ipex.optimize(model, optimizer=optimizer)\n", + "model = main(model, criterion, optimizer, dataset, dataset_test, num_epochs)" + ] + }, + { + "cell_type": "markdown", + "id": "f22b2493", + "metadata": {}, + "source": [ + "## 5. Visualize the model output" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "fc700939", + "metadata": {}, + "outputs": [], + "source": [ + "model.eval()\n", + "outputs = model(inputs)\n", + "_, predicted_id = torch.max(outputs, 1)\n", + "predicted_label_batch = [class_names[id] for id in predicted_id]\n", + "\n", + "# Display the results\n", + "plt.figure(figsize=(10,9))\n", + "plt.subplots_adjust(hspace=0.5)\n", + "for n in range(30):\n", + " plt.subplot(6,5,n+1)\n", + " inp = inputs[n]\n", + " inp = inp.numpy().transpose((1, 2, 0))\n", + " mean = np.array([0.485, 0.456, 0.406])\n", + " std = np.array([0.229, 0.224, 0.225])\n", + " inp = std * inp + mean\n", + " inp = np.clip(inp, 0, 1)\n", + " plt.imshow(inp)\n", + " correct_prediction = actual_label_batch[n] == predicted_label_batch[n]\n", + " color = \"darkgreen\" if correct_prediction else \"crimson\"\n", + " title = predicted_label_batch[n].title() if correct_prediction else \"{}\\n({})\".format(predicted_label_batch[n], actual_label_batch[n]) \n", + " plt.title(title, fontsize=9, color=color)\n", + " plt.axis('off')\n", + "_ = plt.suptitle(\"Model predictions\")\n", + "plt.show()\n", + "print(\"Correct predictions are shown in green\")\n", + "print(\"Incorrect predictions are shown in red with the actual label in parenthesis\")\n" + ] + }, + { + "cell_type": "markdown", + "id": "549d3602", + "metadata": {}, + "source": [ + "## 6. Export the saved model" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5a21d129", + "metadata": {}, + "outputs": [], + "source": [ + "if not os.path.exists(output_directory):\n", + " os.makedirs(output_directory)\n", + "file_path = \"{}/image_classification.pt\".format(output_directory)\n", + "torch.save(model.state_dict(), file_path)\n", + "print(\"Saved to {}\".format(file_path))" + ] + }, + { + "cell_type": "markdown", + "id": "edc0250c", + "metadata": {}, + "source": [ + "## Dataset citations\n", + "```\n", + "@inproceedings{bossard14,\n", + " title = {Food-101 -- Mining Discriminative Components with Random Forests},\n", + " author = {Bossard, Lukas and Guillaumin, Matthieu and Van Gool, Luc},\n", + " booktitle = {European Conference on Computer Vision},\n", + " year = {2014}\n", + "}\n", + "\n", + "@ONLINE {tfflowers,\n", + "author = \"The TensorFlow Team\",\n", + "title = \"Flowers\",\n", + "month = \"jan\",\n", + "year = \"2019\",\n", + "url = \"http://download.tensorflow.org/example_images/flower_photos.tgz\" }\n", + "```" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/image_classification/pytorch_image_classification/README.md b/notebooks/image_classification/pytorch_image_classification/README.md new file mode 100644 index 0000000000000000000000000000000000000000..5efc318364791afb4258788fa0c206d441ac1d8b --- /dev/null +++ 
b/notebooks/image_classification/pytorch_image_classification/README.md @@ -0,0 +1,37 @@ +# Transfer Learning for Image Classification using PyTorch + +This notebook uses image classification models from Torchvision that were originally trained +using ImageNet and does transfer learning with the Food101 dataset, a flowers dataset, or +a custom image dataset. + +The notebook performs the following steps: + +1. Import dependencies and setup parameters +2. Prepare the dataset +3. Predict using the original model +4. Transfer learning +5. Visualize the model output +6. Export the saved model + +## Running the notebook + +To run the notebook, follow the instructions to setup the [PyTorch notebook environment](/notebooks#pytorch-environment). + +## References + +Dataset citations: +``` +@inproceedings{bossard14, + title = {Food-101 -- Mining Discriminative Components with Random Forests}, + author = {Bossard, Lukas and Guillaumin, Matthieu and Van Gool, Luc}, + booktitle = {European Conference on Computer Vision}, + year = {2014} +} + +@ONLINE {tfflowers, +author = "The TensorFlow Team", +title = "Flowers", +month = "jan", +year = "2019", +url = "http://download.tensorflow.org/example_images/flower_photos.tgz" } +``` diff --git a/notebooks/image_classification/pytorch_image_classification/model_utils.py b/notebooks/image_classification/pytorch_image_classification/model_utils.py new file mode 100644 index 0000000000000000000000000000000000000000..ab981d5e759a6bc7def8d7ee3aa59cbac3296f62 --- /dev/null +++ b/notebooks/image_classification/pytorch_image_classification/model_utils.py @@ -0,0 +1,79 @@ +# +# -*- coding: utf-8 -*- +# +# Copyright (c) 2022 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+# + +import torch +import torchvision +from pydoc import locate + + +# Dictionary of Torchvision image classification models +torchvision_model_map = { + "resnet18": { + "classifier": "fc" + }, + "resnet50": { + "classifier": "fc" + }, + "efficientnet_b0": { + "classifier": ["classifier", 1] + }, + "efficientnet_b1": { + "classifier": ["classifier", 1] + }, + "efficientnet_b2": { + "classifier": ["classifier", 1] + }, + "densenet121": { + "classifier": "classifier" + }, + "densenet161": { + "classifier": "classifier" + }, + "googlenet": { + "classifier": "fc" + }, + "shufflenet_v2_x1_0": { + "classifier": "fc" + }, + "mobilenet_v2": { + "classifier": ["classifier", 1] + } +} + +def get_retrainable_model(model_name, num_classes, do_fine_tuning=False): + # Load an image classification model pretrained on ImageNet + pretrained_model_class = locate('torchvision.models.{}'.format(model_name)) + classifier_layer = torchvision_model_map[model_name]['classifier'] + + model = pretrained_model_class(pretrained=True) + + if not do_fine_tuning: + # Freeze the feature extractor so that only the new classifier layer is trained + for param in model.parameters(): + param.requires_grad = False + + # Replace the model's classification layer with a new Linear layer sized for our classes + if isinstance(classifier_layer, list): + classifier = getattr(model, classifier_layer[0])[classifier_layer[1]] + num_features = classifier.in_features + getattr(model, classifier_layer[0])[classifier_layer[1]] = torch.nn.Linear(num_features, num_classes) + else: + classifier = getattr(model, classifier_layer) + num_features = classifier.in_features + setattr(model, classifier_layer, torch.nn.Linear(num_features, num_classes)) + + return model + diff --git a/notebooks/image_classification/tf_image_classification/Image_Classification_Transfer_Learning.ipynb b/notebooks/image_classification/tf_image_classification/Image_Classification_Transfer_Learning.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..032513d4d9cb6aae7f16c4de53f1a9fa4fdfa888 --- /dev/null +++ b/notebooks/image_classification/tf_image_classification/Image_Classification_Transfer_Learning.ipynb @@ -0,0 +1,498 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Transfer Learning for Image Classification\n", + "\n", + "This notebook uses a classifier model that was originally trained using [ImageNet](https://image-net.org) and does transfer learning with either a TF dataset or your own raw images.\n", + "The notebook performs the following steps:\n", + "1. [Import dependencies and setup parameters](#1.-Import-dependencies-and-setup-parameters)\n", + "2. [Prepare the dataset](#2.-Prepare-the-dataset) using either a TF dataset or your own images\n", + "3. [Predict using the original model](#3.-Predict-using-the-original-model)\n", + "4. [Transfer Learning](#4.-Transfer-Learning)\n", + "5. [Evaluate the model](#5.-Evaluate-the-model)\n", + "6. [Export the saved model](#6.-Export-the-saved-model)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions in the [README.md](/notebooks/README.md) to setup a TensorFlow environment with all the dependencies required to run the notebook."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import tensorflow as tf\n", + "import tensorflow_hub as hub\n", + "import tensorflow_datasets as tfds\n", + "\n", + "import matplotlib.pyplot as plt\n", + "import numpy as np\n", + "import os\n", + "import pandas as pd\n", + "\n", + "from model_util import tfhub_model_map\n", + "from tlt.utils.file_utils import download_and_extract_tar_file\n", + "\n", + "print('Supported models:')\n", + "print('\\n'.join(tfhub_model_map.keys()))\n", + "\n", + "# Specify the parent directory for the custom or tf dataset\n", + "dataset_directory = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + " \n", + "# Specify a directory for output\n", + "output_directory = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "# Batch size\n", + "batch_size = 32\n", + "\n", + "print(\"\\nDataset directory:\", dataset_directory)\n", + "print(\"Output directory:\", output_directory)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Specify a model from the list above\n", + "model_name = \"efficientnet_b0\"\n", + "\n", + "if model_name not in tfhub_model_map.keys():\n", + " raise ValueError(\"The specified model_name ({}) is invalid. Please select from: {}\".\n", + " format(model_name, tfhub_model_map.keys()))\n", + " \n", + "# Get the info for the specified model from the map\n", + "model_map_values = tfhub_model_map[model_name]\n", + "model_handle = model_map_values[\"imagenet_model\"]\n", + "feature_vector_handle = model_map_values[\"feature_vector\"]\n", + "image_size = model_map_values[\"image_size\"]\n", + "print(\"Model:\", model_name)\n", + "print(\"Classifier model:\", model_handle)\n", + "print(\"Feature vector:\", feature_vector_handle)\n", + "print(\"Image size:\", image_size)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 2. Prepare the dataset" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Option A: Use your own image dataset" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "To use your own image dataset for transfer learning with the rest of this notebook, format your images as `.jpg` files and save them in folders named after the classes that you want the model to predict. To provide a working example using the correct layout, we will download and extract a flower species dataset. This is different from using the TF dataset called `tf_flowers`, although they are the same images, because the download contains raw image files rather than TFRecords, and we are not using the TF datasets API. After downloading and extracting, you will have the following subdirectories in your dataset directory. Each species subfolder will contain numerous `.jpg` files:\n", + "\n", + "```\n", + "dataset_directory\n", + "└── flower_photos\n", + " ├── daisy\n", + " ├── dandelion\n", + " ├── roses\n", + " ├── sunflowers\n", + " └── tulips\n", + "```\n", + "\n", + "Use this as an example to organize your own image files accordingly."
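, + "\n", + "\n", + "Before training, it can help to confirm how many images landed in each class folder. A minimal sketch using only the standard library (it assumes the flowers layout above):\n", + "\n", + "```python\n", + "import pathlib\n", + "\n", + "# Print the per-class image counts to check for empty or unbalanced classes\n", + "for class_dir in sorted(pathlib.Path(dataset_directory, \"flower_photos\").iterdir()):\n", + "    if class_dir.is_dir():\n", + "        print(class_dir.name, len(list(class_dir.glob(\"*.jpg\"))))\n", + "```"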
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# When you have your own properly organized subdirectory of images, adjust this variable\n", + "dataset_subdir = os.path.join(dataset_directory, \"flower_photos\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Only run this if you want to use the example flowers dataset\n", + "if not os.path.exists(dataset_subdir):\n", + " os.makedirs(dataset_subdir)\n", + " dataset_url = \"https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz\"\n", + " download_and_extract_tar_file(dataset_url, dataset_directory)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import pathlib\n", + "data_subdir_path = pathlib.Path(dataset_subdir)\n", + "image_count = len(list(data_subdir_path.glob('*/*.jpg')))\n", + "print('Images:', image_count)\n", + "print('Image Size:', image_size)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Create an image data generator and partition the data into train and test sets\n", + "img_gen = tf.keras.preprocessing.image.ImageDataGenerator(rescale=1./255, validation_split=0.25)\n", + "train_ds = img_gen.flow_from_directory(data_subdir_path, batch_size=batch_size, \n", + " target_size=(image_size, image_size),\n", + " class_mode='sparse', subset='training')\n", + "test_ds = img_gen.flow_from_directory(data_subdir_path, batch_size=batch_size, \n", + " target_size=(image_size, image_size),\n", + " class_mode='sparse', subset='validation')\n", + "\n", + "# Get class names for the dataset\n", + "class_names = list(train_ds.class_indices.keys())\n", + "print(\"Number of classes:\", len(class_names))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Skip to the next step [3. Predict using the original model](#3.-Predict-using-the-original-model) to continue using your own image dataset." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Option B: Use a TF dataset" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "To use a TF Dataset, specify the name of the dataset to load from the TF Datasets catalog, preprocess the images to convert them to float32, and resize the images. This example uses the [Food-101 dataset](https://www.tensorflow.org/datasets/catalog/food101) from the TensorFlow datasets catalog, but you can choose from a wide variety of [options](https://www.tensorflow.org/datasets/catalog/overview) (click on the \"Image classification\" section). If the dataset is not found in the dataset directory, it is downloaded. Subsequent runs will reuse the already downloaded dataset."
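, + "\n", + "\n", + "If you want to browse the catalog programmatically, `tfds.list_builders()` returns the names of all registered TFDS datasets (not just the image classification ones); a quick sketch:\n", + "\n", + "```python\n", + "import tensorflow_datasets as tfds\n", + "\n", + "# Print the first 20 registered dataset names, alphabetically\n", + "print(sorted(tfds.list_builders())[:20])\n", + "```"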
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Options include: \"food101\", \"cats_vs_dogs\", \"rock_paper_scissors\", and \"tf_flowers\"\n", + "tf_dataset = \"food101\"\n", + "\n", + "# Load the dataset using the TensorFlow datasets API\n", + "[train_ds, test_ds], info = tfds.load(tf_dataset,\n", + " data_dir=dataset_directory,\n", + " split=[\"train[:75%]\", \"train[75%:]\"],\n", + " as_supervised=True,\n", + " shuffle_files=True,\n", + " with_info=True)\n", + "\n", + "# Preprocess the images to convert them to float32 and resize the images to match our model\n", + "def preprocess_image(image, label):\n", + " image = tf.image.convert_image_dtype(image, tf.float32)\n", + " image = tf.image.resize_with_pad(image, image_size, image_size)\n", + " return (image, label)\n", + "\n", + "train_ds = train_ds.map(preprocess_image)\n", + "test_ds = test_ds.map(preprocess_image)\n", + "\n", + "print(\"Dataset directory: \", dataset_directory)\n", + "print(\"Training dataset size:\", len(train_ds))\n", + "print(\"Validation dataset size:\", len(test_ds))\n", + "\n", + "# Training data is shuffled for randomness\n", + "# https://www.tensorflow.org/datasets/keras_example#build_a_training_pipeline\n", + "train_ds = train_ds.cache()\n", + "train_ds = train_ds.shuffle(info.splits['train'].num_examples)\n", + "train_ds = train_ds.batch(batch_size)\n", + "train_ds = train_ds.prefetch(tf.data.AUTOTUNE)\n", + "\n", + "# Test data does not need to be shuffled, and caching is done after batching\n", + "# https://www.tensorflow.org/datasets/keras_example#build_an_evaluation_pipeline\n", + "test_ds = test_ds.batch(batch_size)\n", + "test_ds = test_ds.cache()\n", + "test_ds = test_ds.prefetch(tf.data.AUTOTUNE)\n", + "\n", + "# Get class names for the dataset\n", + "class_names = info.features[\"label\"].names\n", + "print(\"Number of classes:\", len(class_names))\n", + "print('After processing and batching: ', train_ds.element_spec)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 3. Predict using the original model\n", + "\n", + "Use the classifier model that was trained using ImageNet to do predictions with the dataset and view the results for a single batch."
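, + "\n", + "\n", + "Beyond the top-1 label, it can be useful to look at the runner-up guesses. After running the next cell, a small sketch like this would print the top-5 ImageNet classes for the first image in the batch (it reuses the `predicted_batch` and `imagenet_classes` variables defined below):\n", + "\n", + "```python\n", + "top5 = np.argsort(predicted_batch[0])[::-1][:5]  # indices of the 5 highest scores\n", + "for i in top5:\n", + "    print(imagenet_classes[i], predicted_batch[0][i])\n", + "```"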
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Get a batch of the dataset to use for testing\n", + "batch = next(iter(test_ds))\n", + "image_batch, label_batch = batch\n", + "\n", + "# List of the actual labels for this batch\n", + "actual_label_batch = [class_names[int(id)] for id in label_batch]\n", + "\n", + "# Download the ImageNet labels and load them into a list\n", + "labels_file = \"https://storage.googleapis.com/download.tensorflow.org/data/ImageNetLabels.txt\"\n", + "downloaded_file = tf.keras.utils.get_file(\"labels.txt\", origin=labels_file)\n", + "imagenet_classes = []\n", + "\n", + "with open(downloaded_file) as f:\n", + " imagenet_labels = f.readlines()\n", + " imagenet_classes = [l.strip() for l in imagenet_labels]\n", + "\n", + "# Predict using the TF Hub classifier that was trained using ImageNet\n", + "classifier = tf.keras.Sequential([\n", + " hub.KerasLayer(model_handle, input_shape=(image_size, image_size)+(3,))\n", + "])\n", + "predicted_batch = classifier.predict(image_batch)\n", + "predicted_id = np.argmax(predicted_batch, axis=-1)\n", + "predicted_label_batch = [imagenet_classes[id] for id in predicted_id]\n", + "\n", + "# Visualize the results\n", + "plt.figure(figsize=(16,16))\n", + "plt.subplots_adjust(hspace=0.5)\n", + "for n in range(min(batch_size, 30)):\n", + " plt.subplot(6,5,n+1)\n", + " plt.imshow(image_batch[n])\n", + " correct_prediction = actual_label_batch[n] == predicted_label_batch[n]\n", + " color = \"darkgreen\" if correct_prediction else \"crimson\"\n", + " title = predicted_label_batch[n].title() if correct_prediction else \"{}\\n({})\".format(predicted_label_batch[n], actual_label_batch[n]) \n", + " plt.title(title, fontsize=14, color=color)\n", + " plt.axis('off')\n", + "_ = plt.suptitle(\"ImageNet predictions\", fontsize=16)\n", + "plt.show()\n", + "\n", + "print(\"Correct predictions are shown in green\")\n", + "print(\"Incorrect predictions are shown in red with the actual label in parenthesis\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 4. Transfer Learning\n", + "\n", + "Get the feature vector from TF Hub and add on a dense layer based on the number of classes in our dataset. Train the model using the training dataset for the specified number of epochs." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Number of training epochs\n", + "training_epochs = 1\n", + "\n", + "# To reduce training time, the feature extractor layer can remain frozen (do_fine_tuning=False).\n", + "# Fine-tuning can be enabled to potentially get better accuracy. 
Note that enabling fine-tuning\n", + "# will increase training time.\n", + "do_fine_tuning = False\n", + "\n", + "# Optionally add a dropout layer (set to a float between 0 and 1, or None).\n", + "# If set to None, no dropout layer will be added.\n", + "dropout_layer_rate = None" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "feature_extractor_layer = hub.KerasLayer(feature_vector_handle,\n", + " input_shape=(image_size, image_size, 3),\n", + " trainable=do_fine_tuning)\n", + "\n", + "if dropout_layer_rate is None:\n", + " model = tf.keras.Sequential([\n", + " feature_extractor_layer,\n", + " tf.keras.layers.Dense(len(class_names))\n", + " ])\n", + "else:\n", + " model = tf.keras.Sequential([\n", + " feature_extractor_layer,\n", + " tf.keras.layers.Dropout(dropout_layer_rate),\n", + " tf.keras.layers.Dense(len(class_names))\n", + " ])\n", + "\n", + "model.summary()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "%%time\n", + "model.compile(\n", + " optimizer=tf.keras.optimizers.Adam(),\n", + " loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True),\n", + " metrics=['acc'])\n", + "\n", + "class CollectBatchStats(tf.keras.callbacks.Callback):\n", + " def __init__(self):\n", + " self.batch_losses = []\n", + " self.batch_acc = []\n", + "\n", + " def on_train_batch_end(self, batch, logs=None):\n", + " self.batch_losses.append(logs['loss'])\n", + " self.batch_acc.append(logs['acc'])\n", + " self.model.reset_metrics()\n", + "\n", + "batch_stats_callback = CollectBatchStats()\n", + "\n", + "history = model.fit(train_ds, epochs=training_epochs, shuffle=True, callbacks=[batch_stats_callback])" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 5. Evaluate the model\n", + "\n", + "After the training completes, evaluate the model's accuracy using the validation dataset." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "%%time\n", + "model.evaluate(test_ds, batch_size=batch_size)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Also, predict using the same sample batch that we used earlier with the ImageNet trained classifier to visualize the results after training the model."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Predict using the sample batch\n", + "predicted_batch = model.predict(image_batch)\n", + "predicted_id = np.argmax(predicted_batch, axis=-1)\n", + "predicted_label_batch = [class_names[id] for id in predicted_id]\n", + "\n", + "# Display the results\n", + "plt.figure(figsize=(16,16))\n", + "plt.subplots_adjust(hspace=0.5)\n", + "for n in range(min(batch_size, 30)):\n", + " plt.subplot(6,5,n+1)\n", + " plt.imshow(image_batch[n])\n", + " correct_prediction = actual_label_batch[n] == predicted_label_batch[n]\n", + " color = \"darkgreen\" if correct_prediction else \"crimson\"\n", + " title = predicted_label_batch[n].title() if correct_prediction else \"{}\\n({})\".format(predicted_label_batch[n], actual_label_batch[n]) \n", + " plt.title(title, fontsize=14, color=color)\n", + " plt.axis('off')\n", + "_ = plt.suptitle(\"Model predictions\", fontsize=16)\n", + "plt.show()\n", + "print(\"Correct predictions are shown in green\")\n", + "print(\"Incorrect predictions are shown in red with the actual label in parenthesis\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 6. Export the saved model" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "saved_model_dir = os.path.join(output_directory, \"{}_saved_model\".format(model_name))\n", + "model.save(saved_model_dir)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Dataset citations\n", + "```\n", + "@inproceedings{bossard14,\n", + " title = {Food-101 -- Mining Discriminative Components with Random Forests},\n", + " author = {Bossard, Lukas and Guillaumin, Matthieu and Van Gool, Luc},\n", + " booktitle = {European Conference on Computer Vision},\n", + " year = {2014}\n", + "}\n", + "\n", + "@ONLINE {tfflowers,\n", + "author = \"The TensorFlow Team\",\n", + "title = \"Flowers\",\n", + "month = \"jan\",\n", + "year = \"2019\",\n", + "url = \"http://download.tensorflow.org/example_images/flower_photos.tgz\" }\n", + "```" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3" + } + }, + "nbformat": 4, + "nbformat_minor": 4 +} diff --git a/notebooks/image_classification/tf_image_classification/README.md b/notebooks/image_classification/tf_image_classification/README.md new file mode 100644 index 0000000000000000000000000000000000000000..3803ad1316ed4aa500064f0d42fd135ac9be2b09 --- /dev/null +++ b/notebooks/image_classification/tf_image_classification/README.md @@ -0,0 +1,35 @@ +# Transfer Learning for Image Classification with TF Hub + +This notebook uses transfer learning with multiple [TF Hub](https://tfhub.dev) image classifiers, +[TF datasets](https://www.tensorflow.org/datasets/), and custom image datasets. + +The notebook performs the following steps: +1. Import dependencies and setup parameters +1. Prepare the dataset +1. Predict using the original model +1. Transfer Learning +1. Evaluate the model +1. Export the saved model + +## Running the notebook + +To run the notebook, follow the instructions to setup the [TensorFlow notebook environment](/notebooks/setup.md). 
+ +## References + +Dataset citations +``` +@inproceedings{bossard14, + title = {Food-101 -- Mining Discriminative Components with Random Forests}, + author = {Bossard, Lukas and Guillaumin, Matthieu and Van Gool, Luc}, + booktitle = {European Conference on Computer Vision}, + year = {2014} +} + +@ONLINE {tfflowers, +author = "The TensorFlow Team", +title = "Flowers", +month = "jan", +year = "2019", +url = "http://download.tensorflow.org/example_images/flower_photos.tgz" } +``` diff --git a/notebooks/image_classification/tf_image_classification/model_util.py b/notebooks/image_classification/tf_image_classification/model_util.py new file mode 100644 index 0000000000000000000000000000000000000000..9ef82a0061cd6446efbce338ad19f2705253c417 --- /dev/null +++ b/notebooks/image_classification/tf_image_classification/model_util.py @@ -0,0 +1,72 @@ +# +# -*- coding: utf-8 -*- +# +# Copyright (c) 2022 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# + +# Dictionary of TFHub models +tfhub_model_map = { + "resnet_v1_50": { + "imagenet_model": "https://tfhub.dev/google/imagenet/resnet_v1_50/classification/5", + "feature_vector": "https://tfhub.dev/google/imagenet/resnet_v1_50/feature_vector/5", + "image_size": 224 + }, + "resnet_v2_50": { + "imagenet_model": "https://tfhub.dev/google/imagenet/resnet_v2_50/classification/5", + "feature_vector": "https://tfhub.dev/google/imagenet/resnet_v2_50/feature_vector/5", + "image_size": 224 + }, + "resnet_v2_101": { + "imagenet_model": "https://tfhub.dev/google/imagenet/resnet_v2_101/classification/5", + "feature_vector": "https://tfhub.dev/google/imagenet/resnet_v2_101/feature_vector/5", + "image_size": 224 + }, + "mobilenet_v2_100_224": { + "imagenet_model": "https://tfhub.dev/google/imagenet/mobilenet_v2_100_224/classification/5", + "feature_vector": "https://tfhub.dev/google/imagenet/mobilenet_v2_100_224/feature_vector/4", + "image_size": 224 + }, + "efficientnetv2-s": { + "imagenet_model": "https://tfhub.dev/google/imagenet/efficientnet_v2_imagenet1k_s/classification/2", + "feature_vector": "https://tfhub.dev/google/imagenet/efficientnet_v2_imagenet1k_s/feature_vector/2", + "image_size": 384 + }, + "efficientnet_b0": { + "imagenet_model": "https://tfhub.dev/google/efficientnet/b0/classification/1", + "feature_vector": "https://tfhub.dev/google/efficientnet/b0/feature-vector/1", + "image_size": 224 + }, + "efficientnet_b1": { + "imagenet_model": "https://tfhub.dev/google/efficientnet/b1/classification/1", + "feature_vector": "https://tfhub.dev/google/efficientnet/b1/feature-vector/1", + "image_size": 240 + }, + "efficientnet_b2": { + "imagenet_model": "https://tfhub.dev/google/efficientnet/b2/classification/1", + "feature_vector": "https://tfhub.dev/google/efficientnet/b2/feature-vector/1", + "image_size": 260 + }, + "inception_v3": { + "imagenet_model": "https://tfhub.dev/google/imagenet/inception_v3/classification/5", + "feature_vector": "https://tfhub.dev/google/imagenet/inception_v3/feature_vector/5", + "image_size": 299 + }, + 
"nasnet_large": { + "imagenet_model": "https://tfhub.dev/google/imagenet/nasnet_large/classification/5", + "feature_vector": "https://tfhub.dev/google/imagenet/nasnet_large/feature_vector/5", + "image_size": 331 + } +} + diff --git a/notebooks/image_classification/tlt_api_pyt_image_classification/README.md b/notebooks/image_classification/tlt_api_pyt_image_classification/README.md new file mode 100644 index 0000000000000000000000000000000000000000..5b77288c399810e058fd8fe472bc621bcf076f5f --- /dev/null +++ b/notebooks/image_classification/tlt_api_pyt_image_classification/README.md @@ -0,0 +1,57 @@ +# Transfer Learning for PyTorch Image Classification using the Intel® Transfer Learning Tool API + +This notebook demonstrates how to use the Intel Transfer Learning Tool API to do transfer learning for +image classification using PyTorch. + +The notebook performs the following steps: +1. Import dependencies and setup parameters +1. Get the model +1. Get the dataset +1. Prepare the dataset +1. Predict using the original model +1. Transfer learning +1. Predict +1. Export + +## Running the notebook + +To run the notebook, follow the instructions to setup the [PyTorch notebook environment](/notebooks/setup.md). + +## References + +Dataset citations +``` +@ONLINE {tfflowers, +author = "The TensorFlow Team", +title = "Flowers", +month = "jan", +year = "2019", +url = "http://download.tensorflow.org/example_images/flower_photos.tgz" } + +@ONLINE {CIFAR10, +author = "Alex Krizhevsky", +title = "CIFAR-10", +year = "2009", +url = "http://www.cs.toronto.edu/~kriz/cifar.html" } + +@article{openimages, + title={OpenImages: A public dataset for large-scale multi-label and multi-class image classification.}, + author={Krasin, Ivan and Duerig, Tom and Alldrin, Neil and Veit, Andreas and Abu-El-Haija, Sami + and Belongie, Serge and Cai, David and Feng, Zheyun and Ferrari, Vittorio and Gomes, Victor + and Gupta, Abhinav and Narayanan, Dhyanesh and Sun, Chen and Chechik, Gal and Murphy, Kevin}, + journal={Dataset available from https://github.com/openimages}, + year={2016} +} +``` +Model citations +``` +@misc{yalniz2019billionscale, + title={Billion-scale semi-supervised learning for image classification}, + author={I. Zeki Yalniz and Hervé Jégou and Kan Chen and Manohar Paluri and Dhruv Mahajan}, + year={2019}, + eprint={1905.00546}, + archivePrefix={arXiv}, + primaryClass={cs.CV} +} +``` + diff --git a/notebooks/image_classification/tlt_api_pyt_image_classification/TLT_PyTorch_Image_Classification_Transfer_Learning.ipynb b/notebooks/image_classification/tlt_api_pyt_image_classification/TLT_PyTorch_Image_Classification_Transfer_Learning.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..8d43838e058c0477b904d561a2db0a6fcab0a0da --- /dev/null +++ b/notebooks/image_classification/tlt_api_pyt_image_classification/TLT_PyTorch_Image_Classification_Transfer_Learning.ipynb @@ -0,0 +1,670 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "3405d28d", + "metadata": {}, + "source": [ + "# Transfer Learning for Image Classification using PyTorch and the Intel® Transfer Learning Tool API\n", + "\n", + "This notebook uses the `tlt` library to do transfer learning for image classfication with a PyTorch pretrained model." + ] + }, + { + "cell_type": "markdown", + "id": "1d61b7ac", + "metadata": {}, + "source": [ + "## 1. 
Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions to setup a PyTorch environment with all the dependencies required to run the notebook." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a0bf9fd0", + "metadata": {}, + "outputs": [], + "source": [ + "import matplotlib.pyplot as plt\n", + "import numpy as np\n", + "import os\n", + "import pandas as pd\n", + "import PIL.Image as Image\n", + "import torch, torchvision\n", + "import requests\n", + "from io import BytesIO\n", + "\n", + "# tlt imports\n", + "from tlt.datasets import dataset_factory\n", + "from tlt.models import model_factory\n", + "from tlt.utils.file_utils import download_and_extract_tar_file, download_file\n", + "\n", + "# Specify a directory for the dataset to be downloaded\n", + "dataset_dir = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + " \n", + "# Specify a directory for output\n", + "output_dir = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "print(\"Dataset directory:\", dataset_dir)\n", + "print(\"Output directory:\", output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "8f1fc78c", + "metadata": {}, + "source": [ + "## 2. Get the model\n", + "\n", + "In this step, we call the model factory to list supported PyTorch image classification models. This is a list of pretrained models from [Torchvision](https://pytorch.org/vision/stable/models.html) and [PyTorch Hub](https://pytorch.org/hub/) that we tested with our API. Optionally, the `verbose=True` argument can be added to the `print_supported_models` function call to get more information about each model (such as the classification layer, image size, the original dataset, etc)." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ad4aeafd", + "metadata": {}, + "outputs": [], + "source": [ + "# See a list of available models\n", + "model_factory.print_supported_models(use_case='image_classification', framework='pytorch')" + ] + }, + { + "cell_type": "markdown", + "id": "aa1d9d53", + "metadata": {}, + "source": [ + "Next, use the model factory to get one of the models listed in the previous cell. The `get_model` function returns a model object that will later be used for training." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ee4e43c0", + "metadata": {}, + "outputs": [], + "source": [ + "model = model_factory.get_model(model_name='efficientnet_b0', framework='pytorch')\n", + "\n", + "print(\"Model name:\", model.model_name)\n", + "print(\"Framework:\", model.framework)\n", + "print(\"Use case:\", model.use_case)\n", + "print(\"Image size:\", model.image_size)" + ] + }, + { + "cell_type": "markdown", + "id": "dabd4183", + "metadata": {}, + "source": [ + "## 3. Get the dataset" + ] + }, + { + "cell_type": "markdown", + "id": "2d314ba0", + "metadata": {}, + "source": [ + "### Option A: Use your own dataset\n", + "\n", + "To use your own image dataset for transfer learning with the rest of this notebook, format your images as `.jpg` files and save them in folders named after the classes that you want the model to predict. To provide a working example using the correct layout, we will download a flower species dataset. After downloading and extracting, you will have the following subdirectories in your dataset directory. 
Each species subfolder will contain numerous `.jpg` files:\n", + "\n", + "```\n", + "flower_photos\n", + " ├── daisy\n", + " ├── dandelion\n", + " ├── roses\n", + " ├── sunflowers\n", + " └── tulips\n", + "```\n", + "\n", + "When using your own dataset, ensure that it is similarly organized with folders for each class. Change the `custom_dataset_path` variable to point to your dataset folder." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "6ab17b6b", + "metadata": { + "tags": [ + "remove_for_tv_dataset" + ] + }, + "outputs": [], + "source": [ + "# For demonstration purposes, we download a flowers dataset. To instead use your own dataset, set the\n", + "# custom_dataset_path to point to your dataset's directory and comment out the download_and_extract_tar_file line.\n", + "custom_dataset_path = os.path.join(dataset_dir, \"flower_photos\")\n", + "\n", + "if not os.path.exists(custom_dataset_path):\n", + " download_url = \"https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz\"\n", + " download_and_extract_tar_file(download_url, dataset_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "8cccbc99", + "metadata": {}, + "source": [ + "Call the dataset factory to load the dataset from the directory." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f6706c01", + "metadata": { + "tags": [ + "remove_for_tv_dataset" + ] + }, + "outputs": [], + "source": [ + "# Load the dataset from the custom dataset path\n", + "dataset = dataset_factory.load_dataset(dataset_dir=custom_dataset_path,\n", + " use_case='image_classification', \n", + " framework='pytorch')\n", + "\n", + "print(\"Class names:\", str(dataset.class_names))" + ] + }, + { + "cell_type": "markdown", + "id": "88897dc6", + "metadata": {}, + "source": [ + "Skip to the next step [4. Prepare the dataset](#4.-Prepare-the-dataset) to continue using the custom dataset." + ] + }, + { + "cell_type": "markdown", + "id": "c7e3cd9b", + "metadata": {}, + "source": [ + "### Option B: Use a dataset from PyTorch's Torchvision Datasets catalog\n", + "\n", + "To use a Torchvision dataset, specify the name of the dataset in the `get_dataset` function. This example uses the `CIFAR10` dataset from the [Torchvision datasets for image classification](https://pytorch.org/vision/stable/datasets.html#image-classification), but you can choose from a variety of options. If the dataset is not found in the dataset directory, it will be downloaded. Subsequent runs will reuse the already downloaded dataset.\n", + "\n", + "These Torchvision datasets are currently supported in the API:\n", + "* CIFAR10\n", + "* Country211\n", + "* DTD\n", + "* Food101\n", + "* FGVCAircraft\n", + "* RenderedSST2" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ba8bb0cb", + "metadata": { + "tags": [ + "remove_for_custom_dataset" + ] + }, + "outputs": [], + "source": [ + "dataset = dataset_factory.get_dataset(dataset_dir=dataset_dir,\n", + " use_case='image_classification', \n", + " framework='pytorch',\n", + " dataset_name='CIFAR10',\n", + " dataset_catalog='torchvision')\n", + "\n", + "print(dataset.info)\n", + "\n", + "print(\"Class names:\", str(dataset.class_names))" + ] + }, + { + "cell_type": "markdown", + "id": "99f23249", + "metadata": {}, + "source": [ + "## 4. Prepare the dataset\n", + "Once you have your dataset from Option A or Option B above, use the following cells to split and preprocess the data. 
We split the data into training and validation subsets, resize the images to match the selected model, and then batch the images.\n", + "Data augmentation can be applied by specifying the augmentations in the `add_aug` parameter. The following augmentations are supported:\n", + "1. hflip - RandomHorizontalFlip\n", + "2. rotate - RandomRotate" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "dd91fbcf", + "metadata": {}, + "outputs": [], + "source": [ + "# Split the dataset into training and validation subsets\n", + "dataset.shuffle_split(train_pct=.75, val_pct=.25)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e7c95a70", + "metadata": {}, + "outputs": [], + "source": [ + "# Preprocess the dataset with an image size that matches the model and a batch size of 32\n", + "batch_size = 32\n", + "dataset.preprocess(model.image_size, batch_size=batch_size, add_aug=['hflip','rotate'])" + ] + }, + { + "cell_type": "markdown", + "id": "3704772b", + "metadata": {}, + "source": [ + "## 5. Predict using the original model\n", + "\n", + "We get a single batch from our dataset, and use that to call predict on our model. Since we haven't done any training on the model yet, it will give us predictions using the original ImageNet trained model." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cd6782b0", + "metadata": {}, + "outputs": [], + "source": [ + "# Get a single batch from the dataset\n", + "images, labels = dataset.get_batch()\n", + "labels = [dataset.class_names[id] for id in labels]\n", + "\n", + "# Download the ImageNet labels and load them into a list\n", + "labels_file = \"https://storage.googleapis.com/download.tensorflow.org/data/ImageNetLabels.txt\"\n", + "labels_file_path = os.path.join(dataset_dir, os.path.basename(labels_file))\n", + "\n", + "if not os.path.exists(labels_file_path):\n", + " download_file(labels_file, dataset_dir)\n", + "\n", + "with open(labels_file_path) as f:\n", + " imagenet_labels = f.readlines()\n", + " imagenet_classes = [l.strip() for l in imagenet_labels]\n", + " \n", + "# Predict using the original model\n", + "predictions = model.predict(images)\n", + "predictions = [imagenet_classes[id] for id in predictions]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d37b808f", + "metadata": {}, + "outputs": [], + "source": [ + "# Display the images with the predicted ImageNet label\n", + "plt.figure(figsize=(18,14))\n", + "plt.subplots_adjust(hspace=0.5)\n", + "for n in range(min(batch_size, 30)):\n", + " plt.subplot(6,5,n+1)\n", + " inp = images[n]\n", + " inp = inp.numpy().transpose((1, 2, 0))\n", + " mean = np.array([0.485, 0.456, 0.406])\n", + " std = np.array([0.229, 0.224, 0.225])\n", + " inp = std * inp + mean\n", + " inp = np.clip(inp, 0, 1)\n", + " plt.imshow(inp)\n", + " correct_prediction = labels[n] == predictions[n]\n", + " color = \"darkgreen\" if correct_prediction else \"crimson\"\n", + " title = predictions[n].title() if correct_prediction else \"{}\\n({})\".format(predictions[n], labels[n]) \n", + " plt.title(title, fontsize=14, color=color)\n", + " plt.axis('off')\n", + "_ = plt.suptitle(\"ImageNet predictions\", fontsize=20)\n", + "plt.show()\n", + "\n", + "print(\"Correct predictions are shown in green\")\n", + "print(\"Incorrect predictions are shown in red with the actual label in parenthesis\")" + ] + }, + { + "cell_type": "markdown", + "id": "a49ec7b7", + "metadata": {}, + "source": [ + "## 6. 
Transfer Learning\n", + "\n", + "This step calls the model's train function with the dataset that was just prepared. The training function will get the base model and add on a dense layer based on the number of classes in the dataset. The model is then trained for the specified number of epochs. With the `do_eval` parameter set to `True` by default, this step will also show how the model can be evaluated. The model's evaluate function returns a list of metrics calculated from the dataset's validation subset." + ] + }, + { + "cell_type": "markdown", + "id": "ab510f51", + "metadata": {}, + "source": [ + "### Arguments\n", + "\n", + "#### Required\n", + "- **dataset** (ImageClassificationDataset, required): Dataset to use when training the model\n", + "- **output_dir** (str): Path to a writeable directory for checkpoint files\n", + "- **epochs** (int): Number of epochs to train the model (default: 1)\n", + "\n", + "#### Optional\n", + "- **initial_checkpoints** (str): Path to checkpoint weights to load. If the path provided is a directory, the latest checkpoint will be used.\n", + "- **early_stopping** (bool): Enable early stopping if convergence is reached while training at the end of each epoch. (default: False)\n", + "- **lr_decay** (bool): If lr_decay is True and do_eval is True, learning rate decay on the validation loss is applied at the end of each epoch.\n", + "- **extra_layers** (list[int]): Optionally insert additional dense layers between the base model and output layer. This can help increase accuracy when fine-tuning a pretrained model. The input should be a list of integers representing the number and size of the layers, for example [1024, 512] will insert two dense layers, the first with 1024 neurons and the second with 512 neurons.\n", + "\n", + "Note: refer to release documentation for an up-to-date list of train arguments and their current descriptions" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a2b601fc", + "metadata": {}, + "outputs": [], + "source": [ + "history = model.train(dataset, output_dir=output_dir, epochs=1)" + ] + }, + { + "cell_type": "markdown", + "id": "8582cfaf", + "metadata": {}, + "source": [ + "A complete model summary can be printed for all modules in case any need to be unfrozen:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0a5e279b", + "metadata": {}, + "outputs": [], + "source": [ + "model.list_layers(verbose=True) " + ] + }, + { + "cell_type": "markdown", + "id": "9530b21d", + "metadata": {}, + "source": [ + "Layers can be unfrozen by passing their string names, such as the following:" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "258662a6", + "metadata": {}, + "outputs": [], + "source": [ + "model.unfreeze_layer(\"features\") # Unfreezes the features layers\n", + "model.list_layers(verbose=True) " + ] + }, + { + "cell_type": "markdown", + "id": "707f17dd", + "metadata": {}, + "source": [ + "## 7. Predict\n", + "\n", + "Lastly, we predict using the same single batch that we used earlier with the ImageNet trained model to visualize the model's predictions after training." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a2bc447f", + "metadata": {}, + "outputs": [], + "source": [ + "# Predict with a single batch\n", + "predictions = model.predict(images)\n", + "\n", + "# Map the predicted ids to the class names\n", + "predictions = [dataset.class_names[id] for id in predictions]\n", + "\n", + "# Display the results\n", + "plt.figure(figsize=(16,16))\n", + "plt.subplots_adjust(hspace=0.5)\n", + "for n in range(min(batch_size, 30)):\n", + " plt.subplot(6,5,n+1)\n", + " inp = images[n]\n", + " inp = inp.numpy().transpose((1, 2, 0))\n", + " mean = np.array([0.485, 0.456, 0.406])\n", + " std = np.array([0.229, 0.224, 0.225])\n", + " inp = std * inp + mean\n", + " inp = np.clip(inp, 0, 1)\n", + " plt.imshow(inp)\n", + " correct_prediction = labels[n] == predictions[n]\n", + " color = \"darkgreen\" if correct_prediction else \"crimson\"\n", + " title = predictions[n].title() if correct_prediction else \"{}\\n({})\".format(predictions[n], labels[n]) \n", + " plt.title(title, fontsize=14, color=color)\n", + " plt.axis('off')\n", + "_ = plt.suptitle(\"Model predictions\", fontsize=16)\n", + "plt.show()\n", + "print(\"Correct predictions are shown in green\")\n", + "print(\"Incorrect predictions are shown in red with the actual label in parenthesis\")" + ] + }, + { + "cell_type": "markdown", + "id": "d5b03792", + "metadata": {}, + "source": [ + "### Custom Single Image Prediction" + ] + }, + { + "cell_type": "markdown", + "id": "6dc48f94", + "metadata": {}, + "source": [ + "We can also predict using a single image that wasn't part of our original dataset. We download a flower image from the [Open Images Dataset](https://storage.googleapis.com/openimages/web/index.html) and then resize it to match our model." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5afd283f", + "metadata": {}, + "outputs": [], + "source": [ + "# Download an image from the web and resize it to match our model\n", + "image_url = 'https://c8.staticflickr.com/8/7095/7210797228_c7fe51c3cb_z.jpg'\n", + "\n", + "image_shape = (model.image_size, model.image_size)\n", + "daisy = Image.open(BytesIO(requests.get(image_url).content)).resize(image_shape)\n", + "daisy" + ] + }, + { + "cell_type": "markdown", + "id": "7b7a0227", + "metadata": {}, + "source": [ + "Then, we call predict by passing the np array for our image and add a dimension to our array to represent the batch." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "22146e35", + "metadata": {}, + "outputs": [], + "source": [ + "# Get the image as a np array and scale and normalize it \n", + "daisy = np.array(daisy)/255.0\n", + "daisy = (daisy - np.array([0.485, 0.456, 0.406])) / np.array([0.229, 0.224, 0.225])\n", + "\n", + "# Arrange the channels with a batch dimension first (np.newaxis) and RGB channels second (np.moveaxis)\n", + "daisy = torch.Tensor(np.moveaxis(daisy, -1, 0))[np.newaxis, ...]\n", + "\n", + "# Predict and print the class name\n", + "result = model.predict(daisy)\n", + "print(dataset.class_names[result[0]])" + ] + }, + { + "cell_type": "markdown", + "id": "26130983", + "metadata": {}, + "source": [ + "## 8. Export\n", + "\n", + "Lastly, we can call the model `export` function to generate a `saved_model.pb`. Each time the model is exported, a new numbered directory is created, which allows serving to pick up the latest model. 
" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "391afe2b", + "metadata": {}, + "outputs": [], + "source": [ + "saved_model_dir = model.export(output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "40f5dc3e", + "metadata": {}, + "source": [ + "## 9. Post-training quantization\n", + "\n", + "In this section, the `tlt` API uses [Intel® Neural Compressor (INC)](https://github.com/intel/neural-compressor) to benchmark and quantize the model to get optimal inference performance.\n", + "\n", + "We use the Intel Neural Compressor to benchmark the full precision model to see how it performs, as our baseline.\n", + "\n", + "> Note that there is a known issue when running Intel Neural Compressor from a notebook that you may sometimes see the error \n", + "> `zmq.error.ZMQError: Address already in use`. If you see this error, rerun the cell again." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a8318885", + "metadata": {}, + "outputs": [], + "source": [ + "results = model.benchmark(dataset=dataset)" + ] + }, + { + "cell_type": "markdown", + "id": "7997cc13", + "metadata": {}, + "source": [ + "Next we use Intel Neural Compressor to automatically search for the optimal quantization recipe for low-precision model inference within the accuracy loss constrains defined in the config. Running post training quantization may take several minutes, depending on your hardware and the exit policy (timeout and max trials).\n", + "\n", + "You can customize a config by passing these parameters to `get_inc_config()`:\n", + " * **approach** (str): The quantization approach (we recommend 'static' for image models and 'dynamic' for text models) \n", + " * **accuracy_criterion_relative** (float): Relative accuracy loss (default: 0.01, which is 1%)\n", + " * **exit_policy_timeout** (int): Tuning timeout in seconds (default: 0). Tuning processing finishes when the\n", + " timeout or max_trials is reached. A tuning timeout of 0 means that the tuning phase stops when the accuracy\n", + " criterion is met.\n", + "* **exit_policy_max_trials** (int): Maximum number of tuning trials (default: 50). Tuning processing finishes when\n", + " the timeout or or max_trials is reached." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ce143e0f", + "metadata": {}, + "outputs": [], + "source": [ + "from tlt.utils.inc_utils import get_inc_config\n", + "\n", + "config = get_inc_config(approach='static',\n", + " accuracy_criterion_relative=0.01,\n", + " exit_policy_timeout=0,\n", + " exit_policy_max_trials=10)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8ee3e1d7", + "metadata": {}, + "outputs": [], + "source": [ + "inc_output_dir = os.path.join(output_dir, 'quantized_models', model.model_name,\n", + " os.path.basename(saved_model_dir))\n", + "model.quantize(inc_output_dir, dataset=dataset, config=config)" + ] + }, + { + "cell_type": "markdown", + "id": "abb5d272", + "metadata": {}, + "source": [ + "Let's benchmark using the quantized model, so that we can compare the performance to the full precision model that was originally benchmarked." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7a900100", + "metadata": {}, + "outputs": [], + "source": [ + "quantized_results = model.benchmark(dataset=dataset, saved_model_dir=inc_output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "0947915a", + "metadata": {}, + "source": [ + "## Dataset Citations\n", + "\n", + "```\n", + "@ONLINE {tfflowers,\n", + "author = \"The TensorFlow Team\",\n", + "title = \"Flowers\",\n", + "month = \"jan\",\n", + "year = \"2019\",\n", + "url = \"http://download.tensorflow.org/example_images/flower_photos.tgz\" }\n", + "\n", + "@ONLINE {CIFAR10,\n", + "author = \"Alex Krizhevsky\",\n", + "title = \"CIFAR-10\",\n", + "year = \"2009\",\n", + "url = \"http://www.cs.toronto.edu/~kriz/cifar.html\" }\n", + "\n", + "@article{openimages,\n", + " title={OpenImages: A public dataset for large-scale multi-label and multi-class image classification.},\n", + " author={Krasin, Ivan and Duerig, Tom and Alldrin, Neil and Veit, Andreas and Abu-El-Haija, Sami\n", + " and Belongie, Serge and Cai, David and Feng, Zheyun and Ferrari, Vittorio and Gomes, Victor\n", + " and Gupta, Abhinav and Narayanan, Dhyanesh and Sun, Chen and Chechik, Gal and Murphy, Kevin},\n", + " journal={Dataset available from https://github.com/openimages},\n", + " year={2016}\n", + "}\n", + "```" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.10" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/image_classification/tlt_api_tf_image_classification/README.md b/notebooks/image_classification/tlt_api_tf_image_classification/README.md new file mode 100644 index 0000000000000000000000000000000000000000..441fd3153362194c7866b59c2aaffff8229a23ad --- /dev/null +++ b/notebooks/image_classification/tlt_api_tf_image_classification/README.md @@ -0,0 +1,51 @@ +# Transfer Learning for TensorFlow Image Classification using the Intel® Transfer Learning Tool API + +These notebooks demonstrate how to use the Intel Transfer Learning Tool API to do transfer learning for +image classification using TensorFlow and then quantize or optimize the graph for inference. + +`TLT_TF_Image_Classification_Transfer_Learning.ipynb` performs the following steps: +1. Import dependencies and setup parameters +1. Get the model +1. Get the dataset +1. Prepare the dataset +1. Predict using the original model +1. Transfer learning +1. Predict +1. Export +1. Post-training quantization + +`TLT_TF_Transfer_Learning_and_Graph_Optimization.ipynb` performs the following steps: +1. Import dependencies and setup parameters +1. Get the model +1. Get the dataset +1. Prepare the dataset +1. Evaluate using the original model +1. Transfer learning +1. Export +1. Graph Optimization + +## Running the notebooks + +To run the notebooks, follow the instructions to set up the [TensorFlow notebook environment](/notebooks/setup.md). 
+ +## References + +Dataset citations +``` +@ONLINE {tfflowers, +author = "The TensorFlow Team", +title = "Flowers", +month = "jan", +year = "2019", +url = "http://download.tensorflow.org/example_images/flower_photos.tgz" } + +@article{openimages, + title={OpenImages: A public dataset for large-scale multi-label and multi-class image classification.}, + author={Krasin, Ivan and Duerig, Tom and Alldrin, Neil and Veit, Andreas and Abu-El-Haija, Sami + and Belongie, Serge and Cai, David and Feng, Zheyun and Ferrari, Vittorio and Gomes, Victor + and Gupta, Abhinav and Narayanan, Dhyanesh and Sun, Chen and Chechik, Gal and Murphy, Kevin}, + journal={Dataset available from https://github.com/openimages}, + year={2016} +} +``` + diff --git a/notebooks/image_classification/tlt_api_tf_image_classification/TLT_TF_Image_Classification_Transfer_Learning.ipynb b/notebooks/image_classification/tlt_api_tf_image_classification/TLT_TF_Image_Classification_Transfer_Learning.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..c41a92d8e94cc6f17e718cf087bed41500021b35 --- /dev/null +++ b/notebooks/image_classification/tlt_api_tf_image_classification/TLT_TF_Image_Classification_Transfer_Learning.ipynb @@ -0,0 +1,597 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "41a52dc9", + "metadata": {}, + "source": [ + "# Transfer Learning for Image Classification using TensorFlow and the Intel® Transfer Learning Tool API\n", + "\n", + "This notebook uses the `tlt` library to do transfer learning for image classification with a TensorFlow pretrained model." + ] + }, + { + "cell_type": "markdown", + "id": "d1432fd2", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions to set up a TensorFlow environment with all the dependencies required to run the notebook." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "b996490f", + "metadata": {}, + "outputs": [], + "source": [ + "import matplotlib.pyplot as plt\n", + "import numpy as np\n", + "import os\n", + "import pandas as pd\n", + "import PIL.Image as Image\n", + "import tensorflow as tf\n", + "\n", + "# tlt imports\n", + "from tlt.datasets import dataset_factory\n", + "from tlt.models import model_factory\n", + "from tlt.utils.file_utils import download_file, download_and_extract_tar_file\n", + "\n", + "# Specify a directory for the dataset to be downloaded\n", + "dataset_dir = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + "\n", + "# Specify a directory for output\n", + "output_dir = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "print(\"Dataset directory:\", dataset_dir)\n", + "print(\"Output directory:\", output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "b18c4a5e", + "metadata": {}, + "source": [ + "## 2. Get the model\n", + "\n", + "In this step, we call the Intel Transfer Learning Tool model factory to list supported TensorFlow image classification models. This is a list of pretrained models from [TFHub](https://tfhub.dev) and [Keras Applications](https://keras.io/api/applications/) that we tested with our API. Optionally, the `verbose=True` argument can be added to the `print_supported_models` function call to get more information about each model (such as the image size, the original dataset, the preprocessor, etc).\n",
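+ "\n", + "For example, the `verbose` flag described above can be used like this (the exact details printed may vary by release):\n", + "\n", + "```python\n", + "# List supported models along with details such as image size, original dataset, and preprocessor\n", + "model_factory.print_supported_models(use_case='image_classification', framework='tensorflow',\n", + "                                     verbose=True)\n", + "```"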
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "11a2d427", + "metadata": {}, + "outputs": [], + "source": [ + "# See a list of available models\n", + "model_factory.print_supported_models(use_case='image_classification', framework='tensorflow')" + ] + }, + { + "cell_type": "markdown", + "id": "384e7c0d", + "metadata": {}, + "source": [ + "Next, use the model factory to get one of the models listed in the previous cell. The `get_model` function returns a model object that will later be used for training." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "44d6f386", + "metadata": {}, + "outputs": [], + "source": [ + "model = model_factory.get_model(model_name='resnet_v1_50', framework='tensorflow')\n", + "\n", + "print(\"Model name:\", model.model_name)\n", + "print(\"Framework:\", model.framework)\n", + "print(\"Use case:\", model.use_case)\n", + "print(\"Image size:\", model.image_size)" + ] + }, + { + "cell_type": "markdown", + "id": "e180d1fe", + "metadata": {}, + "source": [ + "## 3. Get the dataset\n", + "\n", + "We call the dataset factory to get a sample image classification dataset. For demonstration purposes, we are using the [tf_flowers](https://www.tensorflow.org/datasets/catalog/tf_flowers) dataset from the [TensorFlow Datasets catalog](https://www.tensorflow.org/datasets). This dataset contains images of flowers in 5 different classes." + ] + }, + { + "cell_type": "markdown", + "id": "681d42e8", + "metadata": {}, + "source": [ + "### Option A: Use your own dataset\n", + "\n", + "To use your own image dataset for transfer learning with the rest of this notebook, format your images as `.jpg` files and save them in folders named after the classes that you want the model to predict. To provide a working example using the correct layout, we will download a flower species dataset. After downloading and extracting, you will have the following subdirectories in your dataset directory. Each species subfolder will contain numerous `.jpg` files:\n", + "\n", + "```\n", + "flower_photos\n", + " └── daisy\n", + " └── dandelion\n", + " └── roses\n", + " └── sunflowers\n", + " └── tulips\n", + "```\n", + "\n", + "When using your own dataset, ensure that it is similarly organized with folders for each class. Change the `custom_dataset_path` variable to point to your dataset folder." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "01973de8", + "metadata": { + "tags": [ + "remove_for_tf_dataset" + ] + }, + "outputs": [], + "source": [ + "# For demonstration purposes, we download a flowers dataset. To instead use your own dataset, set the\n", + "# custom_dataset_path to point to your dataset's directory and comment out the download_and_extract_tar_file line.\n", + "custom_dataset_path = os.path.join(dataset_dir, \"flower_photos\")\n", + "\n", + "if not os.path.exists(custom_dataset_path):\n", + " download_url = \"https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz\"\n", + " download_and_extract_tar_file(download_url, dataset_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "b20dc2db", + "metadata": {}, + "source": [ + "Call the dataset factory to load the dataset from the directory." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ce99cbb3", + "metadata": { + "tags": [ + "remove_for_tf_dataset" + ] + }, + "outputs": [], + "source": [ + "# Load the dataset from the custom dataset path\n", + "dataset = dataset_factory.load_dataset(dataset_dir=custom_dataset_path,\n", + " use_case='image_classification', \n", + " framework='tensorflow')\n", + "\n", + "print(\"Class names:\", str(dataset.class_names))" + ] + }, + { + "cell_type": "markdown", + "id": "34be95ae", + "metadata": {}, + "source": [ + "Skip to the next step [4. Prepare the dataset](#4.-Prepare-the-dataset) to continue using the custom dataset." + ] + }, + { + "cell_type": "markdown", + "id": "2c68f367", + "metadata": {}, + "source": [ + "### Option B: Use a dataset from the TensorFlow Datasets catalog" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "b6b4cc26", + "metadata": { + "tags": [ + "remove_for_custom_dataset" + ] + }, + "outputs": [], + "source": [ + "dataset = dataset_factory.get_dataset(dataset_dir=dataset_dir,\n", + " use_case='image_classification', \n", + " framework='tensorflow',\n", + " dataset_name='tf_flowers',\n", + " dataset_catalog='tf_datasets')\n", + "\n", + "print(dataset.info)\n", + "\n", + "print(\"\\nClass names:\", str(dataset.class_names))" + ] + }, + { + "cell_type": "markdown", + "id": "c3ec8cfe", + "metadata": {}, + "source": [ + "## 4. Prepare the dataset\n", + "\n", + "Once you have your dataset from Option A or Option B above, use the following cells to split and preprocess the data. We split the data into training and validation subsets, resize the images to match the selected model, and then batch the images. Data augmentation can be applied by specifying the desired augmentations in the __add_aug__ parameter. Supported augmentations are:\n", + "1. hvflip - RandomHorizontalandVerticalFlip\n", + "2. hflip - RandomHorizontalFlip\n", + "3. vflip - RandomVerticalFlip\n", + "4. rotate - RandomRotate\n", + "5. zoom - RandomZoom" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4282456e", + "metadata": {}, + "outputs": [], + "source": [ + "# Split the dataset into training and validation subsets\n", + "dataset.shuffle_split(train_pct=.75, val_pct=.25)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c9789ded", + "metadata": {}, + "outputs": [], + "source": [ + "# Preprocess the dataset with an image size and preprocessor that match the model and a batch size of 32\n", + "batch_size = 32\n", + "dataset.preprocess(model.image_size, batch_size=batch_size, preprocessor=model.preprocessor)" + ] + }, + { + "cell_type": "markdown", + "id": "a5ff5539", + "metadata": {}, + "source": [ + "## 5. Predict using the original model\n", + "\n", + "We get a single batch from our dataset, and use that to call predict on our model. Since we haven't done any training on the model yet, it will give us predictions using the original ImageNet-trained model."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "a620aec8", + "metadata": {}, + "outputs": [], + "source": [ + "# Get a single batch from the dataset\n", + "images, labels = dataset.get_batch()\n", + "labels = [dataset.class_names[id] for id in labels]\n", + "\n", + "# Download the ImageNet labels and load them into a list\n", + "labels_file = \"https://storage.googleapis.com/download.tensorflow.org/data/ImageNetLabels.txt\"\n", + "downloaded_file = tf.keras.utils.get_file(\"labels.txt\", origin=labels_file)\n", + "imagenet_classes = []\n", + "\n", + "with open(downloaded_file) as f:\n", + " imagenet_labels = f.readlines()\n", + " imagenet_classes = [l.strip() for l in imagenet_labels]\n", + "\n", + "# Predict using the original model\n", + "predictions = model.predict(images)\n", + "predictions = [imagenet_classes[id] for id in predictions]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ad8f845e", + "metadata": {}, + "outputs": [], + "source": [ + "# Display the images with the predicted ImageNet label\n", + "plt.figure(figsize=(18,14))\n", + "plt.subplots_adjust(hspace=0.5)\n", + "\n", + "for n in range(min(batch_size, 30)):\n", + " plt.subplot(6,5,n+1)\n", + " norm_images = (images[n]-np.min(images[n]))/(np.max(images[n])-np.min(images[n]))\n", + " plt.imshow(norm_images, vmin=np.min(norm_images), vmax=np.max(norm_images))\n", + " correct_prediction = labels[n] == predictions[n]\n", + " color = \"darkgreen\" if correct_prediction else \"crimson\"\n", + " title = predictions[n] if correct_prediction else \"{}\\n({})\".format(predictions[n], labels[n]) \n", + " plt.title(title, fontsize=14, color=color)\n", + " plt.axis('off')\n", + "_ = plt.suptitle(\"ImageNet predictions\", fontsize=20)\n", + "plt.show()\n", + "\n", + "print(\"Correct predictions are shown in green\")\n", + "print(\"Incorrect predictions are shown in red with the actual label in parentheses\")" + ] + }, + { + "cell_type": "markdown", + "id": "d875f7ea", + "metadata": {}, + "source": [ + "## 6. Transfer Learning\n", + "\n", + "This step calls the model's train function with the dataset that was just prepared. The training function will get the base model and add on a dense layer based on the number of classes in the dataset. The model is then compiled and trained based on the number of epochs specified in the argument. With the do_eval parameter set to True by default, this step will also show how the model can be evaluated and will return a list of metrics calculated from the dataset's validation subset." + ] + }, + { + "cell_type": "markdown", + "id": "213faef5", + "metadata": {}, + "source": [ + "### Arguments\n", + "\n", + "#### Required\n", + "- **dataset** (ImageClassificationDataset, required): Dataset to use when training the model\n", + "- **output_dir** (str): Path to a writeable directory for checkpoint files\n", + "- **epochs** (int): Number of epochs to train the model (default: 1)\n", + "\n", + "#### Optional\n", + "- **initial_checkpoints** (str): Path to checkpoint weights to load. If the path provided is a directory, the latest checkpoint will be used.\n", + "- **early_stopping** (bool): Enable early stopping if convergence is reached while training at the end of each epoch. (default: False)\n", + "- **lr_decay** (bool): If lr_decay is True and do_eval is True, learning rate decay on the validation loss is applied at the end of each epoch.\n", + "- **enable_auto_mixed_precision** (bool or None): Enable auto mixed precision for training. 
Mixed precision uses both 16-bit and 32-bit floating point types to make training run faster and use less memory. It is recommended to enable auto mixed precision training when running on platforms that support bfloat16 (Intel third or fourth generation Xeon processors). If it is enabled on a platform that does not support bfloat16, it can be detrimental to the training performance. If enable_auto_mixed_precision is set to None, auto mixed precision will be automatically enabled when running with Intel fourth generation Xeon processors, and disabled for other platforms.\n", + "- **extra_layers** (list[int]): Optionally insert additional dense layers between the base model and output layer. This can help increase accuracy when fine-tuning. The input should be a list of integers representing the number and size of the layers, for example [1024, 512] will insert two dense layers, the first with 1024 neurons and the second with 512 neurons.\n", + "\n", + "Note: refer to release documentation for an up-to-date list of train arguments and their current descriptions." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "76041187", + "metadata": {}, + "outputs": [], + "source": [ + "enable_auto_mixed_precision = None\n", + "\n", + "# Train using the pretrained model with the new dataset\n", + "history = model.train(dataset, output_dir=output_dir, epochs=1,\n", + " enable_auto_mixed_precision=enable_auto_mixed_precision)" + ] + }, + { + "cell_type": "markdown", + "id": "d1c7e3af", + "metadata": {}, + "source": [ + "## 7. Predict\n", + "\n", + "Let's predict using the same single batch that we used earlier with the ImageNet trained model to visualize the model's predictions after training." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "721253eb", + "metadata": {}, + "outputs": [], + "source": [ + "# Predict with a single batch\n", + "predictions = model.predict(images)\n", + "\n", + "# Map the predicted ids to the class names\n", + "predictions = [dataset.class_names[id] for id in predictions]\n", + "\n", + "# Display the results\n", + "plt.figure(figsize=(18,14))\n", + "plt.subplots_adjust(hspace=0.5)\n", + "\n", + "for n in range(min(batch_size, 30)):\n", + " plt.subplot(6,5,n+1)\n", + " norm_images = (images[n]-np.min(images[n]))/(np.max(images[n])-np.min(images[n]))\n", + " plt.imshow(norm_images, vmin=np.min(norm_images), vmax=np.max(norm_images))\n", + " correct_prediction = labels[n] == predictions[n]\n", + " color = \"darkgreen\" if correct_prediction else \"crimson\"\n", + " title = predictions[n] if correct_prediction else \"{}\\n({})\".format(predictions[n], labels[n]) \n", + " plt.title(title, fontsize=14, color=color)\n", + " plt.axis('off')\n", + "_ = plt.suptitle(\"Model predictions\", fontsize=16)\n", + "plt.show()\n", + "\n", + "print(\"Correct predictions are shown in green\")\n", + "print(\"Incorrect predictions are shown in red with the actual label in parentheses\")" + ] + }, + { + "cell_type": "markdown", + "id": "54df401b", + "metadata": {}, + "source": [ + "### Custom Single Image Prediction" + ] + }, + { + "cell_type": "markdown", + "id": "ff61b5ca", + "metadata": {}, + "source": [ + "We can also predict using a single image that wasn't part of our original dataset. We download a flower image from the [Open Images Dataset](https://storage.googleapis.com/openimages/web/index.html) and then resize it to match our model."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "14595bbc", + "metadata": {}, + "outputs": [], + "source": [ + "# Download an image from the web and resize it to match our model\n", + "image_url = \"https://c8.staticflickr.com/8/7095/7210797228_c7fe51c3cb_z.jpg\"\n", + "daisy = download_file(image_url, output_dir)\n", + "\n", + "image_shape = (model.image_size, model.image_size)\n", + "daisy = Image.open(daisy).resize(image_shape)\n", + "daisy" + ] + }, + { + "cell_type": "markdown", + "id": "a300e55c", + "metadata": {}, + "source": [ + "Then, we call predict by passing the NumPy array for our image, adding a dimension to the array to represent the batch." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cfaa39dd", + "metadata": {}, + "outputs": [], + "source": [ + "# Get the image as a np array and call predict while adding a batch dimension (with np.newaxis) \n", + "daisy = np.array(daisy)/255.0\n", + "result = model.predict(daisy[np.newaxis, ...])\n", + "\n", + "# Print the predicted class name\n", + "print(dataset.class_names[result[0]])" + ] + }, + { + "cell_type": "markdown", + "id": "9d4830f0", + "metadata": {}, + "source": [ + "## 8. Export\n", + "\n", + "Next, we can call the model `export` function to generate a `saved_model.pb`. The model is saved in a format that is ready to use with [TensorFlow Serving](https://github.com/tensorflow/serving). Each time the model is exported, a new numbered directory is created, which allows serving to pick up the latest model. " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "aafcd747", + "metadata": {}, + "outputs": [], + "source": [ + "saved_model_dir = model.export(output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "f66f4b1d", + "metadata": {}, + "source": [ + "## 9. Post-training quantization\n", + "\n", + "In this section, the `tlt` API uses [Intel® Neural Compressor (INC)](https://github.com/intel/neural-compressor) to benchmark and quantize the model to get optimal inference performance." + ] + }, + { + "cell_type": "markdown", + "id": "f0edeffe", + "metadata": {}, + "source": [ + "We use the Intel Neural Compressor config to benchmark the full precision model to see how it performs, as our baseline.\n", + "\n", + "> Note that there is a known issue when running Intel Neural Compressor from a notebook that you may sometimes see the error \n", + "> `zmq.error.ZMQError: Address already in use`. If you see this error, rerun the cell.\n", + "\n", + "> Likewise, if the benchmark function returns an empty dictionary `{}`, run the cell again." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "3ee783f7", + "metadata": {}, + "outputs": [], + "source": [ + "model.benchmark(dataset=dataset)" + ] + }, + { + "cell_type": "markdown", + "id": "4761363e", + "metadata": {}, + "source": [ + "Next, we use Intel Neural Compressor to automatically search for the optimal quantization recipe for low-precision model inference within the accuracy loss constraints defined in the config. Running post-training quantization may take several minutes, depending on your hardware and the exit policy (timeout and max trials).\n",
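+ "\n", + "The next cell lets Intel Neural Compressor auto-generate its configuration. If you want more control over the accuracy criterion or exit policy, a sketch of one alternative, assuming the `get_inc_config()` helper from `tlt.utils.inc_utils` accepts the same arguments here as in the PyTorch version of these notebooks, and that `quantize` accepts a `config` argument:\n", + "\n", + "```python\n", + "from tlt.utils.inc_utils import get_inc_config\n", + "\n", + "# 'static' quantization is generally recommended for image models\n", + "config = get_inc_config(approach='static',\n", + "                        accuracy_criterion_relative=0.01,  # allow up to 1% relative accuracy loss\n", + "                        exit_policy_timeout=0,             # stop when the accuracy criterion is met\n", + "                        exit_policy_max_trials=10)         # or after at most 10 tuning trials\n", + "model.quantize(inc_output_dir, dataset=dataset, config=config)\n", + "```"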
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "902200ca", + "metadata": {}, + "outputs": [], + "source": [ + "inc_output_dir = os.path.join(output_dir, 'quantized_models', model.model_name,\n", + " os.path.basename(saved_model_dir))\n", + "model.quantize(inc_output_dir, dataset=dataset)" + ] + }, + { + "cell_type": "markdown", + "id": "0a298a32", + "metadata": {}, + "source": [ + "Let's benchmark using the quantized model, so that we can compare the performance to the full precision model that was originally benchmarked." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ec65e1ee", + "metadata": {}, + "outputs": [], + "source": [ + "model.benchmark(dataset=dataset, saved_model_dir=inc_output_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "18a6c74f", + "metadata": {}, + "source": [ + "## Dataset Citations\n", + "\n", + "```\n", + "@ONLINE {tfflowers,\n", + "author = \"The TensorFlow Team\",\n", + "title = \"Flowers\",\n", + "month = \"jan\",\n", + "year = \"2019\",\n", + "url = \"http://download.tensorflow.org/example_images/flower_photos.tgz\" }\n", + "\n", + "@article{openimages,\n", + " title={OpenImages: A public dataset for large-scale multi-label and multi-class image classification.},\n", + " author={Krasin, Ivan and Duerig, Tom and Alldrin, Neil and Veit, Andreas and Abu-El-Haija, Sami\n", + " and Belongie, Serge and Cai, David and Feng, Zheyun and Ferrari, Vittorio and Gomes, Victor\n", + " and Gupta, Abhinav and Narayanan, Dhyanesh and Sun, Chen and Chechik, Gal and Murphy, Kevin},\n", + " journal={Dataset available from https://github.com/openimages},\n", + " year={2016}\n", + "}\n", + "```" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.16" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/image_classification/tlt_api_tf_image_classification/TLT_TF_Transfer_Learning_and_Graph_Optimization.ipynb b/notebooks/image_classification/tlt_api_tf_image_classification/TLT_TF_Transfer_Learning_and_Graph_Optimization.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..4f4a86181d3a0fad832eb5b1100803241179b2a3 --- /dev/null +++ b/notebooks/image_classification/tlt_api_tf_image_classification/TLT_TF_Transfer_Learning_and_Graph_Optimization.ipynb @@ -0,0 +1,411 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "id": "ffc0d761", + "metadata": {}, + "source": [ + "# Transfer Learning and Graph Optimization using TensorFlow and the Intel® Transfer Learning Tool API\n", + "\n", + "This notebook uses the `tlt` library to do transfer learning and graph optimization for image classification with a TensorFlow pretrained model." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "b266ca11", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions in the [notebooks README.md](/notebooks/README.md) to set up a TensorFlow environment with all the dependencies required to run the notebook."
+ ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "1b31cc75", + "metadata": {}, + "outputs": [], + "source": [ + "import matplotlib.pyplot as plt\n", + "import numpy as np\n", + "import os\n", + "import pandas as pd\n", + "import PIL.Image as Image\n", + "import tensorflow as tf\n", + "\n", + "# tlt imports\n", + "from tlt.datasets import dataset_factory\n", + "from tlt.models import model_factory\n", + "from tlt.utils.file_utils import download_and_extract_tar_file\n", + "\n", + "# Specify a directory for the dataset to be downloaded\n", + "dataset_dir = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + " \n", + "# Specify a directory for output\n", + "output_dir = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "print(\"Dataset directory:\", dataset_dir)\n", + "print(\"Output directory:\", output_dir)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "e49dafe3", + "metadata": {}, + "source": [ + "## 2. Get the model\n", + "\n", + "In this step, we call the Intel Transfer Learning Tool model factory to list supported TensorFlow image classification models. This is a list of pretrained models from [TFHub](https://tfhub.dev) and [Keras Applications](https://keras.io/api/applications/) that we tested with our API. Optionally, the `verbose=True` argument can be added to the `print_supported_models` function call to get more information about each model (such as the image size, the original dataset, the preprocessor, etc)." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ad49dc51", + "metadata": {}, + "outputs": [], + "source": [ + "# See a list of available models\n", + "model_factory.print_supported_models(use_case='image_classification', framework='tensorflow')" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "764c7063", + "metadata": {}, + "source": [ + "Next, use the model factory to get one of the models listed in the previous cell. The `get_model` function returns a model object that will later be used for training." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f101e379", + "metadata": {}, + "outputs": [], + "source": [ + "model = model_factory.get_model(model_name='resnet_v1_50', framework='tensorflow')\n", + "\n", + "print(\"Model name:\", model.model_name)\n", + "print(\"Framework:\", model.framework)\n", + "print(\"Use case:\", model.use_case)\n", + "print(\"Image size:\", model.image_size)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "3351fbbc", + "metadata": {}, + "source": [ + "## 3. Get the dataset\n", + "\n", + "We call the dataset factory to load a sample image classification dataset. For demonstration purposes, we will download a flower species dataset. After downloading and extracting, you will have the following subdirectories in your dataset directory. Each species subfolder will contain numerous `.jpg` files:\n", + "\n", + "```\n", + "flower_photos\n", + " └── daisy\n", + " └── dandelion\n", + " └── roses\n", + " └── sunflowers\n", + " └── tulips\n", + "```\n", + "\n", + "When using your own dataset, ensure that it is similarly organized with folders for each class. Change the `custom_dataset_path` variable to point to your dataset folder."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8741e47e", + "metadata": {}, + "outputs": [], + "source": [ + "# For demonstration purposes, we download a flowers dataset. To instead use your own dataset, set the\n", + "# custom_dataset_path to point to your dataset's directory and comment out the download_and_extract_tar_file line.\n", + "custom_dataset_path = os.path.join(dataset_dir, \"flower_photos\")\n", + "\n", + "if not os.path.exists(custom_dataset_path):\n", + " download_url = \"https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz\"\n", + " download_and_extract_tar_file(download_url, dataset_dir)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "0ddf65ed", + "metadata": {}, + "source": [ + "Call the dataset factory to load the dataset from the directory." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "94ebc8e1", + "metadata": {}, + "outputs": [], + "source": [ + "# Load the dataset from the custom dataset path\n", + "dataset = dataset_factory.load_dataset(dataset_dir=custom_dataset_path,\n", + " use_case='image_classification', \n", + " framework='tensorflow')\n", + "\n", + "print(\"Class names:\", str(dataset.class_names))" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "372a5bd2", + "metadata": {}, + "source": [ + "## 4. Prepare the dataset\n", + "\n", + "Once you have your dataset, use the following cells to split and preprocess the data. We split the data into training and validation subsets, resize the images to match the selected model, and then batch the images." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4b4dc950", + "metadata": {}, + "outputs": [], + "source": [ + "# Split the dataset into training and validation subsets\n", + "dataset.shuffle_split(train_pct=.75, val_pct=.25)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "33c883c2", + "metadata": {}, + "outputs": [], + "source": [ + "# Preprocess the dataset with an image size and preprocessor that match the model and a batch size of 32\n", + "batch_size = 32\n", + "dataset.preprocess(model.image_size, batch_size=batch_size, preprocessor=model.preprocessor)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "05acac53", + "metadata": {}, + "source": [ + "## 5. Evaluate the model before training\n", + "\n", + "Since we haven't done any training on the model yet, it will evaluate using the original ImageNet-trained model, and accuracy on the new classes will be near zero." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "12ab6b31", + "metadata": {}, + "outputs": [], + "source": [ + "model.evaluate(dataset)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "7208e757", + "metadata": {}, + "source": [ + "## 6. Transfer Learning\n", + "\n", + "This step calls the model's train function with the dataset that was just prepared. The training function will get the base model and add on a dense layer based on the number of classes in the dataset. The model is then compiled and trained based on the number of epochs specified in the argument. With the do_eval parameter set to True by default, this step will also show how the model can be evaluated and will return a list of metrics calculated from the dataset's validation subset."
+ ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "039db26f", + "metadata": {}, + "source": [ + "### Arguments\n", + "\n", + "#### Required\n", + "- **dataset** (ImageClassificationDataset, required): Dataset to use when training the model\n", + "- **output_dir** (str): Path to a writeable directory for checkpoint files\n", + "- **epochs** (int): Number of epochs to train the model (default: 1)\n", + "\n", + "#### Optional\n", + "- **initial_checkpoints** (str): Path to checkpoint weights to load. If the path provided is a directory, the latest checkpoint will be used.\n", + "- **early_stopping** (bool): Enable early stopping if convergence is reached while training at the end of each epoch. (default: False)\n", + "- **lr_decay** (bool): If lr_decay is True and do_eval is True, learning rate decay on the validation loss is applied at the end of each epoch.\n", + "- **enable_auto_mixed_precision** (bool or None): Enable auto mixed precision for training. Mixed precision uses both 16-bit and 32-bit floating point types to make training run faster and use less memory. It is recommended to enable auto mixed precision training when running on platforms that support bfloat16 (Intel third or fourth generation Xeon processors). If it is enabled on a platform that does not support bfloat16, it can be detrimental to the training performance. If enable_auto_mixed_precision is set to None, auto mixed precision will be automatically enabled when running with Intel fourth generation Xeon processors, and disabled for other platforms.\n", + "- **extra_layers** (list[int]): Optionally insert additional dense layers between the base model and output layer. This can help increase accuracy when fine-tuning a TFHub model. The input should be a list of integers representing the number and size of the layers, for example [1024, 512] will insert two dense layers, the first with 1024 neurons and the second with 512 neurons.\n", + "\n", + "Note: refer to release documentation for an up-to-date list of train arguments and their current descriptions." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e7d51156", + "metadata": {}, + "outputs": [], + "source": [ + "enable_auto_mixed_precision = None\n", + "\n", + "# Train using the pretrained model from TF Hub with the new dataset\n", + "history = model.train(dataset, output_dir=output_dir, epochs=1,\n", + " enable_auto_mixed_precision=enable_auto_mixed_precision)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "81f75fa0", + "metadata": {}, + "source": [ + "This time, the accuracy looks much better." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "007cc8fe", + "metadata": {}, + "source": [ + "## 7. Export\n", + "\n", + "Next, we can call the model `export` function to generate a `saved_model.pb`. The model is saved in a format that is ready to use with [TensorFlow Serving](https://github.com/tensorflow/serving). Each time the model is exported, a new numbered directory is created, which allows serving to pick up the latest model. " + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "eed84d55", + "metadata": {}, + "outputs": [], + "source": [ + "saved_model_dir = model.export(output_dir)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "b3e1df1f", + "metadata": {}, + "source": [ + "## 8. 
Graph Optimization\n", + "\n", + "The `tlt` API uses [Intel® Neural Compressor (INC)](https://github.com/intel/neural-compressor) to optimize the FP32 graph for improved inference performance. Graph optimization performs the following:\n", + "* Converting variables to constants\n", + "* Removing training-only operations like checkpoint saving\n", + "* Stripping out parts of the graph that are never reached\n", + "* Removing debug operations like CheckNumerics\n", + "* Folding batch normalization ops into the pre-calculated weights\n", + "* Fusing common operations into unified versions\n", + "\n", + "For benchmarking, we will use an auto-generated config. If you want more control over the configuration, you can create your own config using the Intel Neural Compressor or the `tlt.utils.inc_utils.get_inc_config()` method." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "e27391d9", + "metadata": {}, + "source": [ + "We use the Intel Neural Compressor config to benchmark the full non-optimized model to see how it performs, as our baseline.\n", + "\n", + "> Note that there is a known issue when running Intel Neural Compressor from a notebook that you may sometimes see the error \n", + "> `zmq.error.ZMQError: Address already in use`. If you see this error, rerun the cell." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e4dbc03f", + "metadata": {}, + "outputs": [], + "source": [ + "result = model.benchmark(dataset)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "64210d77", + "metadata": {}, + "source": [ + "Next, we do the FP32 graph optimization." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0531bf13", + "metadata": {}, + "outputs": [], + "source": [ + "# Create an output directory for optimization output with the same base name as our saved model directory\n", + "optimization_output_dir = os.path.join(output_dir, 'optimized_models', model.model_name,\n", + " os.path.basename(saved_model_dir))\n", + "\n", + "model.optimize_graph(optimization_output_dir, overwrite_model=True)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "77775e97", + "metadata": {}, + "outputs": [], + "source": [ + "optimized_result = model.benchmark(dataset, saved_model_dir=optimization_output_dir)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "210fb6ff", + "metadata": {}, + "source": [ + "## Dataset Citations\n", + "\n", + "```\n", + "@ONLINE {tfflowers,\n", + "author = \"The TensorFlow Team\",\n", + "title = \"Flowers\",\n", + "month = \"jan\",\n", + "year = \"2019\",\n", + "url = \"http://download.tensorflow.org/example_images/flower_photos.tgz\" }\n", + "```" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.10" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/performance/hf_text_classification_performance.ipynb b/notebooks/performance/hf_text_classification_performance.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..3caea7d2b8bd5174e0646ca4559b4ef68b2a3aad --- /dev/null +++ b/notebooks/performance/hf_text_classification_performance.ipynb @@ -0,0 +1,809 @@ +{ + "cells": [ + { + "cell_type": 
"markdown", + "id": "57b029cd", + "metadata": {}, + "source": [ + "# Performance Comparison: Text Classification Transfer Learning with Hugging Face* and the Intel® Transfer Learning Tool\n", + "\n", + "This notebook uses the Hugging Face Trainer to do transfer learning with a text classification model with PyTorch*. The model is trained, evaluated, and exported. The same sequence is also done using the Intel Transfer Learning Tool. The Intel Transfer Learning Tool has a flag to control whether the Hugging Face Trainer is used under the hood, or if just PyTorch libraries are used. Training and evaluation are run both ways, giving us three combinations to compare:\n", + "* Using the Hugging Face Trainer\n", + "* Using the Intel Transfer Learning Tool with the Hugging Face Trainer\n", + "* Using the Intel Transfer Learning Tool with torch\n", + "\n", + "After all of the models have been trained and evaluated, charts are displayed to visually compare the training and evaluation metrics." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "30be8bb1", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "import psutil\n", + "\n", + "os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2'\n", + "os.environ['TOKENIZERS_PARALLELISM'] = 'false'\n", + "\n", + "import datasets\n", + "import matplotlib.pyplot as plt\n", + "import matplotlib.ticker as mtick\n", + "import numpy as np\n", + "import pandas as pd\n", + "import torch\n", + "import transformers\n", + "from transformers import DataCollatorWithPadding, Trainer\n", + "from torch.utils.data import DataLoader as loader\n", + "\n", + "from tlt.datasets import dataset_factory\n", + "from tlt.models import model_factory\n", + "from tlt.utils.platform_util import CPUInfo, OptimizedPlatformUtil, PlatformUtil\n", + "\n", + "# Specify the the default dataset directory\n", + "dataset_directory = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + "\n", + "# Specify a directory for output (saved models and checkpoints)\n", + "output_directory = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "# Location where Hugging Face will locally store data\n", + "os.environ['HF_HOME'] = dataset_directory\n", + "\n", + "datasets.utils.logging.set_verbosity(datasets.logging.ERROR)\n", + "\n", + "# Data Frame styles\n", + "table_styles =[{\n", + " 'selector': 'caption',\n", + " 'props': [\n", + " ('text-align', 'center'),\n", + " ('color', 'black'),\n", + " ('font-size', '16px')\n", + " ]\n", + "}]\n", + "\n", + "# Colors used in charts\n", + "blue = '#0071c5'\n", + "dark_blue = '#003c71'\n", + "yellow = '#ffcc4d'" + ] + }, + { + "cell_type": "markdown", + "id": "f2730530", + "metadata": {}, + "source": [ + "## 1. 
Display Platform Information" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e63bb467", + "metadata": {}, + "outputs": [], + "source": [ + "# Get and display CPU/platform information\n", + "cpu_info = CPUInfo()\n", + "platform_util = PlatformUtil()\n", + "print(\"{0} CPU Information {0}\".format(\"=\" * 20))\n", + "print(\"CPU family:\", platform_util.cpu_family)\n", + "print(\"CPU model:\", platform_util.cpu_model)\n", + "print(\"CPU type:\", platform_util.cpu_type)\n", + "print(\"Physical cores per socket:\", cpu_info.cores_per_socket)\n", + "print(\"Total physical cores:\", cpu_info.cores)\n", + "cpufreq = psutil.cpu_freq()\n", + "print(\"Max Frequency (MHz):\", cpufreq.max)\n", + "print(\"Min Frequency (MHz):\", cpufreq.min)\n", + "cpu_socket_count = cpu_info.sockets\n", + "print(\"Number of sockets:\", cpu_socket_count)\n", + "\n", + "print(\"\\n{0} Memory Information {0}\".format(\"=\" * 20))\n", + "svmem = psutil.virtual_memory()\n", + "print(\"Total: \", int(svmem.total / (1024 ** 3)), \"GB\")\n", + "\n", + "# Display Hugging Face version information\n", + "print(\"\\n{0} Hugging Face Information {0}\".format(\"=\" * 20))\n", + "print(\"Hugging Face Transformers version:\", transformers.__version__)\n", + "print(\"Hugging Face Datasets version:\", datasets.__version__)\n", + "\n", + "# Display PyTorch version information\n", + "print(\"\\n{0} PyTorch Information {0}\".format(\"=\" * 20))\n", + "print(\"PyTorch version:\", torch.__version__)" + ] + }, + { + "cell_type": "markdown", + "id": "e0b7f5fb", + "metadata": {}, + "source": [ + "## 2. Select a model and define parameters to use during training and evaluation\n", + "\n", + "### Select a model\n", + "\n", + "See the list of supported PyTorch text classification models from Hugging Face in the Intel Transfer Learning Tool." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "069e58da", + "metadata": {}, + "outputs": [], + "source": [ + "framework = 'pytorch'\n", + "use_case = 'text_classification'\n", + "model_hub = 'huggingface'\n", + "supported_models = model_factory.get_supported_models(framework, use_case)\n", + "supported_models = supported_models[use_case]\n", + "\n", + "# Filter to only get relevant models\n", + "supported_models = { key:value for (key,value) in supported_models.items() if value[framework]['model_hub'] == model_hub}\n", + "\n", + "print(\"Supported {} models for {} from {}\".format(framework, use_case, model_hub))\n", + "print(\"=\" * 70)\n", + "for model_name in supported_models.keys():\n", + " print(model_name)" + ] + }, + { + "cell_type": "markdown", + "id": "8fc116a5", + "metadata": {}, + "source": [ + "Set the `model_name` to the model that will be used during this experiment." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bda109e9", + "metadata": {}, + "outputs": [], + "source": [ + "# Select a model\n", + "model_name = \"bert-base-cased\"" + ] + }, + { + "cell_type": "markdown", + "id": "bd568624", + "metadata": {}, + "source": [ + "### Select a dataset\n", + "\n", + "For these experiments, we will be using text classification datasets from the [Hugging Face Datasets catalog](https://huggingface.co/datasets?task_categories=task_categories:text-classification&sort=downloads). Specify the name of the dataset to use with the `dataset_name` variable in the next cell."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "6aa35cf0", + "metadata": {}, + "outputs": [], + "source": [ + "dataset_name = 'imdb'" + ] + }, + { + "cell_type": "markdown", + "id": "409141c0", + "metadata": {}, + "source": [ + "### Define parameters\n", + "\n", + "For consistency between the model training experiments using Hugging Face and the Intel Transfer Learning Tool, the next cell defines parameters that will be used by both methods." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9588f07d", + "metadata": {}, + "outputs": [], + "source": [ + "# Number of training epochs\n", + "training_epochs = 2\n", + "\n", + "# Shuffle the files after each training epoch\n", + "shuffle_files = True\n", + "\n", + "# Define the name of the split to use for validation (e.g. 'validation' or 'test')\n", + "eval_split=None\n", + "# If eval_split=None, split the 'train' dataset\n", + "validation_split = 0.05\n", + "training_split = 0.1\n", + "\n", + "# Set seed for consistency between runs (or None)\n", + "seed = 10\n", + "\n", + "# List of batch size(s) to compare (maximum of 4 batch sizes to try)\n", + "batch_size_list = [ 16, 32 ]\n", + "\n", + "learning_rate=3e-5\n", + "\n", + "# Text preprocessing\n", + "max_sequence_length = 128\n", + "padding = 'max_length'\n", + "truncation = True\n", + "\n", + "# Use the Intel Extension for PyTorch\n", + "use_ipex = True" + ] + }, + { + "cell_type": "markdown", + "id": "c508355f", + "metadata": {}, + "source": [ + "Validate parameter values and then print out the parameters." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ec3ec8be", + "metadata": {}, + "outputs": [], + "source": [ + "if not isinstance(training_epochs, int):\n", + " raise TypeError(\"The training_epochs parameter should be an integer, but found a {}\".format(type(training_epochs)))\n", + "\n", + "if training_epochs < 1:\n", + " raise ValueError(\"The training_epochs parameter should not be less than 1.\")\n", + " \n", + "if not isinstance(shuffle_files, bool):\n", + " raise TypeError(\"The shuffle_files parameter should be a bool, but found a {}\".format(type(shuffle_files)))\n", + "\n", + "if not eval_split:\n", + " if not isinstance(validation_split, float):\n", + " raise TypeError(\"The validation_split parameter should be a float, but found a {}\".format(type(validation_split)))\n", + "\n", + " if not isinstance(training_split, float):\n", + " raise TypeError(\"The training_split parameter should be a float, but found a {}\".format(type(training_split)))\n", + "\n", + "if validation_split + training_split > 1:\n", + " raise ValueError(\"The sum of validation_split and training_split should not be greater than 1.\")\n", + "\n", + "if seed and not isinstance(seed, int):\n", + " raise TypeError(\"The seed parameter should be an integer or None, but found a {}\".format(type(seed)))\n", + "\n", + "if len(batch_size_list) > 4 or len(batch_size_list) == 0:\n", + " raise ValueError(\"The batch_size_list should have at most 4 values, but found {} values ({})\".format(\n", + " len(batch_size_list), batch_size_list))\n", + " \n", + "print(\"Number of training epochs:\", training_epochs)\n", + "print(\"Shuffle files:\", shuffle_files)\n", + "print(\"Training split:\", \"'train' split\" if eval_split else \"{}%\".format(training_split*100))\n", + "print(\"Validation split:\", \"'{}' split\".format(eval_split) if eval_split else \"{}%\".format(validation_split*100))\n", + "print(\"Seed:\", str(seed))\n", + "print(\"Batch size list:\", batch_size_list)" + ] + }, + { + 
"cell_type": "markdown", + "id": "d102b97b", + "metadata": {}, + "source": [ + "## 3. Train and evaluate the models\n", + "\n", + "In this section, we will compare the time that it takes to fine tune the text classification model using the dataset that was selected in the previous section.\n", + "\n", + "The fine tuning will be done in two different ways:\n", + "* Using the Hugging Face python libraries\n", + "* Using the Intel Transfer Learning Tool\n", + "\n", + "### Fine tuning using the Hugging Face libraries\n", + "\n", + "First, we download and prepare the dataset." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ad0b244c", + "metadata": {}, + "outputs": [], + "source": [ + "transformers.set_seed(seed)\n", + "\n", + "# Determine the splits to load\n", + "split = ['train']\n", + "if eval_split:\n", + " split.append(eval_split)\n", + "\n", + "# Load the dataset from the Hugging Face dataset catalog\n", + "hf_dataset = datasets.load_dataset(dataset_name, cache_dir=dataset_directory, split=split)\n", + "\n", + "# Load the tokenizer based on our selected model\n", + "hf_tokenizer = transformers.AutoTokenizer.from_pretrained(model_name, cache_dir=output_directory)\n", + "\n", + "text_column_names = [col_name for col_name in hf_dataset[0].column_names if col_name != 'label' and\n", + " all(isinstance(s, str) for s in hf_dataset[0][col_name])]\n", + "\n", + "# Tokenize the dataset\n", + "def tokenize_function(examples):\n", + " args = (examples[text_column_name] for text_column_name in text_column_names)\n", + " return hf_tokenizer(*args, padding=padding, max_length=max_sequence_length, truncation=truncation)\n", + "\n", + "tokenized_hf_dataset = [d.map(tokenize_function, batched=True) for d in hf_dataset]\n", + "for tokenized in tokenized_hf_dataset:\n", + " tokenized.set_format('torch')\n", + "\n", + "# If eval_split is defined, that split will be used for validation. 
Otherwise, the 'train' dataset split will be\n", + "# split by the defined percentage to use for training and evaluation.\n", + "hf_train_dataset = tokenized_hf_dataset[0]\n", + "if eval_split:\n", + " print(\"Using 'train' and '{}' dataset splits\".format(eval_split))\n", + " hf_train_subset = hf_train_dataset\n", + " hf_eval_subset = tokenized_hf_dataset[1]\n", + "else:\n", + " dataset_length = len(hf_train_dataset)\n", + " train_size = int(training_split * dataset_length)\n", + " eval_size = int(validation_split * dataset_length)\n", + " generator = torch.Generator().manual_seed(seed) \n", + " dataset_indices = torch.randperm(dataset_length, generator=generator).tolist() if shuffle_files else range(dataset_length)\n", + " train_indices = dataset_indices[:train_size]\n", + " eval_indices = dataset_indices[train_size:train_size + eval_size]\n", + " print(\"Using {}% for training and {}% for validation\".format(training_split * 100, validation_split * 100))\n", + " print(\"Total dataset size:\", dataset_length)\n", + " print(\"Train size:\", train_size)\n", + " print(\"Eval size:\", eval_size)\n", + " hf_train_subset = hf_train_dataset.select(train_indices)\n", + " hf_eval_subset = hf_train_dataset.select(eval_indices)\n", + "\n", + "# Get the number of classes from the train dataset features (either called 'label' or 'labels')\n", + "class_names = hf_dataset[0].features['label'].names if 'label' in hf_dataset[0].features else \\\n", + " hf_dataset[0].features['labels'].names\n", + "print(\"Class names: {}\".format(class_names))\n", + "\n", + "hf_train_dataset_length = len(hf_train_subset)\n", + "hf_eval_dataset_length = len(hf_eval_subset)\n", + "\n", + "# Define function to compute accuracy to pass to the Hugging Face Trainer\n", + "def compute_metrics(p: transformers.EvalPrediction):\n", + " preds = p.predictions[0] if isinstance(p.predictions, tuple) else p.predictions\n", + " preds = np.argmax(preds, axis=1)\n", + " return {\"accuracy\": (preds == p.label_ids).astype(np.float32).mean().item()}" + ] + }, + { + "cell_type": "markdown", + "id": "75bc822a", + "metadata": {}, + "source": [ + "Next, we iterate through our list of batch sizes to train the model for each configuration with the dataset that was prepared in the previous cell. After training is complete, the model is evaluated and exported. The training and evaluation metrics are saved to lists." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9b3037a8", + "metadata": {}, + "outputs": [], + "source": [ + "hf_saved_model_paths = []\n", + "hf_training_metrics = []\n", + "hf_eval_results = []\n", + "\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " print('-' * 40)\n", + " print('Training using batch size: {}'.format(batch_size))\n", + " print('-' * 40)\n", + " \n", + " # Get the model from pretrained\n", + " model = transformers.AutoModelForSequenceClassification.from_pretrained(model_name, num_labels=len(class_names))\n", + "\n", + " # Setup a directory to save the model output\n", + " saved_model_dir = os.path.join(output_directory, model_name, 'HF_model_bs{}'.format(batch_size))\n", + " \n", + " # Note: Even when setting do_eval=False, an error gets thrown if an eval_dataset is not provided\n", + " training_args = transformers.TrainingArguments(\n", + " output_dir=saved_model_dir,\n", + " do_eval=False,\n", + " do_train=True,\n", + " learning_rate=learning_rate,\n", + " per_device_train_batch_size=batch_size,\n", + " per_device_eval_batch_size=batch_size,\n", + " num_train_epochs=training_epochs,\n", + " evaluation_strategy=\"epoch\",\n", + " push_to_hub=False,\n", + " no_cuda=True,\n", + " overwrite_output_dir=True,\n", + " seed=seed,\n", + " data_seed=seed,\n", + " use_ipex=use_ipex\n", + " )\n", + "\n", + " trainer = Trainer(\n", + " model=model,\n", + " args=training_args,\n", + " train_dataset=hf_train_subset,\n", + " eval_dataset=hf_eval_subset,\n", + " compute_metrics=compute_metrics,\n", + " tokenizer=hf_tokenizer,\n", + " )\n", + "\n", + " # Train the model\n", + " history = trainer.train()\n", + " \n", + " # Evaluate the model\n", + " eval_results = trainer.evaluate()\n", + " \n", + " # Export the trained model\n", + " trainer.save_model(saved_model_dir)\n", + " \n", + " # Save objects and metrics\n", + " hf_training_metrics.append(history)\n", + " hf_eval_results.append(eval_results)\n", + " hf_saved_model_paths.append(saved_model_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "86cafc34", + "metadata": {}, + "source": [ + "### Using the Intel Transfer Learning Tool API\n", + "\n", + "Next, we train the same model using the same parameters using the Intel Transfer Learning Tool. The Intel Transfer Learning Tool training method has an argument called `use_trainer` to determine if the Hugging Face Trainer will be used. If `use_trainer=False`, the torch libraries will be used to train the model. The next cell will do the training with and without the Hugging Face Trainer, so that we can gather metrics both ways. After the model is trained, it is evaluated. Again, we save the training and evaluation metrics to lists."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e08223da", + "metadata": {}, + "outputs": [], + "source": [ + "# Intel Transfer Learning Tool using the Hugging Face Trainer\n", + "tlt_trainer_saved_model_paths = []\n", + "tlt_trainer_training_metrics = []\n", + "tlt_trainer_eval_results = []\n", + "\n", + "# Intel Transfer Learning Tool training using torch libraries\n", + "tlt_torch_saved_model_paths = []\n", + "tlt_torch_training_metrics = []\n", + "tlt_torch_eval_results = []\n", + "\n", + "split_names = ['train'] if eval_split is None else ['train', eval_split]\n", + "\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " print('-' * 40)\n", + " print('Training using batch size: {}'.format(batch_size))\n", + " print('-' * 40)\n", + "\n", + " # Get the dataset\n", + " dataset = dataset_factory.get_dataset(dataset_directory, use_case, framework, dataset_name,\n", + " dataset_catalog=\"huggingface\", shuffle_files=shuffle_files,\n", + " split=split_names)\n", + "\n", + " # Batch and tokenize the dataset\n", + " dataset.preprocess(model_name, batch_size=batch_size, max_length=max_sequence_length, padding=padding,\n", + " truncation=truncation)\n", + "\n", + " # If the dataset doesn't have a defined split, then split it by percentages\n", + " if eval_split is None:\n", + " dataset.shuffle_split(train_pct=training_split, val_pct=validation_split)\n", + " \n", + " tlt_train_dataset_length = len(dataset.train_subset)\n", + " \n", + " if eval_split == 'test':\n", + " eval_dataset = dataset.test_subset\n", + " tlt_eval_dataset_length = len(eval_dataset)\n", + " else:\n", + " eval_dataset = dataset.validation_subset\n", + " tlt_eval_dataset_length = len(eval_dataset)\n", + " \n", + " # Verify dataset length between the experiments\n", + " assert tlt_train_dataset_length == hf_train_dataset_length\n", + " assert tlt_eval_dataset_length == hf_eval_dataset_length\n", + " \n", + " for use_trainer in [True, False]:\n", + " print('\\nTraining using Hugging Face Trainer: {}'.format(use_trainer))\n", + " \n", + " # Get the model\n", + " model = model_factory.get_model(model_name, framework)\n", + "\n", + " # Train the model\n", + " history = model.train(dataset, output_directory, epochs=training_epochs, ipex_optimize=use_ipex,\n", + " use_trainer=use_trainer, do_eval=False, learning_rate=learning_rate, seed=seed)\n", + " \n", + " eval_metrics = model.evaluate(eval_dataset)\n", + "\n", + " # Save the model\n", + " saved_model_dir = model.export(output_directory)\n", + " \n", + " if use_trainer:\n", + " tlt_trainer_training_metrics.append(history)\n", + " tlt_trainer_saved_model_paths.append(saved_model_dir)\n", + " tlt_trainer_eval_results.append(eval_metrics)\n", + " else:\n", + " tlt_torch_training_metrics.append(history)\n", + " tlt_torch_saved_model_paths.append(saved_model_dir)\n", + " tlt_torch_eval_results.append(eval_metrics)" + ] + }, + { + "cell_type": "markdown", + "id": "c8a27d05", + "metadata": {}, + "source": [ + "## 4. 
Compare metrics\n", + "\n", + "This section compares metrics for training and evaluating the model for the following experiments:\n", + "* Using the Hugging Face Trainer\n", + "* Using the Intel Transfer Learning Tool with the Hugging Face Trainer\n", + "* Using the Intel Transfer Learning Tool with torch" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "570f872d", + "metadata": {}, + "outputs": [], + "source": [ + "display_df = []\n", + "\n", + "# Display training metrics\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " df = pd.DataFrame({\n", + " 'Hugging Face Trainer': [hf_training_metrics[i].metrics['train_loss'], hf_training_metrics[i].metrics['train_samples_per_second'], hf_training_metrics[i].metrics['train_runtime']],\n", + " 'Intel Transfer Learning Tool
using the HF Trainer': [tlt_trainer_training_metrics[i].metrics['train_loss'], tlt_trainer_training_metrics[i].metrics['train_samples_per_second'], tlt_trainer_training_metrics[i].metrics['train_runtime']],\n", + " 'Intel Transfer Learning Tool
using Torch': [tlt_torch_training_metrics[i]['Loss'], tlt_torch_training_metrics[i]['train_samples_per_second'][0], tlt_torch_training_metrics[i]['train_runtime'][0]],\n", + " }, index = ['Loss', 'Samples per second', 'Train Runtime'])\n", + " df = df.style.set_table_styles(table_styles).set_caption(\"Training metrics with batch size {}\".format(batch_size))\n", + " display_df.append(df)\n", + "\n", + "# Display evaluation metrics\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " df = pd.DataFrame({\n", + " 'Eval using the
Hugging Face Trainer': [\"{0:.2%}\".format(hf_eval_results[i]['eval_accuracy']), hf_eval_results[i]['eval_loss'], hf_eval_results[i]['eval_samples_per_second'], hf_eval_results[i]['eval_runtime']],\n", + " 'Intel Transfer Learning Tool
eval using the HF Trainer': [\"{0:.2%}\".format(tlt_trainer_eval_results[i]['eval_accuracy']), tlt_trainer_eval_results[i]['eval_loss'], tlt_trainer_eval_results[i]['eval_samples_per_second'], tlt_trainer_eval_results[i]['eval_runtime']],\n", + " 'Intel Transfer Learning Tool
eval using Torch': [\"{0:.2%}\".format(tlt_torch_eval_results[i]['eval_accuracy']), tlt_torch_eval_results[i]['eval_loss'], tlt_torch_eval_results[i]['eval_samples_per_second'], tlt_torch_eval_results[i]['eval_runtime']],\n", + " }, index = ['Eval accuracy', 'Eval Loss', 'Samples per second', 'Eval Runtime'])\n", + " df = df.style.set_table_styles(table_styles).set_caption(\"Evaluation metrics with batch size {}\".format(batch_size))\n", + " display_df.append(df)\n", + " \n", + "for df in display_df:\n", + " display(df)" + ] + }, + { + "cell_type": "markdown", + "id": "89360585", + "metadata": {}, + "source": [ + "### Training metrics\n", + "\n", + "Generate charts to compare the time that it took to train the model in each experiment (lower is better) and the throughput (higher is better)." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0919f4dc", + "metadata": {}, + "outputs": [], + "source": [ + "# Bar chart group labels\n", + "groups = [\"batch size = {}\".format(bs) for bs in batch_size_list]\n", + "\n", + "hf_train_runtime = [x.metrics['train_runtime'] for x in hf_training_metrics]\n", + "tlt_trainer_train_runtime = [x.metrics['train_runtime'] for x in tlt_trainer_training_metrics]\n", + "tlt_torch_train_runtime = [x['train_runtime'][0] for x in tlt_torch_training_metrics]\n", + "\n", + "hf_train_throughput = [x.metrics['train_samples_per_second'] for x in hf_training_metrics]\n", + "tlt_trainer_train_throughput = [x.metrics['train_samples_per_second'] for x in tlt_trainer_training_metrics]\n", + "tlt_torch_train_throughput = [x['train_samples_per_second'][0] for x in tlt_torch_training_metrics]\n", + "\n", + "x = np.arange(len(groups))\n", + "width = 0.2 # the width of the bars\n", + "multiplier = 0\n", + "\n", + "# Setup bars for training run times\n", + "fig, (ax1, ax2) = plt.subplots(2)\n", + "fig.set_figheight(15)\n", + "fig.set_figwidth(10)\n", + "rects_tf = ax1.bar(x, hf_train_runtime, width, label='HF trained', color=yellow)\n", + "rects_tlt_trainer = ax1.bar(x + width, tlt_trainer_train_runtime, width, label='TLT using Trainer', color=blue)\n", + "rects_tlt_torch = ax1.bar(x + width * 2, tlt_torch_train_runtime, width, label='TLT using Torch', color=dark_blue)\n", + "ax1.bar_label(rects_tf, padding=3)\n", + "ax1.bar_label(rects_tlt_trainer, padding=3)\n", + "ax1.bar_label(rects_tlt_torch, padding=3)\n", + "\n", + "# Add labels, title, and legend\n", + "ax1.set_ylabel('Seconds')\n", + "ax1.set_title('Training Runtime')\n", + "ax1.set_xticks(x+width, groups)\n", + "ax1.set_ymargin(0.2) \n", + "ax1.legend(ncols=2)\n", + "\n", + "# Setup bars for throughput\n", + "rects_tf = ax2.bar(x, hf_train_throughput, width, label='HF trained', color=yellow)\n", + "rects_tlt_trainer = ax2.bar(x + width, tlt_trainer_train_throughput, width, label='TLT using Trainer', color=blue)\n", + "rects_tlt_torch = ax2.bar(x + width * 2, tlt_torch_train_throughput, width, label='TLT using Torch', color=dark_blue)\n", + "ax2.bar_label(rects_tf, padding=3)\n", + "ax2.bar_label(rects_tlt_trainer, padding=3)\n", + "ax2.bar_label(rects_tlt_torch, padding=3)\n", + "\n", + "# Add labels, title, and legend\n", + "ax2.set_ylabel('Samples per second')\n", + "ax2.set_title('Training Throughput')\n", + "ax2.set_xticks(x+width, groups)\n", + "ax2.set_ymargin(0.2) \n", + "ax2.legend(ncols=2)\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "id": "54559456", + "metadata": {}, + "source": [ + "### Evaluation Metrics\n", + "\n", + "Next, we generate charts to compare the evaluation 
metrics for the same three experiments that were used for training the model. We have charts with the validation accuracy, total evaluation time (lower is better), and evaluation throughput (higher is better)." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "02473c34", + "metadata": {}, + "outputs": [], + "source": [ + "# Decimals used for rounding\n", + "decimals = 2\n", + "\n", + "# Get the evaluation metrics\n", + "hf_eval_acc = [round(x['eval_accuracy'] * 100, decimals) for x in hf_eval_results]\n", + "tlt_trainer_eval_acc = [round(x['eval_accuracy'] * 100, decimals) for x in tlt_trainer_eval_results]\n", + "tlt_torch_eval_acc = [round(x['eval_accuracy'] * 100, decimals) for x in tlt_torch_eval_results]\n", + "\n", + "hf_eval_runtime = [round(x['eval_runtime'], decimals) for x in hf_eval_results]\n", + "tlt_trainer_eval_runtime = [round(x['eval_runtime'], decimals) for x in tlt_trainer_eval_results]\n", + "tlt_torch_eval_runtime = [round(x['eval_runtime'], decimals) for x in tlt_torch_eval_results]\n", + "\n", + "hf_eval_throughput = [round(x['eval_samples_per_second'], decimals) for x in hf_eval_results]\n", + "tlt_trainer_eval_throughput = [round(x['eval_samples_per_second'], decimals) for x in tlt_trainer_eval_results]\n", + "tlt_torch_eval_throughput = [round(x['eval_samples_per_second'], decimals) for x in tlt_torch_eval_results]\n", + "\n", + "x = np.arange(len(groups))\n", + "width = 0.2 # the width of the bars\n", + "multiplier = 0\n", + "\n", + "# Setup bars for evaluation accuracy\n", + "fig, (ax1, ax2, ax3) = plt.subplots(3)\n", + "fig.set_figheight(20)\n", + "fig.set_figwidth(10)\n", + "rects_tf = ax1.bar(x, hf_eval_acc, width, label='HF evaluated', color=yellow)\n", + "rects_tlt_trainer = ax1.bar(x + width, tlt_trainer_eval_acc, width, label='TLT eval using Trainer', color=blue)\n", + "rects_tlt_torch = ax1.bar(x + width * 2, tlt_torch_eval_acc, width, label='TLT eval using Torch', color=dark_blue)\n", + "ax1.bar_label(rects_tf, padding=3)\n", + "ax1.bar_label(rects_tlt_trainer, padding=3)\n", + "ax1.bar_label(rects_tlt_torch, padding=3)\n", + "\n", + "# Add labels, title, and legend\n", + "ax1.set_ylabel('Percentage (%)')\n", + "ax1.set_title('Evaluation Accuracy')\n", + "ax1.set_xticks(x+width, groups)\n", + "ax1.set_ymargin(0.2) \n", + "ax1.legend(ncols=2)\n", + "\n", + "rects_tf = ax2.bar(x, hf_eval_runtime, width, label='HF evaluated', color=yellow)\n", + "rects_tlt_trainer = ax2.bar(x + width, tlt_trainer_eval_runtime, width, label='TLT eval using Trainer', color=blue)\n", + "rects_tlt_torch = ax2.bar(x + width * 2, tlt_torch_eval_runtime, width, label='TLT eval using Torch', color=dark_blue)\n", + "ax2.bar_label(rects_tf, padding=3)\n", + "ax2.bar_label(rects_tlt_trainer, padding=3)\n", + "ax2.bar_label(rects_tlt_torch, padding=3)\n", + "\n", + "# Add labels, title, and legend\n", + "ax2.set_ylabel('Seconds')\n", + "ax2.set_title('Evaluation Runtime')\n", + "ax2.set_xticks(x+width, groups)\n", + "ax2.set_ymargin(0.2) \n", + "ax2.legend(ncols=2)\n", + "\n", + "# Setup bars for throughput\n", + "rects_tf = ax3.bar(x, hf_eval_throughput, width, label='HF evaluated', color=yellow)\n", + "rects_tlt_trainer = ax3.bar(x + width, tlt_trainer_eval_throughput, width, label='TLT eval using Trainer', color=blue)\n", + "rects_tlt_torch = ax3.bar(x + width * 2, tlt_torch_eval_throughput, width, label='TLT eval using Torch', color=dark_blue)\n", + "ax3.bar_label(rects_tf, padding=3)\n", + "ax3.bar_label(rects_tlt_trainer, padding=3)\n", +
"ax3.bar_label(rects_tlt_torch, padding=3)\n", + "\n", + "# Add labels, title, and legend\n", + "ax3.set_ylabel('Samples per second')\n", + "ax3.set_title('Evaluation Throughput')\n", + "ax3.set_xticks(x+width, groups)\n", + "ax3.set_ymargin(0.2) \n", + "ax3.legend(ncols=2)\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "id": "68f77b7d", + "metadata": {}, + "source": [ + "## Next Steps\n", + "\n", + "This concludes our performance comparison using a Hugging Face model with the Hugging Face `Trainer` and the Intel Transfer Learning Tool. All of the models trained during these experiments have been saved to your output directory. Any of these can be loaded back to perform further experiments." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "3c26d581", + "metadata": {}, + "outputs": [], + "source": [ + "for i, batch_size in enumerate(batch_size_list):\n", + " print(\"\\nUsing batch size {}\".format(batch_size))\n", + " print('-' * 25)\n", + " print(\"Model trained using the Hugging Face Trainer:\\n\\t\", hf_saved_model_paths[i])\n", + " print(\"Model trained using the Intel Transfer Learning tool and the Hugging Face Trainer:\\n\\t\", tlt_trainer_saved_model_paths[i])\n", + " print(\"Model trained using the Intel Transfer Learning tool and the PyTorch libraries:\\n\\t\", tlt_torch_saved_model_paths[i])" + ] + }, + { + "cell_type": "markdown", + "id": "13e228cd", + "metadata": {}, + "source": [ + "## Citations \n", + "\n", + "```\n", + "@misc{devlin2019bert,\n", + " title={BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding}, \n", + " author={Jacob Devlin and Ming-Wei Chang and Kenton Lee and Kristina Toutanova},\n", + " year={2019},\n", + " eprint={1810.04805},\n", + " archivePrefix={arXiv},\n", + " primaryClass={cs.CL}\n", + "}\n", + "```\n", + "\n", + "```\n", + "@InProceedings{maas-EtAl:2011:ACL-HLT2011,\n", + " author = {Maas, Andrew L. and Daly, Raymond E. and Pham, Peter T. and Huang, Dan and Ng, Andrew Y. 
and Potts, Christopher},\n", + " title = {Learning Word Vectors for Sentiment Analysis},\n", + " booktitle = {Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies},\n", + " month = {June},\n", + " year = {2011},\n", + " address = {Portland, Oregon, USA},\n", + " publisher = {Association for Computational Linguistics},\n", + " pages = {142--150},\n", + " url = {http://www.aclweb.org/anthology/P11-1015}\n", + "}\n", + "```" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.16" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/performance/tf_image_classification_performance.ipynb b/notebooks/performance/tf_image_classification_performance.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..1c2414474dcbf6f0e6eff54b1af0c190e1e912d5 --- /dev/null +++ b/notebooks/performance/tf_image_classification_performance.ipynb @@ -0,0 +1,1347 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "924b27fa", + "metadata": {}, + "source": [ + "# Performance Comparison: Image Classification Transfer Learning with TensorFlow and the Intel® Transfer Learning Tool\n", + "\n", + "This notebook uses the TensorFlow libraries to do transfer learning with an image classification model. The model is exported, evaluated, and used to generate predictions. The same sequence is also done using the Intel Transfer Learning Tool. The Intel Transfer Learning Tool is also used to optimize and quantize the trained model.\n", + "\n", + "Graphs are generated to visually compare:\n", + "* Training metrics (time per epoch, accuracy by epoch, loss by epoch)\n", + "* Evaluation metrics (time to evaluate the validation dataset, accuracy using the validation data)\n", + "* Prediction time for a single batch\n", + "* Latency and throughput for the trained models, quantized model, and the optimized model.\n", + "\n", + "The notebook has variables for controlling parameters such as the model name, dataset, the number of training epochs, and the batch size(s)."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1f305fbd", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2' \n", + "\n", + "import math\n", + "import matplotlib.pyplot as plt\n", + "import matplotlib.ticker as mtick\n", + "import numpy as np\n", + "import pandas as pd\n", + "import psutil\n", + "import random\n", + "import tempfile\n", + "import tensorflow as tf\n", + "import tensorflow_hub as hub\n", + "import warnings\n", + "\n", + "from tlt.datasets import dataset_factory\n", + "from tlt.models import model_factory\n", + "from tlt.utils.file_utils import download_and_extract_tar_file\n", + "from tlt.utils.platform_util import CPUInfo, OptimizedPlatformUtil, PlatformUtil\n", + "from utils import inc_utils\n", + "\n", + "# Ignore all warnings\n", + "warnings.filterwarnings('ignore')\n", + "tf.get_logger().setLevel('ERROR')\n", + "\n", + "# Specify the default dataset directory\n", + "dataset_directory = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + "\n", + "# Specify a directory for output (saved models and checkpoints)\n", + "output_directory = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "print(\"Output directory:\", output_directory)\n", + "\n", + "# TF Hub cache directory\n", + "os.environ[\"TFHUB_CACHE_DIR\"] = os.path.join(output_directory, \".cache\", \"tfhub_modules\")\n", + "\n", + "# Data Frame styles\n", + "table_styles = [{\n", + " 'selector': 'caption',\n", + " 'props': [\n", + " ('text-align', 'center'),\n", + " ('color', 'black'),\n", + " ('font-size', '16px')\n", + " ]\n", + "}]\n", + "\n", + "# Colors used in charts\n", + "orange = '#ff6f00'\n", + "blue = '#0071c5'\n", + "dark_blue = '#003c71'\n", + "yellow = '#f3d54e'\n", + "\n", + "# Caption style for DataFrames\n", + "caption_style = [dict(selector=\"caption\", props=[(\"text-align\", \"center\"), (\"font-size\", \"14pt\"), (\"color\", \"black\")])]\n", + "\n", + "# Line styles\n", + "line_styles = ['solid', 'dotted', 'dashed', 'dashdot']\n", + "\n", + "# Marker styles\n", + "marker_styles = ['o', 'D', 's', 'v']" + ] + }, + { + "cell_type": "markdown", + "id": "4270c3e8", + "metadata": {}, + "source": [ + "## 1. Display Platform Information\n", + "\n", + "Use the `CPUInfo` and `PlatformUtil` classes to get and display information about the platform and TensorFlow version."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2f3c3ee5", + "metadata": {}, + "outputs": [], + "source": [ + "# Get and display CPU/platform information\n", + "cpu_info = CPUInfo()\n", + "platform_util = PlatformUtil()\n", + "print(\"{0} CPU Information {0}\".format(\"=\" * 20))\n", + "print(\"CPU family:\", platform_util.cpu_family)\n", + "print(\"CPU model:\", platform_util.cpu_model)\n", + "print(\"CPU type:\", platform_util.cpu_type)\n", + "print(\"Physical cores per socket:\", cpu_info.cores_per_socket)\n", + "print(\"Total physical cores:\", cpu_info.cores)\n", + "cpufreq = psutil.cpu_freq()\n", + "print(\"Max Frequency:\", cpufreq.max)\n", + "print(\"Min Frequency:\", cpufreq.min)\n", + "cpu_socket_count = cpu_info.sockets\n", + "print(\"Socket Number:\", cpu_socket_count)\n", + "\n", + "print(\"\\n{0} Memory Information {0}\".format(\"=\" * 20))\n", + "svmem = psutil.virtual_memory()\n", + "print(\"Total: \", int(svmem.total / (1024 ** 3)), \"GB\")\n", + "\n", + "# Display TensorFlow version information\n", + "print(\"\\n{0} TensorFlow Information {0}\".format(\"=\" * 20))\n", + "print(\"TensorFlow version:\", tf.__version__)\n", + "print(\"TensorFlow Hub version:\", hub.__version__)\n", + "major_version = int(tf.__version__.split(\".\")[0])\n", + "minor_version = int(tf.__version__.split(\".\")[1])\n", + "if major_version >= 2:\n", + " onednn_enabled = 0\n", + " if minor_version < 5:\n", + " from tensorflow.python import _pywrap_util_port\n", + " else:\n", + " from tensorflow.python.util import _pywrap_util_port\n", + " onednn_enabled = int(os.environ.get('TF_ENABLE_ONEDNN_OPTS', '0'))\n", + " on_onednn = _pywrap_util_port.IsMklEnabled() or (onednn_enabled == 1)\n", + "else:\n", + " on_onednn = tf.pywrap_tensorflow.IsMklEnabled()\n", + "\n", + "print(\"oneDNN enabled:\", on_onednn)\n", + "\n", + "# Don't use the NVidia GPU, if there is one\n", + "os.environ['CUDA_VISIBLE_DEVICES'] = \"\"" + ] + }, + { + "cell_type": "markdown", + "id": "1d5a1252", + "metadata": {}, + "source": [ + "## 2. Select a model and define parameters to use during training and evaluation\n", + "\n", + "### Select a model\n", + "\n", + "See the list of supported image classification models from TensorFlow Hub in the Intel Transfer Learning Tool." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c4d9b894", + "metadata": {}, + "outputs": [], + "source": [ + "framework = 'tensorflow'\n", + "use_case = 'image_classification'\n", + "model_hub = 'TFHub'\n", + "supported_models = model_factory.get_supported_models(framework, use_case)\n", + "supported_models = supported_models[use_case]\n", + "\n", + "# Filter to only get relevant models\n", + "supported_models = { key:value for (key,value) in supported_models.items() if value[framework]['model_hub'] == model_hub}\n", + "\n", + "print(\"Supported {} models for {} from {}\".format(framework, use_case, model_hub))\n", + "print(\"=\" * 70)\n", + "for model_name in supported_models.keys():\n", + " print(model_name)" + ] + }, + { + "cell_type": "markdown", + "id": "fd14554e", + "metadata": {}, + "source": [ + "Set the `model_name` to the model that will be used for transfer learning." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bca71035", + "metadata": {}, + "outputs": [], + "source": [ + "# Select a model\n", + "model_name = \"resnet_v1_50\"\n", + "\n", + "# Get information about the model (image size and the feature vector handle)\n", + "# This information will be used during transfer learning using the TensorFlow framework API\n", + "if model_name in supported_models.keys():\n", + " model_info = supported_models[model_name][framework]\n", + " image_size = model_info[\"image_size\"]\n", + " feature_vector_handle = model_info['feature_vector']\n", + " \n", + " print(\"Model Name: {}\".format(model_name))\n", + " print(\"TF Hub feature vector: {}\".format(feature_vector_handle))\n", + " print(\"Image size: {}\".format(image_size))\n", + "else:\n", + " raise ValueError(\"The specified model is unsupported. Please select a model from the list of supported models.\")" + ] + }, + { + "cell_type": "markdown", + "id": "e05fc52e", + "metadata": {}, + "source": [ + "### Select a dataset\n", + "\n", + "By default, the notebook will use the [TensorFlow Flowers dataset](https://www.tensorflow.org/datasets/catalog/tf_flowers), which has flower images that belong to 5 categories.\n", + "\n", + "To use your own dataset, set the `dataset_subdir` variable to the dataset path. The dataset directory is expected to have folders of images for each class, where the name of the folder will be used as the class name.\n", + "\n", + "```\n", + "dataset_dir\n", + " ├── class_a\n", + " ├── class_b\n", + " └── class_c\n", + "```\n", + "\n", + "Optionally, the `dataset_subdir` directory can have `train` and `test`/`validation` subdirectories. For example:\n", + "```\n", + "dataset_dir\n", + " ├── train\n", + " | ├── class_a\n", + " | ├── class_b\n", + " | └── class_c\n", + " └── test\n", + " ├── class_a\n", + " ├── class_b\n", + " └── class_c\n", + "```\n", + "If the dataset does not have separate folders for train and test/validation, the dataset will be split by percentage." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4a0d6c0d", + "metadata": {}, + "outputs": [], + "source": [ + "dataset_subdir = os.path.join(dataset_directory, \"flower_photos\")\n", + "\n", + "# Download the flowers dataset, if the folder doesn't exist\n", + "if not os.path.exists(dataset_subdir):\n", + " os.makedirs(dataset_subdir)\n", + " dataset_url = \"https://storage.googleapis.com/download.tensorflow.org/example_images/flower_photos.tgz\"\n", + " download_and_extract_tar_file(dataset_url, dataset_directory)\n", + " \n", + "print(\"Dataset path:\", dataset_subdir)\n", + "\n", + "print(\"\\nFolders in the dataset directory:\")\n", + "for d in os.listdir(dataset_subdir):\n", + " if os.path.isdir(os.path.join(dataset_subdir, d)):\n", + " print(\"-\", d)" + ] + }, + { + "cell_type": "markdown", + "id": "e1aa58df", + "metadata": {}, + "source": [ + "### Define parameters\n", + "\n", + "For consistency between the model training using the TensorFlow framework API and the model training using the Intel Transfer Learning Tool API, the next cell defines parameters that will be used by both methods." 
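+ "\n",
+ "One of these parameters is a random seed. As a small sketch of why fixing the seed matters for run-to-run consistency (illustrative only):\n",
+ "\n",
+ "```python\n",
+ "import tensorflow as tf\n",
+ "\n",
+ "tf.random.set_seed(10)\n",
+ "a = tf.random.uniform([3])\n",
+ "tf.random.set_seed(10)\n",
+ "b = tf.random.uniform([3])\n",
+ "assert (a.numpy() == b.numpy()).all()  # same seed -> identical draws\n",
+ "```"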
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "eee80253", + "metadata": {}, + "outputs": [], + "source": [ + "# Number of training epochs\n", + "training_epochs = 2\n", + "\n", + "# Shuffle the files after each training epoch\n", + "shuffle_files = True\n", + "\n", + "# Define training/validation splits for the dataset\n", + "# (if the dataset directory does not have subdirectories for train and test/validation)\n", + "validation_split = 0.25\n", + "training_split = 1 - validation_split\n", + "\n", + "# Set seed for consistency between runs (or None)\n", + "seed = 10\n", + "\n", + "# List of batch size(s) to compare (maximum of 4 batch sizes to try)\n", + "batch_size_list = [ 256, 512 ]" + ] + }, + { + "cell_type": "markdown", + "id": "4847ae1d", + "metadata": {}, + "source": [ + "Validate the parameter values and then print them." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "051ea2a1", + "metadata": {}, + "outputs": [], + "source": [ + "if not isinstance(training_epochs, int):\n", + " raise TypeError(\"The training_epochs parameter should be an integer, but found a {}\".format(type(training_epochs)))\n", + "\n", + "if training_epochs < 1:\n", + " raise ValueError(\"The training_epochs parameter should not be less than 1.\")\n", + " \n", + "if not isinstance(shuffle_files, bool):\n", + " raise TypeError(\"The shuffle_files parameter should be a bool, but found a {}\".format(type(shuffle_files)))\n", + "\n", + "if not isinstance(validation_split, float):\n", + " raise TypeError(\"The validation_split parameter should be a float, but found a {}\".format(type(validation_split)))\n", + "\n", + "if not isinstance(training_split, float):\n", + " raise TypeError(\"The training_split parameter should be a float, but found a {}\".format(type(training_split)))\n", + "\n", + "if validation_split + training_split > 1:\n", + " raise ValueError(\"The sum of validation_split and training_split should not be greater than 1.\")\n", + "\n", + "if seed and not isinstance(seed, int):\n", + " raise TypeError(\"The seed parameter should be an integer or None, but found a {}\".format(type(seed)))\n", + "\n", + "if len(batch_size_list) > 4 or len(batch_size_list) == 0:\n", + " raise ValueError(\"The batch_size_list should have at most 4 values, but found {} values ({})\".format(\n", + " len(batch_size_list), batch_size_list))\n", + " \n", + "print(\"Number of training epochs:\", training_epochs)\n", + "print(\"Shuffle files:\", shuffle_files)\n", + "print(\"Training split: {}%\".format(training_split*100))\n", + "print(\"Validation split: {}%\".format(validation_split*100))\n", + "print(\"Seed:\", str(seed))\n", + "print(\"Batch size list:\", batch_size_list)" + ] + }, + { + "cell_type": "markdown", + "id": "fb2d786a", + "metadata": {}, + "source": [ + "Define a callback class that tracks the time it takes to run training epochs, evaluation, and batch predictions."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "713f648f", + "metadata": {}, + "outputs": [], + "source": [ + "# Callback to track the training time for each epoch, evaluation time, or prediction time\n", + "class TimerCallback(tf.keras.callbacks.Callback):\n", + " def __init__(self):\n", + " self.epoch_times = []\n", + " self.eval_times = []\n", + " self.predict_times = []\n", + " def on_epoch_begin(self, epoch, logs={}):\n", + " self.tf_timestamp = tf.timestamp()\n", + " def on_epoch_end(self, epoch, logs={}):\n", + " self.epoch_times.append((tf.timestamp() - self.tf_timestamp).numpy())\n", + " def on_test_begin(self, logs={}):\n", + " self.tf_timestamp = tf.timestamp()\n", + " def on_test_end(self, logs={}):\n", + " self.eval_times.append((tf.timestamp() - self.tf_timestamp).numpy())\n", + " def on_predict_begin(self, logs={}):\n", + " self.tf_timestamp = tf.timestamp()\n", + " def on_predict_end(self, logs={}):\n", + " self.predict_times.append((tf.timestamp() - self.tf_timestamp).numpy())" + ] + }, + { + "cell_type": "markdown", + "id": "abd401a7", + "metadata": {}, + "source": [ + "## 3. Compare the training time for transfer learning\n", + "\n", + "In this section, we will compare the time it takes to retrain the image classification model using the dataset that was selected in the previous section.\n", + "\n", + "The training will be done in two different ways to compare:\n", + "* Transfer learning using the TensorFlow framework and TF Hub libraries\n", + "* Transfer learning using the Intel Transfer Learning Tool API\n", + "\n", + "### Transfer learning using the TensorFlow framework and TF Hub libraries\n", + "\n", + "This section goes through using the TensorFlow framework and TF Hub libraries to retrain the model using the selected dataset.\n", + "\n", + "First, the dataset is loaded, which allows us to determine the number of classes in the dataset. The original ImageNet dataset that the image classification model was trained on has 1000 classes. To do transfer learning using the new dataset, we will get the feature vector from TF Hub and then add on a classification layer that matches the number of classes in the new dataset.\n", + "\n", + "If multiple batch sizes were set in the `batch_size_list`, training will be run for each batch size.\n",
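+ "\n",
+ "The `TimerCallback` defined above plugs into the standard Keras callback mechanism. A minimal usage sketch on a throwaway model (illustrative only; the real runs below attach it to the actual training calls):\n",
+ "\n",
+ "```python\n",
+ "timer = TimerCallback()\n",
+ "toy = tf.keras.Sequential([tf.keras.layers.Dense(1)])\n",
+ "toy.compile(optimizer='adam', loss='mse')\n",
+ "toy.fit(tf.zeros([16, 4]), tf.zeros([16, 1]), epochs=2, callbacks=[timer], verbose=0)\n",
+ "print(timer.epoch_times)  # wall-clock seconds per epoch\n",
+ "```"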
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "08cfd3ea", + "metadata": {}, + "outputs": [], + "source": [ + "# Set seed\n", + "if seed:\n", + " os.environ['PYTHONHASHSEED'] = str(seed)\n", + " random.seed(seed)\n", + " np.random.seed(seed)\n", + " tf.random.set_seed(seed)\n", + "\n", + "# Lists to track callbacks, datasets, models, and saved model directory for each batch size experiment\n", + "tf_time_callback_list = []\n", + "tf_dataset_list = []\n", + "tf_model_list = []\n", + "tf_export_dir_list = []\n", + "tf_history_list = []\n", + "\n", + "# Check if the dataset directory has subdirectories for train/validation/test splits\n", + "val_dataset_dir = None\n", + "train_dataset_dir = dataset_subdir\n", + "if os.path.exists(os.path.join(dataset_subdir, 'train')):\n", + " train_dataset_dir = os.path.join(dataset_subdir, 'train')\n", + " val_dataset_dir = os.path.join(dataset_subdir, 'validation')\n", + " \n", + " if not os.path.exists(val_dataset_dir):\n", + " if os.path.exists(os.path.join(dataset_subdir, 'test')):\n", + " val_dataset_dir = os.path.join(dataset_subdir, 'test')\n", + " else:\n", + " raise ValueError('The dataset directory ({}) has a \"train\" directory, but no \"validation\" or \"test\" directory.'.format(dataset_subdir))\n", + "\n", + " print(\"Using training data from {}\".format(train_dataset_dir))\n", + " print(\"Using validation data from {}\".format(val_dataset_dir))\n", + " \n", + "# Load the dataset\n", + "tf_dataset = tf.keras.utils.image_dataset_from_directory(train_dataset_dir, batch_size=None, seed=seed)\n", + "class_names = tf_dataset.class_names\n", + "\n", + "if shuffle_files:\n", + " tf_dataset = tf_dataset.shuffle(tf_dataset.cardinality(), reshuffle_each_iteration=False, seed=seed)\n", + "\n", + "if val_dataset_dir:\n", + " # Load the validation/test sub directory\n", + " train_ds = tf_dataset\n", + " val_ds = tf.keras.utils.image_dataset_from_directory(val_dataset_dir, batch_size=None, seed=seed) \n", + " if shuffle_files:\n", + " val_ds = val_ds.shuffle(val_ds.cardinality(), reshuffle_each_iteration=False, seed=seed)\n", + " train_size = len(train_ds)\n", + " val_size = len(val_ds)\n", + "else:\n", + " # Split the data into train/validation subsets (Note that image_dataset_from_directory can also do splitting but\n", + " # we are doing it this way to match what the Intel Transfer Learning Tool does to ensure the same sized splits)\n", + " train_size = int(training_split * len(tf_dataset))\n", + " val_size = int(validation_split * len(tf_dataset))\n", + " train_ds = tf_dataset.take(train_size)\n", + " val_ds = tf_dataset.skip(train_size).take(val_size)\n", + "\n", + "print(\"Training dataset size:\", train_size)\n", + "print(\"Validation dataset size:\", val_size)\n", + " \n", + "# Preprocess the dataset\n", + "normalization_layer = tf.keras.layers.Rescaling(1.
/ 255)\n", + "\n", + "def preprocess_image(image, label):\n", + " image = tf.image.resize_with_pad(image, image_size, image_size)\n", + " image = normalization_layer(image)\n", + " return (image, label)\n", + "\n", + "train_ds = train_ds.map(preprocess_image)\n", + "val_ds = val_ds.map(preprocess_image)\n", + "\n", + "for batch_size in batch_size_list:\n", + " print('-' * 40)\n", + " print('Training using batch size: {}'.format(batch_size))\n", + " print('-' * 40)\n", + " \n", + " # Batch the dataset\n", + " batched_train_ds = train_ds.batch(batch_size)\n", + " batched_val_ds = val_ds.batch(batch_size)\n", + " \n", + " # Get the feature extractor layer from TF Hub\n", + " feature_extractor_layer = hub.KerasLayer(feature_vector_handle,\n", + " input_shape=(image_size, image_size, 3),\n", + " trainable=False)\n", + "\n", + " # Add the dense layer sized according to the number of classes in our dataset\n", + " tf_model = tf.keras.Sequential([\n", + " feature_extractor_layer,\n", + " tf.keras.layers.Dense(len(class_names))\n", + " ])\n", + "\n", + " # Configure the model optimizer and loss function\n", + " tf_model.compile(\n", + " optimizer=tf.keras.optimizers.Adam(),\n", + " loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True),\n", + " metrics=['acc'])\n", + " \n", + " tf_model.summary()\n", + "\n", + " # Define the callback for tracking the time it takes to train each epoch\n", + " tf_time_callback = TimerCallback()\n", + "\n", + " # Train the model\n", + " tf_history_list.append(tf_model.fit(batched_train_ds, epochs=training_epochs, shuffle=shuffle_files,\n", + " callbacks=[tf_time_callback]))\n", + " \n", + " # Export the trained model\n", + " tf_export_dir = os.path.join(output_directory, \"tf_saved_models\", model_name)\n", + " if not os.path.exists(tf_export_dir):\n", + " os.makedirs(tf_export_dir)\n", + " tf_export_dir = tempfile.mkdtemp(prefix=tf_export_dir + '/')\n", + " print(\"Save model to:\", tf_export_dir)\n", + " tf_model.save(tf_export_dir)\n", + " \n", + " # Append to lists for each batch size\n", + " tf_time_callback_list.append(tf_time_callback)\n", + " tf_dataset_list.append((batched_train_ds, batched_val_ds))\n", + " tf_model_list.append(tf_model)\n", + " tf_export_dir_list.append(tf_export_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "160cf79a", + "metadata": {}, + "source": [ + "### Transfer learning using the Intel Transfer Learning Tool API\n", + "\n", + "This section uses the Intel Transfer Learning Tool API to retrain the model using the selected dataset. This API simplifies the transfer learning process, so there are fewer lines of code compared to directly using the TensorFlow and TensorFlow Hub libraries."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "2fd15b3f", + "metadata": {}, + "outputs": [], + "source": [ + "# Use the OptimizedPlatformUtil class from the Intel Transfer Learning Tool API to set recommended settings\n", + "optimized_platform_util = OptimizedPlatformUtil(omp_num_threads=cpu_info.cores_per_socket,\n", + " kmp_blocktime=0,\n", + " kmp_affinity='granularity=fine,compact,1,0',\n", + " tf_num_intraop_threads=cpu_info.cores_per_socket,\n", + " tf_num_interop_threads=cpu_info.sockets,\n", + " force_reset_env_vars=True)\n", + "\n", + "for k, v in optimized_platform_util.env_vars_dict.items():\n", + " if v is not None:\n", + " print(\"{}: {}\".format(k, v))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "fac3d6df", + "metadata": {}, + "outputs": [], + "source": [ + "# Lists to track callbacks, datasets, models, and saved model directory for each batch size experiment\n", + "tlt_time_callback_list = []\n", + "tlt_dataset_list = []\n", + "tlt_model_list = []\n", + "tlt_export_dir_list = []\n", + "tlt_history_list = []\n", + " \n", + "for batch_size in batch_size_list:\n", + " print('-' * 40)\n", + " print('Training using batch size: {}'.format(batch_size))\n", + " print('-' * 40)\n", + " \n", + " # Use the model factory to get the model\n", + " tlt_model = model_factory.get_model(model_name=model_name, framework=framework)\n", + " \n", + " # Load, split, and preprocess the dataset\n", + " tlt_dataset = dataset_factory.load_dataset(dataset_dir=dataset_subdir, use_case=use_case, framework=framework)\n", + " \n", + " if not tlt_dataset.train_subset:\n", + " tlt_dataset.shuffle_split(train_pct=training_split, val_pct=validation_split, seed=seed, shuffle_files=shuffle_files)\n", + " \n", + " tlt_dataset.preprocess(tlt_model.image_size, batch_size=batch_size)\n", + " \n", + " # Define the callback for tracking the time it takes to train each epoch\n", + " tlt_time_callback = TimerCallback()\n", + "\n", + " # Train the model\n", + " tlt_history_list.append(tlt_model.train(tlt_dataset, output_dir=output_directory, epochs=training_epochs,\n", + " shuffle_files=shuffle_files, do_eval=False, callbacks=tlt_time_callback,\n", + " seed=seed))\n", + "\n", + " # Export the trained model\n", + " tlt_export_dir = os.path.join(output_directory, \"tlt_saved_models\")\n", + " tlt_export_dir = tlt_model.export(tlt_export_dir)\n", + " \n", + " # Append to lists for each batch size\n", + " tlt_time_callback_list.append(tlt_time_callback)\n", + " tlt_dataset_list.append(tlt_dataset)\n", + " tlt_model_list.append(tlt_model)\n", + " tlt_export_dir_list.append(tlt_export_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "e5e52a50", + "metadata": {}, + "source": [ + "### Optimize the model using the Intel Transfer Learning Tool API\n", + "\n", + "After training, the Intel Transfer Learning Tool can optimize the model to improve inference performance. This is done using the [Intel® Neural Compressor](https://github.com/intel/neural-compressor), either by quantizing the model or by optimizing the full precision model.\n", + "\n", + "First, we set up a configuration with parameters that will be used by the Intel Neural Compressor for quantization.\n",
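+ "\n",
+ "Concretely, a relative accuracy criterion of 0.01 means the tuning loop only accepts a quantized model whose accuracy stays within 1% (relative) of the full precision baseline. With hypothetical numbers:\n",
+ "\n",
+ "```python\n",
+ "fp32_accuracy = 0.912      # hypothetical full-precision accuracy\n",
+ "relative_criterion = 0.01\n",
+ "min_acceptable = fp32_accuracy * (1 - relative_criterion)\n",
+ "print(min_acceptable)      # 0.90288 -> the quantized model must reach this\n",
+ "```"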
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "df079cb0", + "metadata": {}, + "outputs": [], + "source": [ + "tlt_quantization_dir_list = []\n", + "tlt_optimized_dir_list = []\n", + "inc_config_list = []\n", + "\n", + "# Create a tuning workspace directory for INC\n", + "nc_workspace = os.path.join(output_directory, 'nc_workspace')\n", + "\n", + "# Relative accuracy loss (1%)\n", + "relative_accuracy_criterion = 0.01\n", + "\n", + "# Define the exit policy timeout (in seconds) and max number of trials. The tuning process finishes when\n", + "# the timeout or max trials is reached. A tuning timeout of 0 means that the tuning phase stops when the\n", + "# accuracy criterion is met.\n", + "timeout = 0\n", + "max_trials = 15\n", + "\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " # Create output directories for the quantized and optimized models\n", + " tlt_quantization_dir = os.path.join(output_directory, 'tlt_quantized_models', model_name, os.path.basename(tlt_export_dir_list[i]))\n", + " tlt_optimized_dir = os.path.join(output_directory, 'tlt_optimized_models', model_name, os.path.basename(tlt_export_dir_list[i]))\n", + "\n", + " # Create an Intel Neural Compressor config based on the inputs that we are using\n", + " inc_config_list.append(tlt_model_list[i].get_inc_config(accuracy_criterion_relative=relative_accuracy_criterion,\n", + " exit_policy_timeout=timeout, exit_policy_max_trials=max_trials))\n", + " \n", + " # Append to lists for each batch size\n", + " tlt_quantization_dir_list.append(tlt_quantization_dir)\n", + " tlt_optimized_dir_list.append(tlt_optimized_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "534de66e", + "metadata": {}, + "source": [ + "Next, we quantize the model using the config that was just generated. Quantization aims to improve inference\n", + "performance by reducing the number of bits required, while maintaining close to the same accuracy as the full precision model." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "103ffd57", + "metadata": {}, + "outputs": [], + "source": [ + "for i, batch_size in enumerate(batch_size_list):\n", + " # Quantize the model trained for this batch size\n", + " tlt_model_list[i].quantize(tlt_quantization_dir_list[i], tlt_dataset_list[i], config=inc_config_list[i])" + ] + }, + { + "cell_type": "markdown", + "id": "cfeea7eb", + "metadata": {}, + "source": [ + "Another option to improve inference performance is using graph optimization through the Intel Neural Compressor, which:\n", + "* Converts variables to constants\n", + "* Removes training-only operations like checkpoint saving\n", + "* Strips out parts of the graph that are never reached\n", + "* Removes debug operations like CheckNumerics\n", + "* Folds batch normalization ops into the pre-calculated weights\n", + "* Fuses common operations into unified versions" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "6a2f7a8e", + "metadata": {}, + "outputs": [], + "source": [ + "for i, batch_size in enumerate(batch_size_list):\n", + " # Optimize the full precision model\n", + " tlt_model_list[i].optimize_graph(tlt_optimized_dir_list[i])" + ] + }, + { + "cell_type": "markdown", + "id": "304258ec", + "metadata": {}, + "source": [ + "### Compare training times\n", + "\n", + "The table below compares the time it took to train each epoch (in seconds) using the TensorFlow framework libraries directly versus the Intel Transfer Learning Tool API.\n",
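+ "\n",
+ "The throughput numbers shown alongside the epoch times are simple derived quantities. With hypothetical timings for one epoch:\n",
+ "\n",
+ "```python\n",
+ "train_size = 2752                            # hypothetical number of training images\n",
+ "tf_epoch_time, tlt_epoch_time = 95.0, 71.0   # hypothetical seconds per epoch\n",
+ "tf_ips = train_size / tf_epoch_time          # ~28.97 images/sec\n",
+ "tlt_ips = train_size / tlt_epoch_time        # ~38.76 images/sec\n",
+ "boost = (tlt_ips - tf_ips) / tf_ips * 100    # ~33.8% higher throughput\n",
+ "```"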
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "16299291", + "metadata": {}, + "outputs": [], + "source": [ + "display_df = []\n", + "plt.figure(figsize=(10,6))\n", + "\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " # Sanity check that both datasets had the same number of batches\n", + " if len(tf_dataset_list[i][0]) != len(tlt_dataset_list[i].train_subset):\n", + " print(\"WARNING: For batch size {}, the TF training dataset had {} batches and the TLT training dataset had \"\n", + " \"{} batches. These values should have been the same.\".format(batch_size, len(tf_dataset_list[i][0]), len(tlt_dataset_list[i].train_subset)))\n", + " \n", + " # Calculate images/second\n", + " tf_images_per_second = [train_size / t for t in tf_time_callback_list[i].epoch_times]\n", + " tlt_images_per_second = [train_size / t for t in tlt_time_callback_list[i].epoch_times]\n", + " performance_delta = [\"{0:.2f}%\".format((tlt-tf)/tf * 100) for tf, tlt in zip(tf_images_per_second, tlt_images_per_second)]\n", + "\n", + " # Graph the results\n", + " epoch_list = [str(i) for i in range(1, training_epochs + 1)]\n", + " tf_train_time = tf_time_callback_list[i].epoch_times\n", + " tlt_train_time = tlt_time_callback_list[i].epoch_times\n", + "\n", + " plt.plot(epoch_list, tf_train_time, label=\"Using TF libraries with batch size {}\".format(batch_size),\n", + " linestyle=line_styles[i], marker=marker_styles[i], color=orange)\n", + " plt.plot(epoch_list, tlt_train_time, label=\"Using TLT with batch size {}\".format(batch_size), \n", + " linestyle=line_styles[i], marker=marker_styles[i],color=blue)\n", + " \n", + " # Create a DataFrame to display the results in a table\n", + " df = pd.DataFrame({\n", + " 'TF epoch time
(seconds)': tf_time_callback_list[i].epoch_times,\n", + " 'TLT epoch time
(seconds)': tlt_time_callback_list[i].epoch_times,\n", + " 'TF throughput
(images/sec)': tf_images_per_second,\n", + " 'TLT throughput
(images/sec)': tlt_images_per_second,\n", + " 'Performance
Boost': performance_delta\n", + " })\n", + " df.index += 1 \n", + " df = df.style.set_table_styles(table_styles).set_caption(\"Epoch training times with batch size {}\".format(batch_size))\n", + " display_df.append(df)\n", + "\n", + "plt.title(\"Training time per epoch\")\n", + "plt.xlabel(\"Epoch\")\n", + "plt.ylabel(\"Seconds\")\n", + "plt.legend()\n", + "plt.show()\n", + "\n", + "# Display tables with epoch training time for each batch size\n", + "for df in display_df:\n", + " display(df)" + ] + }, + { + "cell_type": "markdown", + "id": "388a7675", + "metadata": {}, + "source": [ + "Next, visualize the accuracy and loss metrics collected during training." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "59598b38", + "metadata": {}, + "outputs": [], + "source": [ + "# Graph the training accuracy by epoch for each batch size\n", + "plt.figure(figsize=(10,6))\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " tf_acc_time = [i * 100 for i in tf_history_list[i].history['acc']]\n", + " tlt_acc_time = [i * 100 for i in tlt_history_list[i]['acc']]\n", + "\n", + " plt.plot(epoch_list, tf_acc_time, label = \"Using TF libraries (batch size = {})\".format(batch_size), linestyle=line_styles[i], marker=marker_styles[i], color=orange)\n", + " plt.plot(epoch_list, tlt_acc_time, label = \"Using TLT (batch size = {})\".format(batch_size), linestyle=line_styles[i], marker=marker_styles[i], color=blue)\n", + "\n", + "plt.title(\"Training Accuracy by Epoch\")\n", + "plt.xlabel(\"Epoch\")\n", + "plt.ylabel(\"Accuracy (%)\")\n", + "plt.legend()\n", + "plt.show()\n", + "\n", + "# Graph the training loss by epoch for each batch size\n", + "plt.figure(figsize=(10,6))\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " tf_loss_time = tf_history_list[i].history['loss']\n", + " tlt_loss_time = tlt_history_list[i]['loss']\n", + "\n", + " plt.plot(epoch_list, tf_loss_time, label = \"Using TF libraries (batch size = {})\".format(batch_size), linestyle=line_styles[i], marker=marker_styles[i], color=orange)\n", + " plt.plot(epoch_list, tlt_loss_time, label = \"Using TLT (batch size = {})\".format(batch_size), linestyle=line_styles[i], marker=marker_styles[i], color=blue)\n", + "\n", + "plt.title(\"Training Loss by Epoch\")\n", + "plt.xlabel(\"Epoch\")\n", + "plt.ylabel(\"Loss\")\n", + "plt.legend()\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "id": "e58715d4", + "metadata": {}, + "source": [ + "## 4. Evaluate and predict\n", + "\n", + "This section calls evaluation and prediction methods for the models trained using the TensorFlow libraries and the Intel Transfer Learning Tool.\n", + "\n", + "### Evaluate the models using the validation data\n", + "\n", + "First, evaluate the models trained using the TensorFlow libraries." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9ba3aadb", + "metadata": {}, + "outputs": [], + "source": [ + "tf_eval_callback_list = []\n", + "tf_eval_metrics_list = []\n", + "\n", + "# Evaluate using the TensorFlow framework model for each batch size\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " print('-' * 40)\n", + " print('Evaluate using batch size: {}'.format(batch_size))\n", + " print('-' * 40)\n", + " \n", + " tf_eval_callback = TimerCallback()\n", + " \n", + " # Use the validation split of the dataset to evaluate the model\n", + " tf_eval_metrics_list.append(tf_model_list[i].evaluate(tf_dataset_list[i][1], callbacks=tf_eval_callback))\n", + " tf_eval_callback_list.append(tf_eval_callback)" + ] + }, + { + "cell_type": "markdown", + "id": "de6dbc91", + "metadata": {}, + "source": [ + "Next, evaluate the models trained using the Intel Transfer Learning Tool." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0ed9e1a0", + "metadata": {}, + "outputs": [], + "source": [ + "tlt_eval_callback_list = []\n", + "tlt_eval_metrics_list = []\n", + "\n", + "# Evaluate using the Intel Transfer Learning Tool model for each batch size\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " print('-' * 40)\n", + " print('Evaluate using batch size: {}'.format(batch_size))\n", + " print('-' * 40)\n", + " \n", + " use_test_set = tlt_dataset_list[i].validation_subset is None and tlt_dataset_list[i].test_subset is not None\n", + " \n", + " tlt_eval_callback = TimerCallback()\n", + " tlt_eval_metrics_list.append(tlt_model_list[i].evaluate(tlt_dataset_list[i], callbacks=tlt_eval_callback, use_test_set=use_test_set))\n", + " tlt_eval_callback_list.append(tlt_eval_callback)" + ] + }, + { + "cell_type": "markdown", + "id": "231f3731", + "metadata": {}, + "source": [ + "After all the models have been evaluated, visualize the results using charts that display the time it took to evaluate each model and the accuracy that was found when using the validation dataset.\n",
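+ "\n",
+ "Keras `evaluate()` returns metric values in the order given by `model.metrics_names`, which is how the next cell pulls accuracy out by position. A toy illustration with hypothetical values:\n",
+ "\n",
+ "```python\n",
+ "metrics_names = ['loss', 'acc']             # order reported by the model\n",
+ "results = [0.41, 0.89]                      # hypothetical evaluate() output\n",
+ "acc = results[metrics_names.index('acc')]   # -> 0.89\n",
+ "```"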
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "3c31fee1", + "metadata": {}, + "outputs": [], + "source": [ + "# Bar chart group labels\n", + "groups = [\"batch size = {}\".format(bs) for bs in batch_size_list]\n", + "\n", + "# Create grouped bar chart for evaluation time\n", + "decimals = 3 # number of decimals to use for rounding\n", + "tf_eval_times = [round(callback.eval_times[0], decimals) for callback in tf_eval_callback_list]\n", + "tlt_eval_times = [round(callback.eval_times[0], decimals) for callback in tlt_eval_callback_list]\n", + "\n", + "x = np.arange(len(groups))\n", + "width = 0.24 # the width of the bars\n", + "multiplier = 0\n", + "\n", + "# Setup bars for evaluation times\n", + "fig, (ax1, ax2) = plt.subplots(2)\n", + "fig.set_figheight(10)\n", + "fig.set_figwidth(10)\n", + "rects_tf = ax1.bar(x - width/2, tf_eval_times, width, label='TF eval', color=orange)\n", + "rects_tlt = ax1.bar(x + width/2, tlt_eval_times, width, label='TLT eval', color=blue)\n", + "ax1.bar_label(rects_tf, padding=3)\n", + "ax1.bar_label(rects_tlt, padding=3)\n", + "\n", + "# Add labels, title, and legend\n", + "ax1.set_ylabel('Seconds')\n", + "ax1.set_title('Evaluation time')\n", + "ax1.set_xticks(x, groups)\n", + "ax1.set_ymargin(0.2) \n", + "ax1.legend(ncols=2)\n", + "\n", + "# Evaluation accuracy comparison\n", + "decimals = 2\n", + "tf_acc_index = tf_model_list[0].metrics_names.index('acc')\n", + "tlt_acc_index = tlt_model_list[0]._model.metrics_names.index('acc')\n", + "tf_eval_accuracy = [round(x[tf_acc_index] * 100, decimals) for x in tf_eval_metrics_list]\n", + "tlt_eval_accuracy = [round(x[tlt_acc_index] * 100, decimals) for x in tlt_eval_metrics_list]\n", + "\n", + "# Setup bars for evaluation accuracy\n", + "rects_tf = ax2.bar(x - width/2, tf_eval_accuracy, width, label='TF accuracy', color=orange)\n", + "rects_tlt = ax2.bar(x + width/2, tlt_eval_accuracy, width, label='TLT accuracy', color=blue)\n", + "ax2.bar_label(rects_tf, padding=3)\n", + "ax2.bar_label(rects_tlt, padding=3)\n", + "\n", + "# Add labels, title, and legend\n", + "ax2.set_ylabel('Accuracy (%)')\n", + "ax2.yaxis.set_major_formatter(mtick.PercentFormatter())\n", + "ax2.set_title('Evaluation accuracy using the validation data')\n", + "ax2.set_xticks(x, groups)\n", + "ax2.set_ymargin(0.2) \n", + "ax2.legend(ncols=2)\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "id": "4d759b5d", + "metadata": {}, + "source": [ + "### Predict using a batch of images\n", + "\n", + "Use the TensorFlow libraries to get a batch of images and predict using the trained models." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "38132396", + "metadata": {}, + "outputs": [], + "source": [ + "tf_predict_callback_list = []\n", + "\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " print('-' * 50)\n", + " print('Predict on a single batch (batch size = {})'.format(batch_size))\n", + " print('-' * 50)\n", + " \n", + " tf_predict_time = TimerCallback()\n", + " dataset_batch = next(iter(tf_dataset_list[i][0]))\n", + " tf_batch, _ = dataset_batch\n", + " batch_predictions = tf_model_list[i].predict(tf_batch, callbacks=tf_predict_time)\n", + " tf_predict_callback_list.append(tf_predict_time)" + ] + }, + { + "cell_type": "markdown", + "id": "0d3beb10", + "metadata": {}, + "source": [ + "Similarly, use the Intel Transfer Learning Tool API to get a batch of images and predict using the trained models."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "66be9e10", + "metadata": {}, + "outputs": [], + "source": [ + "tlt_predict_callback_list = []\n", + "\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " print('-' * 50)\n", + " print('Predict on a single batch (batch size = {})'.format(batch_size))\n", + " print('-' * 50)\n", + " \n", + " tlt_predict_time = TimerCallback()\n", + "\n", + " tlt_batch, _ = tlt_dataset_list[i].get_batch(subset='train')\n", + " predictions = tlt_model_list[i].predict(tlt_batch, callbacks=tlt_predict_time)\n", + " tlt_predict_callback_list.append(tlt_predict_time)" + ] + }, + { + "cell_type": "markdown", + "id": "a594631f", + "metadata": {}, + "source": [ + "Visualize the time that it took to get predictions for a batch of images for each model." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "309f636a", + "metadata": {}, + "outputs": [], + "source": [ + "# Create grouped bar chart for prediction time\n", + "decimals = 3 # number of decimals to use for rounding\n", + "tf_predict_times = [round(callback.predict_times[0], decimals) for callback in tf_predict_callback_list]\n", + "tlt_predict_times = [round(callback.predict_times[0], decimals) for callback in tlt_predict_callback_list]\n", + "\n", + "# Setup bars for prediction times\n", + "fig, ax = plt.subplots()\n", + "fig.set_figheight(6)\n", + "fig.set_figwidth(10)\n", + "rects_tf = ax.bar(x - width/2, tf_predict_times, width, label='TF predict', color=orange)\n", + "rects_tlt = ax.bar(x + width/2, tlt_predict_times, width, label='TLT predict', color=blue)\n", + "ax.bar_label(rects_tf, padding=3)\n", + "ax.bar_label(rects_tlt, padding=3)\n", + "\n", + "# Add labels, title, and legend\n", + "ax.set_ylabel('Seconds')\n", + "ax.set_title('Prediction time for a single batch')\n", + "ax.set_xticks(x, groups)\n", + "ax.set_ymargin(0.2) \n", + "ax.legend(ncols=2)\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "id": "ca0771ec", + "metadata": {}, + "source": [ + "### Check performance using the Intel® Neural Compressor\n", + "\n", + "Use the [Intel Neural Compressor](https://github.com/intel/neural-compressor/tree/master) to determine the performance of the exported models.\n", + "\n", + "We will compare:\n", + "* The original model that was trained using the TensorFlow and TF Hub libraries\n", + "* The model trained using the Intel Transfer Learning Tool\n", + "* The model trained and quantized using the Intel Transfer Learning Tool\n", + "* The model trained and optimized using the Intel Transfer Learning Tool" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "41b6baee", + "metadata": {}, + "outputs": [], + "source": [ + "test_dataset_dir = dataset_subdir\n", + "\n", + "if os.path.exists(os.path.join(dataset_subdir, 'validation')):\n", + " test_dataset_dir = os.path.join(dataset_subdir, 'validation')\n", + "elif os.path.exists(os.path.join(dataset_subdir, 'test')):\n", + " test_dataset_dir = os.path.join(dataset_subdir, 'test')\n", + " \n", + "print(\"Test dataset directory:\", test_dataset_dir)" + ] + }, + { + "cell_type": "markdown", + "id": "e89ccbfb", + "metadata": {}, + "source": [ + "Use the Intel Neural Compressor to get the performance of the model trained using the TensorFlow libraries.\n", + "\n", + "Note that you may see a `zmq.error.ZMQError: Address already in use` error in the output, which is a known issue when running the Intel Neural Compressor from Jupyter notebooks. If this happens, rerun the cell.\n",
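+ "\n",
+ "For reference, latency and throughput are two views of the same timing data. The exact numbers come from the notebook's `inc_utils` helpers, but the relationship is roughly (toy values):\n",
+ "\n",
+ "```python\n",
+ "batch_size = 32\n",
+ "seconds_per_batch = 0.040                     # hypothetical measured time per batch\n",
+ "latency_ms = seconds_per_batch * 1000         # 40 ms to process one batch\n",
+ "throughput = batch_size / seconds_per_batch   # 800 images/sec\n",
+ "```"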
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "80be966e", + "metadata": { + "scrolled": true + }, + "outputs": [], + "source": [ + "tf_latency_list = []\n", + "tf_throughput_list = []\n", + "\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " print('-' * 90)\n", + " print('Check performance for TF model (batch size = {})'.format(batch_size))\n", + " print('Saved model directory: {}'.format(tf_export_dir_list[i]))\n", + " print('-' * 90)\n", + " \n", + " results = inc_utils.performance(tf_export_dir_list[i], batch_size, image_size, test_dataset_dir, framework)\n", + " tf_latency, tf_throughput = inc_utils.calculate_latency_and_throughput(results)\n", + " \n", + " tf_latency_list.append(tf_latency)\n", + " tf_throughput_list.append(tf_throughput)" + ] + }, + { + "cell_type": "markdown", + "id": "7ee14994", + "metadata": {}, + "source": [ + "Next, get the performance of the model that was trained and exported by the Intel Transfer Learning Tool." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bb33d150", + "metadata": {}, + "outputs": [], + "source": [ + "tlt_latency_list = []\n", + "tlt_throughput_list = []\n", + "\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " print('-' * 90)\n", + " print('Check performance for TLT model (batch size = {})'.format(batch_size))\n", + " print('Saved model directory: {}'.format(tlt_export_dir_list[i]))\n", + " print('-' * 90)\n", + " \n", + " tlt_results = inc_utils.performance(tlt_export_dir_list[i], batch_size, image_size, test_dataset_dir, framework)\n", + " tlt_latency, tlt_throughput = inc_utils.calculate_latency_and_throughput(tlt_results)\n", + " \n", + " tlt_latency_list.append(tlt_latency)\n", + " tlt_throughput_list.append(tlt_throughput)" + ] + }, + { + "cell_type": "markdown", + "id": "4aaf38ec", + "metadata": {}, + "source": [ + "Get the performance of the model that was quantized using the Intel Transfer Learning Tool with the Intel Neural Compressor." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7322f6a1", + "metadata": {}, + "outputs": [], + "source": [ + "quantized_latency_list = []\n", + "quantized_throughput_list = []\n", + "\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " try:\n", + " tlt_quantized_latency = 0\n", + " tlt_quantized_throughput = 0\n", + " \n", + " print('-' * 90)\n", + " print('Check performance for TLT quantized model (batch size = {})'.format(batch_size))\n", + " print('Saved model directory: {}'.format(tlt_quantization_dir_list[i]))\n", + " print('-' * 90)\n", + " \n", + " if not os.path.exists(os.path.join(tlt_quantization_dir_list[i], 'saved_model.pb')):\n", + " raise FileNotFoundError(\"The quantized model was not found at: {}\\nQuantization may have failed for this model/batch size.\".format(tlt_quantization_dir_list[i]))\n", + " \n", + " tlt_quantized_results = inc_utils.performance(tlt_quantization_dir_list[i], batch_size, image_size, test_dataset_dir, framework)\n", + " tlt_quantized_latency, tlt_quantized_throughput = inc_utils.calculate_latency_and_throughput(tlt_quantized_results)\n", + " except Exception as e:\n", + " print(\"Error when trying to check the performance for the quantized model with batch size {}\".format(batch_size))\n", + " print(e)\n", + " finally:\n", + " quantized_latency_list.append(tlt_quantized_latency)\n", + " quantized_throughput_list.append(tlt_quantized_throughput)" + ] + }, + { + "cell_type": "markdown", + "id": "e262895d", + "metadata": {}, + "source": [ + "Finally, get the performance of the model that was optimized using the Intel Transfer Learning Tool with the Intel Neural Compressor." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "8c42c815", + "metadata": { + "scrolled": true + }, + "outputs": [], + "source": [ + "optimized_latency_list = []\n", + "optimized_throughput_list = []\n", + "\n", + "for i, batch_size in enumerate(batch_size_list):\n", + " try:\n", + " tlt_optimized_latency = 0\n", + " tlt_optimized_throughput = 0\n", + " \n", + " print('-' * 90)\n", + " print('Check performance for TLT optimized model (batch size = {})'.format(batch_size))\n", + " print('Saved model directory: {}'.format(tlt_optimized_dir_list[i]))\n", + " print('-' * 90)\n", + " \n", + " if not os.path.exists(os.path.join(tlt_optimized_dir_list[i], 'saved_model.pb')):\n", + " raise FileNotFoundError(\"The optimized model was not found at: {}\\nOptimization may have failed for this model/batch size.\".format(tlt_optimized_dir_list[i]))\n", + "\n", + " tlt_optimized_results = inc_utils.performance(tlt_optimized_dir_list[i], batch_size, image_size, test_dataset_dir, framework)\n", + " \n", + " tlt_optimized_latency, tlt_optimized_throughput = inc_utils.calculate_latency_and_throughput(tlt_optimized_results)\n", + " except Exception as e:\n", + " print(\"Error when trying to check the performance for the optimized model with batch size {}\".format(batch_size))\n", + " print(e)\n", + " finally:\n", + " optimized_latency_list.append(tlt_optimized_latency)\n", + " optimized_throughput_list.append(tlt_optimized_throughput)" + ] + }, + { + "cell_type": "markdown", + "id": "44b337ab", + "metadata": {}, + "source": [ + "Visualize the latency and throughput results for all of the models." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0b5ca789", + "metadata": {}, + "outputs": [], + "source": [ + "width = 0.18 # the width of the bars\n", + "\n", + "# Round the latency values\n", + "decimals = 2 # number of decimals to use for rounding\n", + "tf_latency_list = [0 if math.isnan(x) else round(x, decimals) for x in tf_latency_list]\n", + "tlt_latency_list = [0 if math.isnan(x) else round(x, decimals) for x in tlt_latency_list]\n", + "quantized_latency_list = [0 if math.isnan(x) else round(x, decimals) for x in quantized_latency_list]\n", + "optimized_latency_list = [0 if math.isnan(x) else round(x, decimals) for x in optimized_latency_list]\n", + "\n", + "# Setup the grouped bar chart for latency\n", + "fig, ax = plt.subplots()\n", + "fig.set_figheight(6)\n", + "fig.set_figwidth(10)\n", + "rects_tf = ax.bar(x, tf_latency_list, width, label='TF latency', color=orange)\n", + "rects_tlt = ax.bar(x + width, tlt_latency_list, width, label='TLT latency', color=blue)\n", + "rects_quant = ax.bar(x + width * 2, quantized_latency_list, width, label='TLT quantized latency', color=yellow)\n", + "rects_opt = ax.bar(x + width * 3, optimized_latency_list, width, label='TLT optimized latency', color=dark_blue)\n", + "ax.bar_label(rects_tf, padding=3)\n", + "ax.bar_label(rects_tlt, padding=3)\n", + "ax.bar_label(rects_quant, padding=3)\n", + "ax.bar_label(rects_opt, padding=3)\n", + "\n", + "# Add labels, title, and legend\n", + "ax.set_ylabel('Milliseconds')\n", + "ax.set_title('Latency')\n", + "ax.set_xticks(x + width*1.5, groups)\n", + "ax.set_ymargin(0.2) \n", + "ax.legend(ncols=2)\n", + "plt.show()\n", + "\n", + "# Round the throughput values\n", + "decimals = 0 # number of decimals to use for rounding\n", + "tf_throughput_list = [round(x, decimals) for x in tf_throughput_list]\n", + "tlt_throughput_list = [round(x, decimals) for x in tlt_throughput_list]\n", + "quantized_throughput_list = [round(x, decimals) for x in quantized_throughput_list]\n", + "optimized_throughput_list = [round(x, decimals) for x in optimized_throughput_list]\n", + "\n", + "# Setup the grouped bar chart for throughput\n", + "fig, ax = plt.subplots()\n", + "fig.set_figheight(6)\n", + "fig.set_figwidth(10)\n", + "rects_tf = ax.bar(x, tf_throughput_list, width, label='TF throughput', color=orange)\n", + "rects_tlt = ax.bar(x + width, tlt_throughput_list, width, label='TLT throughput', color=blue)\n", + "rects_quant = ax.bar(x + width * 2, quantized_throughput_list, width, label='TLT quantized throughput', color=yellow)\n", + "rects_opt = ax.bar(x + width * 3, optimized_throughput_list, width, label='TLT optimized throughput', color=dark_blue)\n", + "ax.bar_label(rects_tf, padding=3)\n", + "ax.bar_label(rects_tlt, padding=3)\n", + "ax.bar_label(rects_quant, padding=3)\n", + "ax.bar_label(rects_opt, padding=3)\n", + "\n", + "# Add labels, title, and legend\n", + "ax.set_ylabel('images/second')\n", + "ax.set_title('Throughput')\n", + "ax.set_xticks(x + width*1.5, groups)\n", + "ax.set_ymargin(0.2) \n", + "ax.legend(ncols=2)\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "id": "aa9644c8", + "metadata": {}, + "source": [ + "The experiments done in this notebook allowed us to compare the training time and inference/evaluation metrics when using the TensorFlow libraries and the Intel Transfer Learning Tool. We can also see how batch size affects performance. 
More experiments can be done by rerunning this notebook with a different model, different dataset, and/or different training parameters.\n", + "\n", + "Other related notebooks:\n", + "* [Transfer Learning for Image Classification using TensorFlow and the Intel® Transfer Learning Tool API](../image_classification/tlt_api_tf_image_classification/TLT_TF_Image_Classification_Transfer_Learning.ipynb)\n", + "* [Transfer Learning for Image Classification using PyTorch and the Intel® Transfer Learning Tool API](../image_classification/tlt_api_pyt_image_classification/TLT_PyTorch_Image_Classification_Transfer_Learning.ipynb)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.16" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/performance/utils/inc_utils.py b/notebooks/performance/utils/inc_utils.py new file mode 100644 index 0000000000000000000000000000000000000000..e8a78908a597f0060481dbedde73b227dcda9201 --- /dev/null +++ b/notebooks/performance/utils/inc_utils.py @@ -0,0 +1,78 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# +# Copyright (c) 2023 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# + +import numpy as np + + +def performance(saved_model_dir, batch_size, image_size, dataset_dir, framework, warmup=10, iteration=100, + cores_per_instance=None, num_of_instance=None, inter_num_of_threads=None, intra_num_of_threads=None): + """ + Uses the Intel Neural Compressor to get performance metrics for the specified model. + + :param saved_model_dir: Model to load + :param batch_size: Batch size + :param image_size: Image input size + :param dataset_dir: Dataset directory (for a custom image classification dataset) + :param framework: Framework (e.g. 
tensorflow) + :param warmup: Number of warmup iterations before running performance tests + :param iteration: The number of iterations to run for the performance test + :param cores_per_instance: Number of CPU cores to use per instance + :param num_of_instance: Number of instances to use for performance testing + :param inter_num_of_threads: Number of threads to use for inter-thread operations + :param intra_num_of_threads: Number of threads to use for intra-thread operations + :return: benchmark results from the Intel Neural Compressor; results['performance'] holds (accuracy, batch_size, result_list) + """ + + from neural_compressor.benchmark import fit + from neural_compressor.config import BenchmarkConfig + from neural_compressor.utils.create_obj_from_config import create_dataloader + + dataloader_args = { + 'batch_size': batch_size, + 'dataset': {'ImageFolder': {'root': dataset_dir}}, + 'transform': {'PaddedCenterCrop': {'size': image_size, 'crop_padding': 32}, + 'Resize': {'size': image_size, 'interpolation': 'bicubic'}, + 'Rescale': {} + }, + 'filter': None + } + + eval_dataloader = create_dataloader(framework, dataloader_args) + + conf = BenchmarkConfig(warmup=warmup, iteration=iteration) + try: + return fit(model=saved_model_dir, config=conf, b_dataloader=eval_dataloader) + except Exception: + # Retry a second time due to the known ZMQError when running from Jupyter + print("Retrying benchmarking a second time") + return fit(model=saved_model_dir, config=conf, b_dataloader=eval_dataloader) + + +def calculate_latency_and_throughput(results): + """ + Parses the results from the benchmarking function and returns the latency (ms) and throughput (samples/sec) + + :param results: Return value from calling the performance util function + :return: latency (ms) and throughput (images/sec) + """ + _, batch_size, result_list = results['performance'] + latency = np.array(result_list).mean() / batch_size + latency_ms = latency * 1000 + throughput = 1. / latency + return latency_ms, throughput diff --git a/notebooks/plot_utils.py b/notebooks/plot_utils.py new file mode 100644 index 0000000000000000000000000000000000000000..3d043bde461fe0cf91a6b007af311b401048d211 --- /dev/null +++ b/notebooks/plot_utils.py @@ -0,0 +1,54 @@ +#!/usr/bin/env python +# -*- coding: utf-8 -*- +# +# Copyright (c) 2022 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+# + +import os +import matplotlib.pyplot as plt + + +def plot_curves(history, checkpoint_dir): + """ + Plots accuracy and loss curves from a training history dictionary and saves the figure + + :param history: Dictionary with 'acc', 'val_acc', 'loss', and 'val_loss' lists (e.g. loaded from a pickle file) + :param checkpoint_dir: Directory where the plot image is saved + :return: None + """ + if not history: + raise ValueError("The training history is empty or None") + + acc = history['acc'] + val_acc = history['val_acc'] + loss = history['loss'] + val_loss = history['val_loss'] + plt.figure(figsize=(7, 7)) + plt.subplot(2, 1, 1) + plt.plot(acc, label='Training Accuracy') + plt.plot(val_acc, label='Validation Accuracy') + plt.legend(loc='lower right') + plt.ylabel('Accuracy') + plt.title('Training and Validation Accuracy') + + plt.subplot(2, 1, 2) + plt.plot(loss, label='Training Loss') + plt.plot(val_loss, label='Validation Loss') + plt.legend(loc='upper right') + plt.ylabel('Cross Entropy') + plt.title('Training and Validation Loss') + plt.xlabel('epoch') + if not os.path.exists(os.path.join(checkpoint_dir, 'train_val_plot.png')): + print("Saving plot in checkpoint_dir:", checkpoint_dir) + plt.savefig(os.path.join(checkpoint_dir, 'train_val_plot.png')) diff --git a/notebooks/question_answering/tfhub_question_answering/BERT_Question_Answering.ipynb b/notebooks/question_answering/tfhub_question_answering/BERT_Question_Answering.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..a5b4d777d99122486d91db2170f243e463a44533 --- /dev/null +++ b/notebooks/question_answering/tfhub_question_answering/BERT_Question_Answering.ipynb @@ -0,0 +1,417 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# BERT fine tuning for Question-Answering\n", + "\n", + "This notebook demonstrates fine tuning BERT models from TF Hub using the [SQuAD dataset](https://rajpurkar.github.io/SQuAD-explorer/). Scripts from the [TensorFlow Model Garden](https://github.com/tensorflow/models) are used for preprocessing the training dataset and fine tuning.\n", + "\n", + "The notebook performs the following steps:\n", + "1. [Import dependencies and setup parameters](#1.-Import-dependencies-and-setup-parameters)\n", + "2. [Prepare the dataset](#2.-Prepare-the-dataset)\n", + "3. [Fine tuning and evaluation](#3.-Fine-tuning-and-evaluation)\n", + "4. [Export the saved model](#4.-Export-the-saved-model)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions in the [README.md](/notebooks/README.md) to set up a TensorFlow environment with all the dependencies required to run the notebook.\n", + "\n", + "It will run one of the supported [BERT models from TF Hub](https://tfhub.dev/google/collections/bert/1). The table below has a list of the available models and links to their URLs in TF Hub." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import json\n", + "import os\n", + "import pandas as pd\n", + "import tensorflow as tf\n", + "\n", + "from bert_utils import get_model_map\n", + "from tlt.utils.file_utils import download_file\n", + "\n", + "tfhub_model_map, models_df = get_model_map(\"tfhub_bert_model_map_qa.json\", return_data_frame=True)\n", + "models_df.style.hide(axis=\"index\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Specify the name of the BERT model to use. 
This string must match one of the models listed in the table above." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "model_name = \"bert_en_wwm_uncased_L-24_H-1024_A-16\"\n", + "if model_name not in tfhub_model_map.keys():\n", + " raise ValueError(\"The specified model name ({}) is not supported\".format(model_name))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Define a directory to download the dataset\n", + "dataset_directory = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + "\n", + "# Define an output directory for the saved model to be exported\n", + "output_directory = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + " \n", + "# Directory for downloading the BERT config and vocab file\n", + "bert_dir = os.path.join(output_directory, model_name)\n", + "\n", + "# Output directory for logs and checkpoints generated during training\n", + "if not os.path.isdir(output_directory):\n", + " os.makedirs(output_directory)\n", + "\n", + "# Directory to download the bert checkpoint zip to get the vocab.txt and bert_config.json\n", + "if not os.path.isdir(bert_dir):\n", + " os.makedirs(bert_dir)\n", + " \n", + "# Get the BERT TF Hub URL from the model map\n", + "tfhub_bert_encoder = tfhub_model_map[model_name][\"bert_encoder\"]\n", + "checkpoint_url = tfhub_model_map[model_name][\"checkpoint_zip\"]\n", + "\n", + "print(\"Using TF Hub model:\", model_name)\n", + "print(\"BERT encoder URL:\", tfhub_bert_encoder)\n", + "print(\"Dataset directory:\", dataset_directory)\n", + "print(\"Output directory:\", output_directory)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Path where the https://github.com/tensorflow/models repo will be cloned\n", + "tf_models_dir = os.path.join(output_directory, \"tensorflow-models\")\n", + "os.environ[\"TF_MODELS_DIR\"] = tf_models_dir\n", + "tf_models_branch = \"v2.12.0\"\n", + "\n", + "# Clone the TensorFlow models repo\n", + "if not os.path.exists(tf_models_dir):\n", + " !git clone --depth=1 --branch=$tf_models_branch https://github.com/tensorflow/models.git $tf_models_dir\n", + "\n", + "# Add the TensorFlow models repo to the PYTHONPATH\n", + "os.environ[\"PYTHONPATH\"] = \"{}:{}\".format(os.getenv(\"PYTHONPATH\", \"\"), tf_models_dir)\n", + "\n", + "from bert_qa_utils import create_mini_dataset_file, \\\n", + " display_predictions, \\\n", + " get_config_and_vocab_from_zip, \\\n", + " predict_squad_customized\n", + "\n", + "# Extract the vocab.txt and bert_config.json from the checkpoint zip file\n", + "vocab_txt, bert_config = get_config_and_vocab_from_zip(checkpoint_url, bert_dir)\n", + "\n", + "if not os.path.exists(vocab_txt):\n", + " raise ValueError(\"The vocab file could not be found at: {}\".format(vocab_txt))\n", + "\n", + "if not os.path.exists(bert_config):\n", + " raise ValueError(\"The bert config could not be found at: {}\".format(bert_config))\n", + "\n", + "print(\"Vocab file:\", vocab_txt)\n", + "print(\"BERT config:\", bert_config)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 2. 
Prepare the dataset\n", + "\n", + "Download the SQuAD dataset, create smaller json files with a subset of the dev and train datasets, and then create TF records for the mini training dataset. The SQuAD dataset has json files for a train and dev datasets. The json files are formatted like:\n", + "\n", + "```\n", + "{\n", + " \"data\": [\n", + " {\n", + " \"title\": \"...\",\n", + " \"paragraphs\": [\n", + " {\n", + " \"qas\": [\n", + " {\n", + " \"question\": \"...\",\n", + " \"id\": \"\",\n", + " \"answers\": [\n", + " {\n", + " \"text\": \"...\",\n", + " \"answer_start\": \n", + " },\n", + " {\n", + " \"text\": \"...\",\n", + " \"answer_start\": \n", + " },\n", + " {\n", + " \"text\": \"...\",\n", + " \"answer_start\": \n", + " }\n", + " ],\n", + " \"is_impossible\": \n", + " },\n", + " ...\n", + " ],\n", + " \"context\": \".....\"\n", + " },\n", + " ...\n", + " ]\n", + " }\n", + " ],\n", + " \"version\": \"v2.0\"\n", + "}\n", + "```\n", + "\n", + "Each item in the data list has a title, a list of paragraphs that with questions/answers and a context string. The answer to each question is a segment of text from the context paragraph (unless the question is impossible).\n", + "\n", + "For this example, we will be using a subset of the dev and train dataset in order to speed up the execution time. The size of the datasets can be increased (or the full dataset can be used) to try to improve accuracy." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Specify to use SQuAD v1.1 or v2.0\n", + "squad_version = \"v1.1\"\n", + "\n", + "# Maximum sequence length\n", + "max_seq_length = 384\n", + "\n", + "# Specify the number of dataset items to grab from the dev and train datasets.\n", + "# More dataset items can increase accuracy, but will also increase the training/evaluation time.\n", + "num_dev_dataset_items = 2\n", + "num_train_dataset_items = 12\n", + "\n", + "# Flag to overwrite previously generated mini dataset .json files and the TF records file\n", + "overwrite = False\n", + "\n", + "# Dataset download directory\n", + "squad_dir = os.path.join(dataset_directory, \"squad\")\n", + "\n", + "squad_dev_dataset = os.path.join(squad_dir, \"dev-{}.json\".format(squad_version))\n", + "squad_train_dataset = os.path.join(squad_dir, \"train-{}.json\".format(squad_version))\n", + "version_2_with_negative = squad_version == \"v2.0\"\n", + "\n", + "# Create a directory for the SQuAD files, if the folder does not exist\n", + "if not os.path.isdir(squad_dir):\n", + " os.makedirs(squad_dir)\n", + "\n", + "# Download the SQuAD dev dataset file, if it doesn't exist\n", + "if not os.path.exists(squad_dev_dataset):\n", + " squad_dev_url = \"https://rajpurkar.github.io/SQuAD-explorer/dataset/dev-{}.json\".format(squad_version)\n", + " download_file(squad_dev_url, squad_dir)\n", + "\n", + "# Download the SQuAD train dataset file, if it doesn't exist\n", + "if not os.path.exists(squad_train_dataset):\n", + " squad_train_url = \"https://rajpurkar.github.io/SQuAD-explorer/dataset/train-{}.json\".format(squad_version)\n", + " download_file(squad_train_url, squad_dir)\n", + " \n", + "# Create a smaller version of the dev dataset\n", + "squad_mini_file = \"mini-dev-{}.json\".format(squad_version)\n", + "mini_dataset_path = os.path.join(squad_dir, squad_mini_file)\n", + "create_mini_dataset_file(squad_dev_dataset, mini_dataset_path, num_dev_dataset_items, overwrite=overwrite)\n", + "\n", + "# Create a smaller version of the train dataset\n", + 
"squad_mini_train_file = \"mini-train-{}.json\".format(squad_version)\n", + "mini_train_dataset_path = os.path.join(squad_dir, squad_mini_train_file)\n", + "create_mini_dataset_file(squad_train_dataset, mini_train_dataset_path, num_train_dataset_items, overwrite=overwrite)\n", + "\n", + "# Create TF Records for the mini training dataset\n", + "train_mini_tfrecords_path = os.path.join(squad_dir, \"squad_mini_{}_train.tf_record\".format(squad_version))\n", + "squad_metadata_path = os.path.join(squad_dir, \"squad_{}_meta_data\".format(squad_version))\n", + "\n", + "# Preprocess the dataset, if we don't already have the files\n", + "if not os.path.exists(train_mini_tfrecords_path) or not os.path.exists(squad_metadata_path) or overwrite:\n", + " !python $tf_models_dir/official/nlp/data/create_finetuning_data.py \\\n", + " --squad_data_file=$mini_train_dataset_path \\\n", + " --vocab_file=$vocab_txt \\\n", + " --version_2_with_negative=$version_2_with_negative \\\n", + " --train_data_output_path=$train_mini_tfrecords_path \\\n", + " --meta_data_file_path=$squad_metadata_path \\\n", + " --fine_tuning_task_type=squad \\\n", + " --max_seq_length=$max_seq_length\n", + " \n", + " if os.path.exists(train_mini_tfrecords_path):\n", + " print(\"Preprocessed dataset: \", train_mini_tfrecords_path)\n", + "else:\n", + " print(\"The preprocessed training dataset was found at:\", train_mini_tfrecords_path)\n", + " print(\"The SQuAD metadata file was found at:\", squad_metadata_path)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 3. Fine tuning and evaluation\n", + "\n", + "Train the model using the `run_squad.py` script from the [TensorFlow Model Garden](https://github.com/tensorflow/models/blob/v2.7.0/official/nlp/bert/run_squad.py) with the mode set to `train_and_eval`. The [TF Hub](https://tfhub.dev) model URL is being passed as the `hub_module_url`." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "%%time\n", + "\n", + "# Learning rate\n", + "learning_rate = 8e-5\n", + "\n", + "# Number of training epochs\n", + "num_train_epochs=1\n", + "\n", + "# Batch sizes\n", + "train_batch_size = 4\n", + "predict_batch_size = 4\n", + "\n", + "# Directory for checkpoints\n", + "checkpoint_dir = os.path.join(output_directory, \"{}_checkpoints\".format(model_name))\n", + "\n", + "if os.path.exists(checkpoint_dir):\n", + " if len(os.listdir(checkpoint_dir)) > 0:\n", + " print(\"WARNING: The model checkpoint directory is not empty and fine tuning may pick up \" \n", + " \"previously generated checkpoint files.\\n\")\n", + "else:\n", + " os.makedirs(checkpoint_dir)\n", + "\n", + "os.environ[\"TFHUB_CACHE_DIR\"] = os.path.join(output_directory, \"tfhub_modules\")\n", + "!python $tf_models_dir/official/legacy/bert/run_squad.py \\\n", + " --mode=train_and_eval \\\n", + " --input_meta_data_path=$squad_metadata_path \\\n", + " --train_data_path=$train_mini_tfrecords_path \\\n", + " --predict_file=$mini_dataset_path \\\n", + " --vocab_file=$vocab_txt \\\n", + " --bert_config_file=$bert_config \\\n", + " --hub_module_url=$tfhub_bert_encoder \\\n", + " --train_batch_size=$train_batch_size \\\n", + " --predict_batch_size=$predict_batch_size \\\n", + " --learning_rate=$learning_rate \\\n", + " --num_train_epochs=$num_train_epochs \\\n", + " --model_dir=$checkpoint_dir \\\n", + " --distribution_strategy=one_device" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "display_predictions(mini_dataset_path, os.path.join(checkpoint_dir, \"predictions.json\"), n=25)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 4. Export the saved model\n", + "\n", + "Using the TensorFlow Model Garden API, export the saved model using the checkpoint files that were generated during fine tuning." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import tensorflow as tf\n", + "from official.legacy.bert import bert_models\n", + "from official.legacy.bert import configs as bert_configs\n", + "from official.legacy.bert import model_saving_utils\n", + "\n", + "tf.keras.mixed_precision.set_global_policy('float32')\n", + "bert_config_obj = bert_configs.BertConfig.from_json_file(bert_config)\n", + "squad_model, _ = bert_models.squad_model(bert_config_obj,\n", + " max_seq_length,\n", + " hub_module_url=tfhub_bert_encoder)\n", + "\n", + "saved_model_dir = os.path.join(output_directory, \"{}_saved_model\".format(model_name))\n", + "\n", + "if not os.path.exists(saved_model_dir):\n", + " os.makedirs(saved_model_dir)\n", + "\n", + "model_saving_utils.export_bert_model(saved_model_dir, model=squad_model, checkpoint_dir=checkpoint_dir)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Citations\n", + "\n", + "```\n", + "@misc{tensorflowmodelgarden2020,\n", + " author = {Hongkun Yu and Chen Chen and Xianzhi Du and Yeqing Li and\n", + " Abdullah Rashwan and Le Hou and Pengchong Jin and Fan Yang and\n", + " Frederick Liu and Jaeyoun Kim and Jing Li},\n", + " title = {{TensorFlow Model Garden}},\n", + " howpublished = {\\url{https://github.com/tensorflow/models}},\n", + " year = {2020}\n", + "}\n", + "\n", + "@article{2016arXiv160605250R,\n", + " author = { {Rajpurkar}, Pranav and {Zhang}, Jian and {Lopyrev},\n", + " Konstantin and {Liang}, Percy},\n", + " title = \"{SQuAD: 100,000+ Questions for Machine Comprehension of Text}\",\n", + " journal = {arXiv e-prints},\n", + " year = 2016,\n", + " eid = {arXiv:1606.05250},\n", + " pages = {arXiv:1606.05250},\n", + "archivePrefix = {arXiv},\n", + " eprint = {1606.05250},\n", + "}\n", + "```" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.5" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/notebooks/question_answering/tfhub_question_answering/README.md b/notebooks/question_answering/tfhub_question_answering/README.md new file mode 100644 index 0000000000000000000000000000000000000000..41b15db625d8af39b446d4f21c8373707abac15c --- /dev/null +++ b/notebooks/question_answering/tfhub_question_answering/README.md @@ -0,0 +1,43 @@ +# Question Answering fine tuning using TensorFlow + +This notebook demonstrates fine tuning various [BERT](https://arxiv.org/abs/1810.04805) models +from [TF Hub](https://tfhub.dev) with Intel® Optimization for TensorFlow, using the SQuAD dataset. + +The notebook performs the following steps: +1. Import dependencies and setup parameters +1. Prepare the dataset +1. Fine tuning and evaluation +1. Export the saved model + +## Running the notebooks + +To run the notebook, follow the instructions to set up the [TensorFlow notebook environment](/notebooks/setup.md). 
+ +## References + +Dataset citations: +``` +@article{2016arXiv160605250R, + author = { {Rajpurkar}, Pranav and {Zhang}, Jian and {Lopyrev}, + Konstantin and {Liang}, Percy}, + title = "{SQuAD: 100,000+ Questions for Machine Comprehension of Text}", + journal = {arXiv e-prints}, + year = 2016, + eid = {arXiv:1606.05250}, + pages = {arXiv:1606.05250}, +archivePrefix = {arXiv}, + eprint = {1606.05250}, +} +``` + +TensorFlow Model Garden citation: +``` +@misc{tensorflowmodelgarden2020, + author = {Hongkun Yu and Chen Chen and Xianzhi Du and Yeqing Li and + Abdullah Rashwan and Le Hou and Pengchong Jin and Fan Yang and + Frederick Liu and Jaeyoun Kim and Jing Li}, + title = {{TensorFlow Model Garden}}, + howpublished = {\url{https://github.com/tensorflow/models}}, + year = {2020} +} +``` diff --git a/notebooks/question_answering/tfhub_question_answering/bert_qa_utils.py b/notebooks/question_answering/tfhub_question_answering/bert_qa_utils.py new file mode 100644 index 0000000000000000000000000000000000000000..ad3b9a664191655bbca4d5ae6eeacac7270fd5cb --- /dev/null +++ b/notebooks/question_answering/tfhub_question_answering/bert_qa_utils.py @@ -0,0 +1,208 @@ +# +# -*- coding: utf-8 -*- +# +# Copyright (c) 2022 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# + +import glob +import json +import os +import pandas as pd +import sys +import tensorflow as tf + +sys.path.append(os.environ["TF_MODELS_DIR"]) + +from official.common import distribute_utils +from official.legacy.bert.run_squad_helper import get_dataset_fn, get_raw_results  # get_raw_results is used by predict_squad_customized below +from tlt.utils.file_utils import download_file +from zipfile import ZipFile + +def create_mini_dataset_file(original_file, output_file, num_dataset_items, overwrite=False): + """ + Creates a mini version of the specified json file. The original_file is expected to be in a format + similar to the SQuAD dataset. The number of dataset items represents the number of child elements + under the "data" tag that will be grabbed for the mini dataset. Dataset items will be randomly + selected from the original dataset. Each child element may contain several sets of articles with + questions/answers. The overwrite flag specifies whether or not to overwrite a mini dataset file + that already exists. If overwrite=False and the mini dataset file already exists, nothing will happen. 
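+ + Example (hypothetical paths; creates a 2-article subset of the SQuAD dev set): + create_mini_dataset_file("/tmp/data/squad/dev-v1.1.json", + "/tmp/data/squad/mini-dev-v1.1.json", num_dataset_items=2) 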
+ """ + if not os.path.exists(output_file) or overwrite: + import random + + with open(original_file) as f: + original_data = json.load(f) + + total_len = len(original_data["data"]) + + if num_dataset_items > total_len: + raise ValueError("The number of dataset items ({}) cannot be more than the total " + "dataset length ({}).".format(num_dataset_items, total_len)) + + item_indicies = random.sample(range(0, total_len), num_dataset_items) + print("Total dataset length:", total_len) + print("Randomly selected dataset indices:", item_indicies) + + articles = [] + + for data_index in item_indicies: + article = {} + article["paragraphs"] = original_data["data"][data_index]["paragraphs"] + article["title"] = original_data["data"][data_index]["title"] + + for p in article["paragraphs"]: + for qas in p["qas"]: + qas["id"] = str(qas["id"]) + + articles.append(article) + + # Add the article to a dictionary for the mini dataset + mini_data = {} + mini_data["data"] = articles + + # Add on a version + mini_data["version"] = original_data["version"] if "version" in original_data.keys() else "1.0" + + with open(output_file, "w") as f: + f.write(json.dumps(mini_data, indent=4)) + + if os.path.exists(output_file): + print("Wrote dataset file with {} articles to: {}".format(num_dataset_items, output_file)) + else: + print("Found existing dataset file:", output_file) + + +def display_predictions(predict_data_path, results_file_path, n=10): + """ Displays n number of predictions along with the actual value """ + + def get_data_list(): + count = 0 + data_list = [] + with open(predict_data_path, "r") as actual_data_file: + actual_data = json.load(actual_data_file)["data"] + with open(results_file_path, "r") as results_file: + results = json.load(results_file) + for actual_item in actual_data: + for actual_paragraph in actual_item["paragraphs"]: + for actual_qas in actual_paragraph["qas"]: + if "is_impossible" in actual_qas.keys() and actual_qas["is_impossible"]: + actual_answer = "is_impossible" + elif len(actual_qas["answers"]) >= 1: + answers_text = [x["text"] for x in actual_qas["answers"]] + actual_answer = "
".join(set(answers_text)) + else: + actual_answer = "Unknown" + question = actual_qas["question"] + prediction = results[actual_qas["id"]] + data_list.append([question, prediction, actual_answer]) + count += 1 + if count > n: + return data_list + + predict_df = pd.DataFrame(get_data_list(), + columns=["Question", + "Predicted Answer", + "Actual Answer(s)"]) + return predict_df.style.hide(axis="index") + + +def get_config_and_vocab_from_zip(zip_url, bert_dir): + """ + We are loading the trained BERT model from TF Hub, however the run_squad.py scripts still + require us to pass in a vocab.txt and bert config file. We can get these from the checkpoint + .zip files. The directory structure of the .zip files for each BERT model is not + consistent, so there's a glob search being done to locate the actual vocab.txt and + bert_config.json file after they're extracted from the zip (sometimes they are in + subdirectories). + :param zip_url: URL where the checkpoint zip can be downloaded + :param bert_dir: BERT directory where the vocab.txt and bert_config.json should be copied + :return: Paths to the vocab.txt and bert_config.json + """ + vocab_txt = os.path.join(bert_dir, "vocab.txt") + bert_config = os.path.join(bert_dir, "bert_config.json") + + if not os.path.exists(vocab_txt) or not os.path.exists(bert_config): + downloaded_file = download_file(zip_url, bert_dir) + with ZipFile(downloaded_file, "r") as checkpoint_zip: + def get_file_from_zip(file_path): + file_basename = os.path.basename(file_path) + for zipinfo in checkpoint_zip.infolist(): + if file_basename in zipinfo.filename: + checkpoint_zip.extract(member=zipinfo.filename, path=bert_dir) + + if not os.path.exists(file_path): + # the file isn't directly in the bert_dir, so search subfolders and move it + search_path = os.path.join(bert_dir, "**", file_basename) + matches = glob.glob(search_path, recursive=True) + if matches: + os.replace(matches[0], file_path) + break + + if not os.path.exists(vocab_txt): + get_file_from_zip(vocab_txt) + + if not os.path.exists(bert_config): + get_file_from_zip(bert_config) + + os.remove(downloaded_file) + + return vocab_txt, bert_config + + +# This function was taken from the TensorFlow Model Garden repo and adapted +# to be a utility function that has a string for the strategy, directly passes +# in the max_seq_length instead of a metadata object, and removes the need for FLAGS +# being defined (instead just passes in the predict_batch_size as an arg). 
+ +# https://github.com/tensorflow/models/blob/v2.7.0/official/nlp/bert/run_squad_helper.py#L176 +def predict_squad_customized(strategy_str, max_seq_length, predict_batch_size, + predict_tfrecord_path, num_steps, squad_model): + """Make predictions using a Bert-based squad model.""" + + strategy = distribute_utils.get_distribution_strategy(distribution_strategy=strategy_str) + + predict_dataset_fn = get_dataset_fn( + predict_tfrecord_path, + max_seq_length, + predict_batch_size, + is_training=False) + predict_iterator = iter( + strategy.distribute_datasets_from_function(predict_dataset_fn)) + + @tf.function + def predict_step(iterator): + """Predicts on distributed devices.""" + + def _replicated_step(inputs): + """Replicated prediction calculation.""" + x, _ = inputs + unique_ids = x.pop('unique_ids') + start_logits, end_logits = squad_model(x, training=False) + return dict( + unique_ids=unique_ids, + start_logits=start_logits, + end_logits=end_logits) + + outputs = strategy.run(_replicated_step, args=(next(iterator),)) + return tf.nest.map_structure(strategy.experimental_local_results, outputs) + + all_results = [] + for _ in range(num_steps): + predictions = predict_step(predict_iterator) + for result in get_raw_results(predictions): + all_results.append(result) + if len(all_results) % 100 == 0: + print('Made predictions for %d records.' % len(all_results)) + return all_results diff --git a/notebooks/question_answering/tfhub_question_answering/bert_utils.py b/notebooks/question_answering/tfhub_question_answering/bert_utils.py new file mode 100644 index 0000000000000000000000000000000000000000..c9ebf090273dd0839ca5dfa26cf46bfcea05b6e1 --- /dev/null +++ b/notebooks/question_answering/tfhub_question_answering/bert_utils.py @@ -0,0 +1,57 @@ +# +# -*- coding: utf-8 -*- +# +# Copyright (c) 2022 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# + +import json +import os +import pandas as pd + +from zipfile import ZipFile + + +def get_model_map(json_path, return_data_frame=False): + """ + Gets the model map from the specified json path and loads it into a Python dictionary. If the + data frame option is enabled, it will also return the list of models in a pandas data frame + with column headers so that it can be used to display in a notebook. 
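+ + Example (the same call the notebook in this directory uses): + tfhub_model_map, models_df = get_model_map("tfhub_bert_model_map_qa.json", return_data_frame=True) 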
+ """ + with open(json_path) as json_file: + tfhub_model_map = json.load(json_file) + + if return_data_frame: + # Generate list of model names and URL links to TF Hub based on the model map + model_options = [[i, + tfhub_model_map[i]["num_hidden_layers"], + tfhub_model_map[i]["hidden_size"], + tfhub_model_map[i]["num_attention_heads"], + "{0}".format( + tfhub_model_map[i]["bert_encoder"])] + for i in tfhub_model_map.keys()] + + if len(model_options) == 0: + print("Warning: No models were found in the json file:", json_path) + + pd.set_option('display.max_colwidth', None) + models_df = pd.DataFrame(model_options, + columns=["Model", + "Hidden layers", + "Hidden size", + "Attention heads", + "TF Hub BERT encoder URL"]) + return tfhub_model_map, models_df + else: + return tfhub_model_map diff --git a/notebooks/question_answering/tfhub_question_answering/tfhub_bert_model_map_qa.json b/notebooks/question_answering/tfhub_question_answering/tfhub_bert_model_map_qa.json new file mode 100644 index 0000000000000000000000000000000000000000..e8206476426968e555567b018f1656740af76f2a --- /dev/null +++ b/notebooks/question_answering/tfhub_question_answering/tfhub_bert_model_map_qa.json @@ -0,0 +1,26 @@ +{ + "bert_en_wwm_uncased_L-24_H-1024_A-16": { + "preprocess": "https://tfhub.dev/tensorflow/bert_en_uncased_preprocess/3", + "bert_encoder": "https://tfhub.dev/tensorflow/bert_en_wwm_uncased_L-24_H-1024_A-16/2", + "hidden_size": 1024, + "num_hidden_layers": 24, + "num_attention_heads": 16, + "checkpoint_zip": "https://storage.googleapis.com/bert_models/2019_05_30/wwm_uncased_L-24_H-1024_A-16.zip" + }, + "bert_en_uncased_L-12_H-768_A-12": { + "preprocess": "https://tfhub.dev/tensorflow/bert_en_uncased_preprocess/3", + "bert_encoder": "https://tfhub.dev/tensorflow/bert_en_uncased_L-12_H-768_A-12/2", + "hidden_size": 768, + "num_hidden_layers": 12, + "num_attention_heads": 12, + "checkpoint_zip": "https://storage.googleapis.com/bert_models/2018_10_18/uncased_L-12_H-768_A-12.zip" + }, + "bert_en_uncased_L-24_H-1024_A-16": { + "preprocess": "https://tfhub.dev/tensorflow/bert_en_uncased_preprocess/3", + "bert_encoder": "https://tfhub.dev/tensorflow/bert_en_uncased_L-24_H-1024_A-16/2", + "hidden_size": 1024, + "num_hidden_layers": 24, + "num_attention_heads": 16, + "checkpoint_zip": "https://storage.googleapis.com/bert_models/2018_10_18/uncased_L-24_H-1024_A-16.zip" + } +} diff --git a/notebooks/requirements.txt b/notebooks/requirements.txt new file mode 100644 index 0000000000000000000000000000000000000000..5326874445f18eb04bfb2186434cf4db692fdf34 --- /dev/null +++ b/notebooks/requirements.txt @@ -0,0 +1,29 @@ +Pillow~=9.5.0 +PyYAML~=6.0 +charset-normalizer~=3.1.0 +datasets~=2.12.0 +gin-config~=0.5.0 +intel-extension-for-pytorch==1.13.100 +intel-tensorflow==2.12.0 +ipython-genutils~=0.2.0 +ipython~=8.13.2 +ipywidgets~=8.0.6 +jmespath~=1.0.1 +matplotlib-inline~=0.1.6 +matplotlib~=3.7.1 +notebook~=6.5.4 +numpy~=1.23.5 +opencv-python~=4.7.0.72 +pandas~=2.0.1 +psutil~=5.9.5 +pycocotools~=2.0.6 +scikit-learn~=1.2.2 +scipy~=1.10.1 +sentencepiece~=0.1.99 +tensorflow-addons~=0.20.0 +tensorflow-datasets~=4.9.2 +tensorflow-hub~=0.13.0 +torch==1.13.1 +torchvision==0.14.1 +transformers~=4.30.0 +urllib3~=2.0.2 diff --git a/notebooks/setup.md b/notebooks/setup.md new file mode 100644 index 0000000000000000000000000000000000000000..5d6542bd1fe926bc7d23c5f6d0125c8c697576b1 --- /dev/null +++ b/notebooks/setup.md @@ -0,0 +1,45 @@ +# Environment Setup and Running the Notebooks + +Use the instructions below to install the 
dependencies required to run the notebooks. + +Software Requirements: +1. Linux* system (validated on Ubuntu* 20.04/22.04 LTS) +2. Python3 (3.8, 3.9, or 3.10), Pip/Conda and Virtualenv +3. git + +## Set Up Notebook Environment + +1. Install Intel® Transfer Learning Tool using the Developer Installation option in the [Get Started](/GetStarted.md) Guide. + This is required for the Intel Transfer Learning Tool tutorial notebooks, E2E notebooks, and performance comparison. You can + skip this step if you are only running the native framework notebooks. + +2. Activate the virtualenv or conda environment used to install Intel Transfer Learning Tool, + then from inside the activated environment, run these steps: + ``` + pip install --upgrade pip + pip install -r notebooks/requirements.txt + ``` + +3. Set environment variables for the path to the dataset folder and an output directory. + The dataset and output directories can be empty. The notebook will download the dataset to + the dataset directory, if it is empty. Subsequent runs will reuse the dataset. + If the `DATASET_DIR` and `OUTPUT_DIR` variables are not defined, the notebooks will + default to use `~/dataset` and `~/output`. + ``` + export DATASET_DIR= + export OUTPUT_DIR= + + mkdir -p $DATASET_DIR + mkdir -p $OUTPUT_DIR + ``` +4. Navigate to the notebook directory in your clone of the Transfer Learning repo, and then start the + [notebook server](https://jupyter.readthedocs.io/en/latest/running.html#starting-the-notebook-server): + ``` + cd notebooks + jupyter notebook --port 8888 + ``` +5. Copy and paste the URL from the terminal to your browser to view and run the notebooks. + +Once you have the environment and dependencies set up, see the list of available +[notebooks](/notebooks/README.md). diff --git a/notebooks/text_classification/pytorch_text_classification/PyTorch_Text_Classifier_fine_tuning.ipynb b/notebooks/text_classification/pytorch_text_classification/PyTorch_Text_Classifier_fine_tuning.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..1fd3175a3605e870cdd390f5562eda433921165f --- /dev/null +++ b/notebooks/text_classification/pytorch_text_classification/PyTorch_Text_Classifier_fine_tuning.ipynb @@ -0,0 +1,905 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "id": "b65f0c82", + "metadata": {}, + "source": [ + "# Text Classifier fine tuning using IMDb with PyTorch\n", + "\n", + "This notebook demonstrates fine tuning pretrained models from [Hugging Face](https://huggingface.co) using text classification datasets from the [Hugging Face Datasets catalog](https://huggingface.co/datasets) or a custom dataset. The notebook uses [Intel® Extension for PyTorch*](https://github.com/intel/intel-extension-for-pytorch), which extends PyTorch with optimizations for an extra performance boost on Intel hardware.\n", + "\n", + "Please install the dependencies from the [setup.md](../../setup.md) file before executing this notebook.\n", + "\n", + "The notebook performs the following steps:\n", + "1. [Import dependencies and setup parameters](#1.-Import-dependencies-and-setup-parameters)\n", + "2. [Prepare the dataset](#2.-Prepare-the-dataset)\n", + "3. [Prepare the model for fine tuning and evaluation](#3.-Prepare-the-model-for-fine-tuning-and-evaluation)\n", + "4. [Export the model](#4.-Export-the-model)\n", + "5. 
[Reload the model and make predictions](#5.-Reload-the-model-and-make-predictions)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "454a6685", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions in the [setup.md](../../setup.md) to set up a PyTorch environment with all the dependencies required to run the notebook." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0b2b3bf9", + "metadata": {}, + "outputs": [], + "source": [ + "import intel_extension_for_pytorch as ipex\n", + "import logging\n", + "import numpy as np\n", + "import os\n", + "import pandas as pd\n", + "import sys\n", + "import torch\n", + "import warnings\n", + "import typing\n", + "import pickle\n", + "\n", + "from tqdm.auto import tqdm\n", + "from torch.optim import AdamW\n", + "from torch.utils.data import DataLoader\n", + "from datasets import ClassLabel, load_dataset, load_metric, Split\n", + "from datasets import logging as datasets_logging\n", + "from transformers.utils import logging as transformers_logging\n", + "from transformers import (\n", + " AutoModelForSequenceClassification,\n", + " AutoTokenizer,\n", + " Trainer,\n", + " TrainingArguments,\n", + " get_scheduler\n", + ")\n", + "from tlt.utils.file_utils import download_and_extract_zip_file\n", + "\n", + "# Set the logging stream to stdout\n", + "for handler in transformers_logging._get_library_root_logger().handlers:\n", + " handler.setStream(sys.stdout)\n", + "\n", + "sh = datasets_logging.logging.StreamHandler(sys.stdout)\n", + "\n", + "datasets_logging.set_verbosity_error()\n", + "warnings.filterwarnings('ignore')\n", + "os.environ[\"TRANSFORMERS_NO_ADVISORY_WARNINGS\"] = \"1\"" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0fdf13ec", + "metadata": {}, + "outputs": [], + "source": [ + "# Specify the name of the Hugging Face pretrained model to use (https://huggingface.co/models)\n", + "# For example: \n", + "# albert-base-v2\n", + "# bert-base-uncased\n", + "# distilbert-base-uncased\n", + "# distilbert-base-uncased-finetuned-sst-2-english\n", + "# roberta-base\n", + "model_name = \"distilbert-base-uncased\"\n", + "\n", + "# Define an output directory\n", + "output_dir = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\", model_name)\n", + "\n", + "# Define a dataset directory\n", + "dataset_dir = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + "\n", + "print(\"Model name:\", model_name)\n", + "print(\"Output directory:\", output_dir)\n", + "print(\"Dataset directory:\", dataset_dir)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "2f258d4f", + "metadata": {}, + "source": [ + "## 2. Prepare the dataset\n", + "\n", + "The notebook has two options for getting a dataset:\n", + "* Option A: Use a dataset from the [Hugging Face Datasets catalog](https://huggingface.co/datasets)\n", + "* Option B: Use a custom dataset (downloaded from another source or from your local system)\n", + "\n", + "In both cases, the code ends up defining [`datasets.Dataset`](https://huggingface.co/docs/datasets/package_reference/main_classes#datasets.Dataset) objects for the train and evaluation splits.\n", + "\n", + "Execute the following cell to load the tokenizer and declare the base class used for the dataset setup.\n", 
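+ "\n", + "As a quick illustration of what the tokenizer produces (a sketch; the model name and sample text here are arbitrary examples):\n", + "```python\n", + "tok = AutoTokenizer.from_pretrained(\"distilbert-base-uncased\")\n", + "enc = tok(\"A great movie!\", padding=\"max_length\", truncation=True)\n", + "print(list(enc.keys()))  # e.g. ['input_ids', 'attention_mask']\n", + "```" 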
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "649c5c22", + "metadata": {}, + "outputs": [], + "source": [ + "# Load the tokenizer\n", + "tokenizer = AutoTokenizer.from_pretrained(model_name)\n", + "\n", + "class TextClassificationData():\n", + " \"\"\"\n", + " Base class used for defining the text classification dataset being used. Defines Hugging Face datasets.Dataset\n", + " objects for train and evaluation splits, along with helper functions for preprocessing the dataset.\n", + " \"\"\"\n", + "\n", + " def __init__(self, dataset_name, tokenizer, sentence1_key, sentence2_key, label_key):\n", + " self.tokenizer = tokenizer\n", + " self.dataset_name = dataset_name\n", + " self.class_labels = None\n", + " \n", + " # Tokenized train and eval ds\n", + " self.train_ds = None\n", + " self.eval_ds = None\n", + " \n", + " # Column keys\n", + " self.sentence1_key = sentence1_key\n", + " self.sentence2_key = sentence2_key\n", + " self.label_key = label_key\n", + " \n", + " def tokenize_function(self, examples):\n", + " # Define the tokenizer args, depending on if the data has 2 sentences or just 1\n", + " args = ((examples[self.sentence1_key],) if self.sentence2_key is None \\\n", + " else (examples[self.sentence1_key], examples[self.sentence2_key]))\n", + " return self.tokenizer(*args, padding=\"max_length\", truncation=True)\n", + " \n", + " def tokenize_dataset(self, dataset):\n", + " # Apply the tokenize function to the dataset\n", + " tokenized_dataset = dataset.map(self.tokenize_function, batched=True)\n", + "\n", + " # Remove the raw text from the tokenized dataset\n", + " raw_text_columns = [self.sentence1_key, self.sentence2_key] if self.sentence2_key else [self.sentence1_key]\n", + " return tokenized_dataset.remove_columns(raw_text_columns)\n", + " \n", + " def define_train_eval_splits(self, dataset, train_split_name, eval_split_name, train_size=None, eval_size=None):\n", + " # Fall back to the full split when no size is given\n", + " self.train_ds = dataset[train_split_name].shuffle().select(range(train_size)) if train_size \\\n", + " else dataset[train_split_name] \n", + " self.eval_ds = dataset[eval_split_name].shuffle().select(range(eval_size)) if eval_size \\\n", + " else dataset[eval_split_name]\n", + " \n", + " def get_label_names(self):\n", + " if self.class_labels:\n", + " return self.class_labels.names\n", + " else:\n", + " raise ValueError(\"Class labels were not defined\")\n", + " \n", + " def display_sample(self, split_name=\"train\", sample_size=7):\n", + " # Display a sample of the raw data\n", + " sentence1_sample = self.dataset[split_name][self.sentence1_key][:sample_size]\n", + " sentence2_sample = self.dataset[split_name][self.sentence2_key][:sample_size] if self.sentence2_key else None\n", + " label_sample = self.dataset[split_name][self.label_key][:sample_size]\n", + " dataset_sample = zip(sentence1_sample, sentence2_sample, label_sample) if self.sentence2_key \\\n", + " else zip(sentence1_sample, label_sample)\n", + "\n", + " columns = [self.sentence1_key, self.sentence2_key, self.label_key] if self.sentence2_key else \\\n", + " [self.sentence1_key, self.label_key]\n", + "\n", + " # Display the sample using a dataframe\n", + " sample = pd.DataFrame(dataset_sample, columns=columns)\n", + " return sample.style.hide()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "fd8512e1", + "metadata": {}, + "source": [ + "Now that the base class is defined, either run [Option A to use the Hugging Face Dataset catalog](#Option-A:-Use-a-Hugging-Face-dataset) or [Option B 
for a custom dataset](#Option-B:-Use-a-custom-dataset) downloaded from the web or from your local system." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "640e5611", + "metadata": {}, + "source": [ + "### Option A: Use a Hugging Face dataset\n", + "\n", + "[Hugging Face Datasets](https://huggingface.co/datasets) has a catalog of datasets that can be specified by name. Information about the dataset is available in the catalog (including information on the size of the dataset and the splits).\n", + "\n", + "The next cell gets the [IMDb movie review dataset](https://huggingface.co/datasets/imdb) using the Hugging Face datasets API. If the notebook is executed multiple times, the dataset will be used from the dataset directory, to speed up the time that it takes to run.\n", + "\n", + "The IMDb dataset in Hugging Face has 3 splits: `train`, `test`, and `unsupervised`. This notebook will be using data from the `train` split for training and data from the `test` split for evaluation. The data has 2 columns: `text` (string with the movie review) and `label` (integer class label). The code in the next cell is set up to run using the IMDb dataset, so note that if a different dataset is being used, you may need to change the split names and/or the column names." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9a1d5fc0", + "metadata": {}, + "outputs": [], + "source": [ + "class HFDSTextClassificationData(TextClassificationData):\n", + " \"\"\"\n", + " Class used for loading and preprocessing text classification datasets from the Hugging Face datasets catalog\n", + " \"\"\"\n", + " \n", + " def __init__(self, tokenizer, dataset_dir, dataset_name, train_size, eval_size, train_split_name,\n", + " eval_split_name, sentence1_key, sentence2_key, label_key):\n", + " \"\"\"\n", + " Initialize the HFDSTextClassificationData class for a text classification dataset from Hugging Face.\n", + " \n", + " :param tokenizer: Tokenizer to preprocess the dataset\n", + " :param dataset_dir: Cache directory used when loading the dataset\n", + " :param dataset_name: Name of the dataset to load from the Hugging Face catalog\n", + " :param train_size: Size of the training dataset. For quicker training or debug, use a subset of the data.\n", + " Set to `None` to use all the data.\n", + " :param eval_size: Size of the evaluation dataset.\n", + " :param train_split_name: String specifying which split to load for training (e.g. \"train[:80%]\"). 
 to load for training (e.g. \"train\" or\n", + " datasets.Split.TRAIN). The value must be one of the split names in the\n", + " loaded dataset.\n", + " :param eval_split_name: Name of the split to load for evaluation.\n", + " :param sentence1_key: Name of the sentence1 column\n", + " :param sentence2_key: Name of the sentence2 column or `None` if there's only one text column\n", + " :param label_key: Name of the label column\n", + " \"\"\"\n", + "\n", + " # Init base class\n", + " TextClassificationData.__init__(self, dataset_name, tokenizer, sentence1_key, sentence2_key, label_key) \n", + " \n", + " # Load the dataset from the Hugging Face dataset API\n", + " self.dataset = load_dataset(dataset_name, cache_dir=dataset_dir)\n", + "\n", + " # Tokenize the dataset\n", + " tokenized_dataset = self.tokenize_dataset(self.dataset)\n", + "\n", + " # Get the training and eval dataset based on the specified dataset sizes\n", + " self.define_train_eval_splits(tokenized_dataset, train_split_name, eval_split_name, train_size, eval_size)\n", + "\n", + " # Save the class label information to use later when predicting\n", + " self.class_labels = self.dataset[train_split_name].features[label_key]\n", + "\n", + "# Name of the Hugging Face dataset\n", + "dataset_name = \"imdb\"\n", + "\n", + "# For quicker training and debug runs, use a subset of the dataset by specifying the size of the train/eval datasets.\n", + "# Set the sizes to `None` to use the full dataset. The full IMDb dataset has 25,000 training and 25,000 test examples.\n", + "train_dataset_size = 1000\n", + "eval_dataset_size = 1000\n", + "\n", + "# Name of the columns in the dataset (the column names may vary if you are not using the IMDb dataset)\n", + "sentence1_key = \"text\"\n", + "sentence2_key = None\n", + "label_key = \"label\"\n", + "\n", + "dataset = HFDSTextClassificationData(tokenizer, dataset_dir, dataset_name, train_dataset_size, eval_dataset_size,\n", + " Split.TRAIN, Split.TEST, sentence1_key, sentence2_key, label_key)\n", + "\n", + "# Print a sample of the data\n", + "dataset.display_sample(Split.TRAIN, sample_size=5)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "362625ec", + "metadata": {}, + "source": [ + "Skip to Step 3 [Prepare the model for fine tuning and evaluation](#3.-Prepare-the-model-for-fine-tuning-and-evaluation) to continue using the dataset from the Hugging Face catalog." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "28c0ba36", + "metadata": {}, + "source": [ + "### Option B: Use a custom dataset\n", + "\n", + "Instead of using a dataset from the Hugging Face dataset catalog, a custom dataset from your local system or a download can be used.\n", + "\n", + "In this example, we download the [SMS Spam Collection dataset](https://archive.ics.uci.edu/ml/datasets/sms+spam+collection). (Note: Please see this dataset's applicable license for terms and conditions. Intel Corporation does not own the rights to this data set and does not confer any rights to it.) The zip file has a single tab-separated value file with two columns. The first column is the label (`ham` or `spam`) and the second column is the text of the SMS message:\n", + "```\n", + "\t\n", + "\t\n", + "\t\n", + "...\n", + "```\n", + "If you are using a custom dataset that has a similarly formatted csv or tsv file, you can use the class defined below. Create your object by passing in custom values for csv file name, delimiter, the label map, mapping function, etc."
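, + "\n", + "Before the full class is defined, the next cell shows the underlying Hugging Face `datasets` call in isolation. This is a minimal sketch rather than part of the notebook's pipeline (the file path is hypothetical), so the cell is safe to skip." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1b7d0c55", + "metadata": {}, + "outputs": [], + "source": [ + "# Minimal sketch: load a two-column TSV with the Hugging Face datasets API.\n", + "# The path below is hypothetical -- substitute a real file before running this cell.\n", + "sketch_ds = load_dataset(\"csv\",\n", + " data_files={\"train\": \"/path/to/my_data.tsv\"},\n", + " delimiter=\"\\t\",\n", + " column_names=[\"label\", \"text\"])\n", + "print(sketch_ds[\"train\"][0])"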
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "c706bfbf", + "metadata": {}, + "outputs": [], + "source": [ + "class CustomCsvTextClassificationData(TextClassificationData):\n", + " \"\"\"\n", + " Class used for loading and preprocessing text classification datasets from CSV files\n", + " \"\"\"\n", + " \n", + " def __init__(self, tokenizer, dataset_name, dataset_dir, data_files, delimiter, label_names, sentence1_key, sentence2_key,\n", + " label_key, train_percent=0.8, eval_percent=0.2, train_size=None, eval_size=None, map_function=None):\n", + " \"\"\"\n", + " Initialize the CustomCsvTextClassificationData class for a text classification\n", + " dataset. The class uses the Hugging Face datasets API to load the CSV file\n", + " and split it into train and eval datasets based on the specified percentages.\n", + " If train_size and eval_size are also defined, the datasets are reduced to the\n", + " specified number of examples.\n", + " \n", + " :param tokenizer: Tokenizer to preprocess the dataset\n", + " :param dataset_name: Dataset name for identification purposes\n", + " :param dataset_dir: Directory where the csv file(s) are located\n", + " :param data_files: List of data file names\n", + " :param delimiter: Delimiter for the csv files\n", + " :param label_names: List of label names\n", + " :param sentence1_key: Name of the sentence1 column\n", + " :param sentence2_key: Name of the sentence2 column or `None` if there's only one text column\n", + " :param label_key: Name of the label column\n", + " :param train_percent: Decimal value for the percentage of the dataset that should be used for training\n", + " (e.g. 0.8 for 80%)\n", + " :param eval_percent: Decimal value for the percentage of the dataset that should be used for validation\n", + " (e.g. 0.2 for 20%)\n", + " :param train_size: Size of the training dataset. For quicker training or debug, use a subset of the data.\n", + " Set to `None` to use all the data.\n", + " :param eval_size: Size of the eval dataset. Set to `None` to use all the data.\n", + " :param map_function: (Optional) Map function to apply to the dataset. 
For example, if the csv file has string\n", + " labels instead of numerical values, the map function can do the conversion.\n", + " \"\"\"\n", + " # Init base class\n", + " TextClassificationData.__init__(self, dataset_name, tokenizer, sentence1_key, sentence2_key, label_key)\n", + " \n", + " if (train_percent + eval_percent) > 1:\n", + " raise ValueError(\"The combined value of the train percentage and eval percentage \" \\\n", + " \"cannot be greater than 1\")\n", + " \n", + " # Create a list of the column names\n", + " column_names = [label_key, sentence1_key, sentence2_key] if sentence2_key else [label_key, sentence1_key]\n", + " \n", + " # Load the dataset using the Hugging Face API\n", + " self.dataset = load_dataset(dataset_dir, delimiter=delimiter, data_files=data_files, column_names=column_names)\n", + " \n", + " # Optionally map the dataset labels using the map_function\n", + " if map_function:\n", + " self.dataset = self.dataset.map(map_function)\n", + " \n", + " # Set up the class labels\n", + " self.class_labels = ClassLabel(num_classes=len(label_names), names=label_names)\n", + " self.dataset[Split.TRAIN].features[label_key] = self.class_labels\n", + " \n", + " # Split the dataset based on the percentages defined\n", + " self.dataset = self.dataset[Split.TRAIN].train_test_split(train_size=train_percent, test_size=eval_percent)\n", + " \n", + " # Tokenize the dataset\n", + " tokenized_dataset = self.tokenize_dataset(self.dataset)\n", + "\n", + " # Get the training and eval dataset based on the specified dataset sizes\n", + " self.define_train_eval_splits(tokenized_dataset, Split.TRAIN, Split.TEST, train_size, eval_size)\n", + "\n", + "\n", + "# Modify the variables below to use a different dataset or a csv file on your local system.\n", + "# The csv_path variable should be pointing to a csv file with 2 columns (the label and the text)\n", + "dataset_url = \"https://archive.ics.uci.edu/static/public/228/sms+spam+collection.zip\"\n", + "dataset_dir = os.path.join(dataset_dir, \"smsspamcollection\")\n", + "csv_name = \"SMSSpamCollection\"\n", + "delimiter = \"\\t\"\n", + "label_names = [\"ham\", \"spam\"]\n", + "\n", + "# Rename the file to include the csv extension so that the dataset API knows how to load the file\n", + "renamed_csv = \"{}.csv\".format(csv_name)\n", + "\n", + "# If we don't already have the csv file, download and extract the zip file to get it.\n", + "if not os.path.exists(os.path.join(dataset_dir, csv_name)) and \\\n", + " not os.path.exists(os.path.join(dataset_dir, renamed_csv)):\n", + " download_and_extract_zip_file(dataset_url, dataset_dir)\n", + "\n", + "if not os.path.exists(os.path.join(dataset_dir, renamed_csv)):\n", + " os.rename(os.path.join(dataset_dir, csv_name), os.path.join(dataset_dir, renamed_csv))\n", + " \n", + "# Columns\n", + "sentence1_key = \"text\"\n", + "sentence2_key = None\n", + "label_key = \"label\"\n", + "\n", + "# Map function to translate labels in the csv file to numerical values when loading the dataset\n", + "def map_spam(example):\n", + " example[\"label\"] = int(example[\"label\"] == \"spam\")\n", + " return example\n", + "\n", + "dataset = CustomCsvTextClassificationData(tokenizer, \"smsspamcollection\", dataset_dir, [renamed_csv], delimiter,\n", + " label_names, sentence1_key, sentence2_key, label_key, train_size=1000,\n", + " eval_size=1000, map_function=map_spam)\n", + "\n", + "# Print a sample of the data\n", + "dataset.display_sample(Split.TRAIN, 10)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": 
"e3a24bcd", + "metadata": {}, + "source": [ + "## 3. Prepare the model for fine tuning and evaluation\n", + "\n", + "The notebook has two options to train the model.\n", + "\n", + "- Option A: Use the [`Trainer`](https://huggingface.co/docs/transformers/v4.16.2/en/main_classes/trainer#transformers.Trainer) API from Hugging Face.\n", + "- Option B: Use the native PyTorch API.\n", + "\n", + "In both cases, the model ends up being a transformers model and depending on the class constructor arguments, the appropriate API is selected.\n", + "\n", + "Execute the following cell to declare the base class used for the Text Classification Model setup." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "797485aa", + "metadata": {}, + "outputs": [], + "source": [ + "class TextClassificationModel():\n", + " \"\"\"\n", + " Class used for model loading, training and evaluation.\n", + " \"\"\"\n", + " def __init__(self, \n", + " model_name: str, \n", + " num_labels: int, \n", + " training_args: TrainingArguments = None, \n", + " ipex_optimize: bool = True, \n", + " device: str = \"cpu\"):\n", + " \"\"\"\n", + " Initialize the TextClassificationModel class for a text classification model with\n", + " PyTorch. The class uses the model_name to load the pre-trained PyTorch model from\n", + " Hugging Face. If the training_args are given then the Trainer API is selected for\n", + " training and evaluation of the model otherwise native PyTorch API is selected for\n", + " model training and evaluation\n", + " \n", + " :param model_name: Name of the pre-trained model to load from Hugging Face\n", + " :param num_labels: Number of class labels\n", + " :param training_args: A TrainingArguments object if using the Trainer API to train\n", + " the model. If None, native PyTorch API is used for training.\n", + " :param ipex_optimize: If True, then the model is optimized to run on intel hardware.\n", + " :param device: Device to run on the PyTorch model.\n", + " \"\"\"\n", + " self.model_name = model_name\n", + " self.num_labels = num_labels\n", + " self.training_args = training_args\n", + " self.device = device\n", + " self.trainer = None\n", + " \n", + " self.train_ds = dataset.train_ds\n", + " self.eval_ds = dataset.eval_ds\n", + " \n", + " # Load the model using the pretrained weights\n", + " self.model = AutoModelForSequenceClassification.from_pretrained(model_name, num_labels=num_labels)\n", + " \n", + " # Apply the ipex optimize function to the model\n", + " if ipex_optimize:\n", + " self.model = ipex.optimize(self.model)\n", + " \n", + " def train(self, \n", + " dataset: TextClassificationData,\n", + " optimizers: typing.Tuple[torch.optim.Optimizer, torch.optim.lr_scheduler.LambdaLR],\n", + " num_train_epochs: int = 1,\n", + " batch_size: int = 16,\n", + " compute_metrics: typing.Callable = None,\n", + " shuffle_samples: bool = True\n", + " ):\n", + "\n", + " # If training_args are given, we use the `Trainer` API to train the model\n", + " if self.training_args:\n", + " self.model.train()\n", + " self.trainer = Trainer(model=self.model,\n", + " args=self.training_args,\n", + " train_dataset=self.train_ds,\n", + " eval_dataset=self.eval_ds,\n", + " optimizers=optimizers,\n", + " compute_metrics=compute_metrics)\n", + " self.trainer.train()\n", + " \n", + " # If training_args are not given, we use native PyTorch API to train the model\n", + " else:\n", + " \n", + " # Rename the `label` column to `labels` because the model expects the argument to be named `labels`\n", + " self.train_ds = 
self.train_ds.rename_column(\"label\", \"labels\")\n", + " \n", + " # Set the format of the dataset to return PyTorch tensors instead of lists\n", + " self.train_ds.set_format(\"torch\")\n", + " \n", + " train_dataloader = DataLoader(self.train_ds, shuffle=shuffle_samples, batch_size=batch_size)\n", + " \n", + " # Unpack the `optimizers` parameter to get optimizer and lr_scheduler\n", + " optimizer, lr_scheduler = optimizers[0], optimizers[1]\n", + " \n", + " # Define number of training steps for the training progress bar\n", + " num_training_steps = num_train_epochs * len(train_dataloader)\n", + " progress_bar = tqdm(range(num_training_steps))\n", + " \n", + " # Training loop\n", + " self.model.to(self.device)\n", + " self.model.train()\n", + " for epoch in range(num_train_epochs):\n", + " for batch in train_dataloader:\n", + " batch = {k: v.to(self.device) for k, v in batch.items()}\n", + " outputs = self.model(**batch)\n", + " loss = outputs.loss\n", + " loss.backward()\n", + "\n", + " optimizer.step()\n", + " lr_scheduler.step()\n", + " optimizer.zero_grad()\n", + " progress_bar.update(1)\n", + " \n", + " def evaluate(self, batch_size=16):\n", + " \n", + " if self.trainer:\n", + " metrics = self.trainer.evaluate()\n", + " for key in metrics.keys():\n", + " print(\"{}: {}\".format(key, metrics[key]))\n", + " else:\n", + " # Rename the `label` column to `labels` because the model expects the argument to be named `labels`\n", + " self.eval_ds = self.eval_ds.rename_column(\"label\", \"labels\")\n", + " \n", + " # Set the format of the dataset to return PyTorch tensors instead of lists\n", + " self.eval_ds.set_format(\"torch\")\n", + " \n", + " eval_dataloader = DataLoader(self.eval_ds, batch_size=batch_size)\n", + " progress_bar = tqdm(range(len(eval_dataloader)))\n", + " \n", + " metric = load_metric(\"accuracy\")\n", + " self.model.eval()\n", + " for batch in eval_dataloader:\n", + " batch = {k: v.to(self.device) for k, v in batch.items()}\n", + " with torch.no_grad():\n", + " outputs = self.model(**batch)\n", + "\n", + " logits = outputs.logits\n", + " predictions = torch.argmax(logits, dim=-1)\n", + " metric.add_batch(predictions=predictions, references=batch[\"labels\"])\n", + " progress_bar.update(1)\n", + "\n", + " print(metric.compute())\n", + " \n", + " def predict(self, raw_input_text):\n", + " # Wrap a single string in a list so the tokenizer treats it as one example\n", + " if isinstance(raw_input_text, str):\n", + " raw_input_text = [raw_input_text]\n", + " \n", + " # Encode the raw text using the tokenizer\n", + " encoded_input = tokenizer(raw_input_text, padding=True, return_tensors='pt')\n", + " \n", + " # Input the encoded text(s) to the model and get the predicted results\n", + " self.model.eval()\n", + " output = self.model(**encoded_input)\n", + " _, predictions = torch.max(output.logits, dim=1)\n", + " \n", + " # Translate the predictions to class label strings\n", + " prediction_labels = dataset.class_labels.int2str(predictions)\n", + "\n", + " # Create a dataframe to display the results\n", + " result_list = [list(x) for x in zip(raw_input_text, prediction_labels)]\n", + " result_df = pd.DataFrame(result_list, columns=[\"Input Text\", \"Predicted Label\"])\n", + " return result_df.style.hide()\n", + " \n", + " def parameters(self):\n", + " return self.model.parameters()\n", + " \n", + " def save(self, output_dir):\n", + " self.model.save_pretrained(output_dir)\n", + " \n", + " @classmethod\n", + " def load(cls, output_dir):\n", + " return cls(output_dir, num_labels=len(dataset.get_label_names()))" + ] + }, + { + "attachments": {}, 
"cell_type": "markdown", + "id": "3e8f1edd", + "metadata": {}, + "source": [ + "Now that the `TextClassificationModel` class is defined, either use Option A to use the [`Trainer`](https://huggingface.co/docs/transformers/v4.16.2/en/main_classes/trainer#transformers.Trainer) API from Hugging Face or Option B to use the native PyTorch API." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "1a606f16", + "metadata": {}, + "source": [ + "### Option A: Use the [`Trainer`](https://huggingface.co/docs/transformers/v4.16.2/en/main_classes/trainer#transformers.Trainer) API from Hugging Face\n", + "\n", + "This step gets the pretrained model from [Hugging Face](https://huggingface.co/models) and sets up the\n", + "[TrainingArguments](https://huggingface.co/docs/transformers/v4.16.2/en/main_classes/trainer#transformers.TrainingArguments) and the\n", + "[Trainer](https://huggingface.co/docs/transformers/v4.16.2/en/main_classes/trainer#transformers.Trainer). For simplicity, this example is using default values for most of the training args, but we are specifying our output directory and the number of training epochs. If your output directory already has checkpoints from a previous run,\n", + "training will resume from the last checkpoint. The `overwrite_output_dir` training argument can be set to\n", + "`True` if you want to instead overwrite previously generated checkpoints.\n", + "\n", + "> Note that it is expected to see a warning at this step about some weights not being used. This is because\n", + "> the pretraining head from the original model is being replaced with a classification head." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "0d70a4f8", + "metadata": {}, + "outputs": [], + "source": [ + "num_train_epochs = 2\n", + "batch_size = 16\n", + "num_labels = len(dataset.get_label_names())\n", + "\n", + "# Define a TrainingArguments object for the Trainer API to use.\n", + "training_args = TrainingArguments(output_dir=output_dir, num_train_epochs=num_train_epochs)\n", + "\n", + "# Get the model from Hugging Face. 
Since we are specifying training_args, the model is trained and\n", + "# evaluated with the Trainer API.\n", + "model = TextClassificationModel(model_name=model_name, num_labels=num_labels, training_args=training_args)\n", + "\n", + "# Define model training parameters\n", + "learning_rate = 5e-5\n", + "optimizer = AdamW(model.parameters(), lr=learning_rate)\n", + "\n", + "# Number of optimizer steps: the Trainer steps the scheduler once per training batch\n", + "steps_per_epoch = (len(dataset.train_ds) + training_args.per_device_train_batch_size - 1) \\\n", + " // training_args.per_device_train_batch_size\n", + "num_training_steps = num_train_epochs * steps_per_epoch\n", + "metric = load_metric(\"accuracy\")\n", + "lr_scheduler = get_scheduler(\n", + " name=\"linear\", optimizer=optimizer, num_warmup_steps=0, num_training_steps=num_training_steps\n", + " )\n", + "\n", + "# Helper function for the Trainer API to compute metrics\n", + "def compute_metrics(eval_pred):\n", + " logits, labels = eval_pred\n", + " predictions = np.argmax(logits, axis=-1)\n", + " return metric.compute(predictions=predictions, references=labels)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "5fcabd97", + "metadata": {}, + "source": [ + "**Train and evaluate the model with the Trainer API**" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e1256c40", + "metadata": {}, + "outputs": [], + "source": [ + "model.train(\n", + " dataset, \n", + " optimizers=(optimizer, lr_scheduler), \n", + " num_train_epochs=num_train_epochs, \n", + " batch_size=batch_size,\n", + " compute_metrics=compute_metrics\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4a7afe59", + "metadata": {}, + "outputs": [], + "source": [ + "model.evaluate()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "cce10679", + "metadata": {}, + "source": [ + "### Option B: Use the native PyTorch API\n", + "\n", + "This step gets the pretrained model from [Hugging Face](https://huggingface.co/models) and uses the native PyTorch API to train and evaluate the model.\n", + "\n", + "> Note that it is expected to see a warning at this step about some weights not being used. This is because\n", + "> the pretraining head from the original model is being replaced with a classification head." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "202f6b01", + "metadata": {}, + "outputs": [], + "source": [ + "num_train_epochs = 2\n", + "batch_size = 16\n", + "num_labels = len(dataset.get_label_names())\n", + "\n", + "# Get the model from Hugging Face. 
Since we are not specifying training_args, the model is trained and\n", + "# evaluated with the native PyTorch API.\n", + "model = TextClassificationModel(model_name=model_name, num_labels=num_labels)\n", + "\n", + "# Define model training parameters\n", + "learning_rate = 5e-5\n", + "optimizer = AdamW(model.parameters(), lr=learning_rate)\n", + "\n", + "# Number of optimizer steps: the scheduler is stepped once per training batch\n", + "num_training_steps = num_train_epochs * ((len(dataset.train_ds) + batch_size - 1) // batch_size)\n", + "lr_scheduler = get_scheduler(\n", + " name=\"linear\", optimizer=optimizer, num_warmup_steps=0, num_training_steps=num_training_steps\n", + " )" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "f4821e46", + "metadata": {}, + "source": [ + "**Train and evaluate the model with the native PyTorch API**" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "eeb2e694", + "metadata": {}, + "outputs": [], + "source": [ + "model.train(\n", + " dataset, \n", + " optimizers=(optimizer, lr_scheduler), \n", + " num_train_epochs=num_train_epochs, \n", + " batch_size=batch_size\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "7ff3b884", + "metadata": {}, + "outputs": [], + "source": [ + "model.evaluate()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "b83b873f", + "metadata": {}, + "source": [ + "## 4. Export the model" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "faa4beb3", + "metadata": {}, + "outputs": [], + "source": [ + "# Save the model to our output directory\n", + "model.save(output_dir)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "49449342", + "metadata": {}, + "source": [ + "## 5. Reload the model and make predictions\n", + "\n", + "The output directory is used to reload the model. In the next cell, we evaluate the reloaded model to verify that we are getting the same metrics that we saw after fine tuning." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "e339d50d", + "metadata": {}, + "outputs": [], + "source": [ + "reloaded_model = TextClassificationModel.load(output_dir)\n", + " \n", + "reloaded_model.evaluate()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "c70a5386", + "metadata": {}, + "source": [ + "Next, we demonstrate how to encode raw text input and get predictions from the reloaded model." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "40d231c0", + "metadata": {}, + "outputs": [], + "source": [ + "# Set up some raw text input\n", + "if dataset.dataset_name == \"imdb\":\n", + " raw_text_input = [\"It was okay. I finished it, but wouldn't watch it again.\",\n", + " \"So bad\",\n", + " \"Definitely not my favorite\",\n", + " \"Highly recommended\"]\n", + "elif dataset.dataset_name == \"smsspamcollection\":\n", + " raw_text_input = [\"Happy Birthday!\",\n", + " \"Thank you for your order, please click the following link for tracking info 12345678\",\n", + " \"Congratulations! You have won a free trip to Australia!!! Reply back with your full name and address.\",\n", + " \"Can you get some milk while you're at the store?\",\n", + " \"On my way\",\n", + " \"OMG LOL :D\",\n", + " \"Urgent! The IRS has been trying to contact you regarding your tax return. 
Please call 555-555-5555 immediately\"]\n", + "else:\n", + " # Define your own input text when using another dataset\n", + " raw_text_input = []\n", + "\n", + "\n", + "reloaded_model.predict(raw_text_input)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "bee40324", + "metadata": {}, + "source": [ + "## Citations\n", + "\n", + "```\n", + "@InProceedings{maas-EtAl:2011:ACL-HLT2011,\n", + " author = {Maas, Andrew L. and Daly, Raymond E. and Pham, Peter T. and Huang, Dan and Ng, Andrew Y. and Potts, Christopher},\n", + " title = {Learning Word Vectors for Sentiment Analysis},\n", + " booktitle = {Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies},\n", + " month = {June},\n", + " year = {2011},\n", + " address = {Portland, Oregon, USA},\n", + " publisher = {Association for Computational Linguistics},\n", + " pages = {142--150},\n", + " url = {http://www.aclweb.org/anthology/P11-1015}\n", + "}\n", + "\n", + "@misc{misc_sms_spam_collection_228,\n", + " author = {Almeida, Tiago},\n", + " title = {{SMS Spam Collection}},\n", + " year = {2012},\n", + " howpublished = {UCI Machine Learning Repository}\n", + "}\n", + "```\n", + "Please see this dataset's applicable license for terms and conditions. Intel Corporation does not own the rights to this data set and does not confer any rights to it." + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.10" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/notebooks/text_classification/pytorch_text_classification/README.md b/notebooks/text_classification/pytorch_text_classification/README.md new file mode 100644 index 0000000000000000000000000000000000000000..da9c58fd836b60a843cc4f7a701b6e446a37a632 --- /dev/null +++ b/notebooks/text_classification/pytorch_text_classification/README.md @@ -0,0 +1,48 @@ +# Text Classifier fine tuning with PyTorch + +This notebook demonstrates fine tuning [pretrained models from Hugging Face](https://huggingface.co/models) +using text classification datasets from the [Hugging Face Datasets catalog](https://huggingface.co/datasets) or +a custom dataset. The [IMDb Large Movie Review dataset](https://ai.stanford.edu/~amaas/data/sentiment/) is used +from the Hugging Face Datasets catalog, and the [SMS Spam Collection dataset](https://archive.ics.uci.edu/ml/datasets/sms+spam+collection) +is used as an example of a custom dataset being loaded from a csv file. + +The notebook uses +[Intel® Extension for PyTorch\*](https://intel.github.io/intel-extension-for-pytorch) which extends PyTorch +with optimizations for an extra performance boost on Intel hardware. + +The notebook performs the following steps: +1. Import dependencies and setup parameters +2. Prepare the dataset +3. Prepare the model for fine tuning and evaluation +4. Export the model +5. Reload the model and make predictions + +## Running the notebook + +To run the notebook, follow the instructions to set up the [PyTorch notebook environment](/notebooks/setup.md). + +## References + +Dataset Citations +``` +@InProceedings{maas-EtAl:2011:ACL-HLT2011, + author = {Maas, Andrew L. and Daly, Raymond E. and Pham, Peter T. and Huang, Dan and Ng, Andrew Y. 
and Potts, Christopher}, + title = {Learning Word Vectors for Sentiment Analysis}, + booktitle = {Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies}, + month = {June}, + year = {2011}, + address = {Portland, Oregon, USA}, + publisher = {Association for Computational Linguistics}, + pages = {142--150}, + url = {http://www.aclweb.org/anthology/P11-1015} +} + +@misc{misc_sms_spam_collection_228, + author = {Almeida, Tiago}, + title = {{SMS Spam Collection}}, + year = {2012}, + howpublished = {UCI Machine Learning Repository} +} +``` +Please see this dataset's applicable license for terms and conditions. Intel Corporation does not own the rights to this data set and does not confer any rights to it. + diff --git a/notebooks/text_classification/tfhub_text_classification/BERT_Binary_Text_Classification.ipynb b/notebooks/text_classification/tfhub_text_classification/BERT_Binary_Text_Classification.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..6877c1d4ebb34c463ab1821a1e36abb67c5415ea --- /dev/null +++ b/notebooks/text_classification/tfhub_text_classification/BERT_Binary_Text_Classification.ipynb @@ -0,0 +1,667 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Binary text classification using BERT models from TF Hub\n", + "\n", + "This notebook demonstrates fine tuning BERT models from [TF Hub](https://tfhub.dev) with binary text classification datasets.\n", + "\n", + "The notebook performs the following steps:\n", + "1. [Import dependencies and setup parameters](#1.-Import-dependencies-and-setup-parameters)\n", + "2. [Prepare the dataset](#2.-Prepare-the-dataset)\n", + "3. [Build the model](#3.-Build-the-model)\n", + "4. [Fine tuning and evaluation](#4.-Fine-tuning-and-evaluation)\n", + "5. [Export the model](#5.-Export-the-model)\n", + "6. [Reload the model and make predictions](#6.-Reload-the-model-and-make-predictions)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions in the [README.md](/notebooks/README.md) to set up a TensorFlow environment with all the dependencies required to run the notebook." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "import pandas as pd\n", + "import tensorflow as tf\n", + "import tensorflow_hub as hub\n", + "import tensorflow_datasets as tfds\n", + "\n", + "from bert_utils import get_model_map\n", + "from tlt.utils.file_utils import download_and_extract_zip_file" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Note that tensorflow_text isn't used directly but the import is required to register ops used by the\n", + "# BERT text preprocessor\n", + "! pip3 install tensorflow-text==2.12 --no-deps\n", + "import tensorflow_text" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "This notebook will run one of the supported [BERT models from TF Hub](https://tfhub.dev/google/collections/bert/1). The table below has a list of the available models and links to their URLs in TF Hub."
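, + "\n", + "The code in this notebook only relies on each map entry providing a `preprocess` URL and a `bert_encoder` URL, so the JSON file is expected to look roughly like the illustrative entry below (the real file may carry additional fields):\n", + "```json\n", + "{\n", + "  \"small_bert/bert_en_uncased_L-2_H-128_A-2\": {\n", + "    \"preprocess\": \"https://tfhub.dev/tensorflow/bert_en_uncased_preprocess/3\",\n", + "    \"bert_encoder\": \"https://tfhub.dev/tensorflow/small_bert/bert_en_uncased_L-2_H-128_A-2/2\"\n", + "  }\n", + "}\n", + "```"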
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Load the TF Hub model map from json and print a list of the supported models\n", + "tfhub_model_map, models_df = get_model_map(\"tfhub_bert_model_map_classifier.json\", return_data_frame=True)\n", + "models_df.style.hide(axis=\"index\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Specify the name of the BERT model to use. This string must match one of the models listed in the table above." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "model_name = \"small_bert/bert_en_uncased_L-2_H-128_A-2\"\n", + "if model_name not in tfhub_model_map.keys():\n", + " raise ValueError(\"The specified model name ({}) is not supported\".format(model_name))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Define a directory to download the dataset\n", + "dataset_directory = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + "\n", + "# Define an output directory for the saved model to be exported\n", + "output_directory = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "# Output directory for logs and checkpoints generated during training\n", + "if not os.path.isdir(output_directory):\n", + " os.makedirs(output_directory)\n", + " \n", + "tfhub_preprocess = tfhub_model_map[model_name][\"preprocess\"]\n", + "tfhub_bert_encoder = tfhub_model_map[model_name][\"bert_encoder\"]\n", + "\n", + "print(\"Using TF Hub model:\", model_name)\n", + "print(\"BERT encoder URL:\", tfhub_bert_encoder)\n", + "print(\"Preprocessor URL:\", tfhub_preprocess)\n", + "print(\"Dataset directory:\", dataset_directory)\n", + "print(\"Output directory:\", output_directory)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 2. Prepare the dataset\n", + "\n", + "The notebook has two options for getting a dataset:\n", + "* Option A: Use a dataset from the [TensorFlow Datasets catalog](https://www.tensorflow.org/datasets/catalog/overview)\n", + "* Option B: Use a custom dataset (downloaded from another source or from your local system)\n", + "\n", + "In both cases, the code ends up defining [`tf.data.Dataset`](https://www.tensorflow.org/api_docs/python/tf/data/Dataset) objects for each split (train, validation, and test) and a map for translating the numerical label to its string label.\n", + "\n", + "Execute the following cell to set the batch size and declare the base class used for the dataset setup."
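, + "\n", + "For example, once a `dataset` object is constructed below, the `get_str_label` helper rounds a raw model score before looking it up in the label map, so (assuming the IMDb label map used in Option A) calls would behave roughly like this:\n", + "```python\n", + "dataset.get_str_label(0.83)  # rounds to 1 -> \"Positive\"\n", + "dataset.get_str_label(0)     # -> \"Negative\"\n", + "```"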
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Define the dataset batch size\n", + "batch_size = 32\n", + "\n", + "# Base class used for defining the binary text classification dataset being used\n", + "class BinaryTextClassificationData():\n", + " def __init__(self, batch_size, label_map):\n", + " self.batch_size = batch_size\n", + " self.label_map = label_map\n", + " self.reverse_label_map = {}\n", + " self.train_ds = None\n", + " self.val_ds = None\n", + " self.test_ds = None\n", + " self.dataset_name = \"\"\n", + " \n", + " for k, v in self.label_map.items():\n", + " self.reverse_label_map[v] = k\n", + " \n", + " def get_str_label(self, numerical_value):\n", + " if not isinstance(numerical_value, int):\n", + " numerical_value = int(tf.math.round(numerical_value))\n", + " \n", + " if numerical_value in self.label_map.keys():\n", + " return self.label_map[numerical_value]\n", + " else:\n", + " raise ValueError(\"The key {} was not found in the label map\".format(numerical_value))" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Now that the base class is defined, either run [Option A to use the TensorFlow Dataset catalog](#Option-A:-Use-a-TensorFlow-dataset) or [Option B for a custom dataset](#Option-B:-Use-a-custom-dataset) downloaded from the web or stored on your local system." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Option A: Use a TensorFlow dataset\n", + "\n", + "[TensorFlow Datasets](https://www.tensorflow.org/datasets) has a [catalog of datasets](https://www.tensorflow.org/datasets/catalog/overview) that can be specified by name. Information about the dataset is available in the catalog (including information on the size of the dataset and the splits).\n", + "\n", + "The next cell demonstrates using the [`imdb_reviews`](https://www.tensorflow.org/datasets/catalog/imdb_reviews) dataset from the TensorFlow datasets catalog to get splits for training, validation, and test. Skip the next cell if you would like to instead use \"Option B\" for a custom dataset." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "class TFDSBinaryTextClassificationData(BinaryTextClassificationData):\n", + " def __init__(self, dataset_dir, tfds_name, train_split, val_split, test_split, label_map, batch_size):\n", + " \"\"\"\n", + " Initialize the TFDSBinaryTextClassificationData class for a binary text classification dataset\n", + " from the TensorFlow dataset catalog.\n", + " \n", + " :param dataset_dir: Path to a dataset directory to read/write data\n", + " :param tfds_name: String name of the TensorFlow dataset to load\n", + " :param train_split: String specifying which split to load for training (e.g. \"train[:80%]\"). 
See the\n", + " https://www.tensorflow.org/datasets/splits documentation for more information on\n", + " defining splits.\n", + " :param val_split: String specifying the split to load for validation.\n", + " :param test_split: String specifying the split to load for test.\n", + " :param label_map: Dictionary where the key is a numerical value and the value is the string label\n", + " :param batch_size: Batch size\n", + " \"\"\"\n", + " # Init base class\n", + " BinaryTextClassificationData.__init__(self, batch_size, label_map) \n", + " \n", + " [self.train_ds, self.val_ds, self.test_ds], info = tfds.load(tfds_name,\n", + " data_dir=dataset_dir,\n", + " split=[train_split, val_split, test_split],\n", + " batch_size=batch_size,\n", + " as_supervised=True,\n", + " shuffle_files=True,\n", + " with_info=True)\n", + " self.dataset_name = tfds_name\n", + " print(info)\n", + "\n", + "\n", + "# Name of the TFDS to use\n", + "tfds_name=\"imdb_reviews\"\n", + "\n", + "# Location where the dataset will be downloaded\n", + "dataset_directory = os.path.join(dataset_directory, tfds_name)\n", + "if not os.path.isdir(dataset_directory):\n", + " os.makedirs(dataset_directory)\n", + "\n", + "# Label map for sentiment analysis\n", + "label_map = {\n", + " 1: \"Positive\",\n", + " 0: \"Negative\"\n", + "}\n", + " \n", + "# Initialize the dataset splits using a dataset from the TensorFlow datasets catalog\n", + "# (the validation slice is chosen so that it does not overlap the training slice)\n", + "dataset = TFDSBinaryTextClassificationData(dataset_dir=dataset_directory,\n", + " tfds_name=tfds_name,\n", + " train_split=\"train[:50%]\",\n", + " val_split=\"train[50%:70%]\",\n", + " test_split=\"test[:20%]\",\n", + " label_map=label_map,\n", + " batch_size=batch_size)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Skip to the next step [3. Build the model](#3.-Build-the-model) to continue using the TF dataset." + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Option B: Use a custom dataset\n", + "\n", + "Instead of using a dataset from TensorFlow datasets, another dataset from your local system or a download can be used. \n", + "\n", + "In this example, we download the [SMS Spam Collection dataset](https://archive.ics.uci.edu/ml/datasets/sms+spam+collection). (Note: Please see this dataset's applicable license for terms and conditions. Intel Corporation does not own the rights to this data set and does not confer any rights to it.) The zip file has a single tab-separated value file with two columns. The first column is the label (`ham` or `spam`) and the second column is the text of the SMS message:\n", + "```\n", + "\t\n", + "\t\n", + "\t\n", + "...\n", + "```\n", + "If you are using a custom dataset that has a similarly formatted csv or tsv file, you can still use the class defined below. Just create your object by passing in custom values for delimiter, header (whether the file has a header row), the label map, mapping function, etc."
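, + "\n", + "For reference, the parsing step at the heart of the class below is `tf.data.experimental.CsvDataset`. A minimal standalone sketch (the path here is hypothetical) looks like this:\n", + "```python\n", + "raw_ds = tf.data.experimental.CsvDataset(filenames=\"/path/to/my_data.tsv\",\n", + "                                         record_defaults=[tf.string, tf.string],  # label, text\n", + "                                         field_delim=\"\\t\",\n", + "                                         header=False)\n", + "for label, text in raw_ds.take(2):\n", + "    print(label.numpy(), text.numpy())\n", + "```"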
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "class CustomCsvBinaryTextClassificationData(BinaryTextClassificationData):\n", + " def __init__(self, csv_file, delimiter, header, train_percent, val_percent,\n", + " test_percent, label_map, batch_size, dataset_name, map_function=None):\n", + " \"\"\"\n", + " Initialize the CustomCsvBinaryTextClassificationData class for a binary text\n", + " classification dataset that uses a single csv file.\n", + " \n", + " :param csv_file: Path to the csv file\n", + " :param delimiter: String character that separates the fields in each row\n", + " :param header: Boolean indicating whether or not the csv file has a header line that should be skipped\n", + " :param train_percent: Decimal value for the percentage of the dataset that should be used for training\n", + " (e.g. 0.8 for 80%)\n", + " :param val_percent: Decimal value for the percentage of the dataset that should be used for validation\n", + " (e.g. 0.1 for 10%)\n", + " :param test_percent: Decimal value for the percentage of the dataset that should be used for test\n", + " (e.g. 0.1 for 10%)\n", + " :param label_map: Dictionary where the key is a numerical value and the value is the string label\n", + " :param batch_size: Batch size\n", + " :param dataset_name: Name of the dataset. This is used later in this notebook for naming the saved model\n", + " export folder and determining which input strings to use when testing the reloaded model\n", + " :param map_function: (Optional) If the csv file has string labels instead of the numerical values, provide a\n", + " map function to apply on the dataset\n", + " \"\"\"\n", + " # Init base class\n", + " BinaryTextClassificationData.__init__(self, batch_size, label_map)\n", + " \n", + " self.dataset_name = dataset_name\n", + " \n", + " if (train_percent + val_percent + test_percent) > 1:\n", + " raise ValueError(\"The combined value of the train percentage, validation percentage, and \" \\\n", + " \"test percentage cannot be greater than 1\")\n", + " \n", + " if not os.path.exists(csv_file):\n", + " raise FileNotFoundError(\"Unable to find the csv file at\", csv_file)\n", + " \n", + " custom_dataset = tf.data.experimental.CsvDataset(filenames=csv_file,\n", + " record_defaults=[tf.string, tf.string],\n", + " field_delim=delimiter,\n", + " use_quote_delim=False,\n", + " header=header)\n", + " \n", + " # Count the number of lines in the csv file to get the dataset length\n", + " with open(csv_file) as f:\n", + " custom_dataset_len = sum(1 for _ in f)\n", + " \n", + " if header:\n", + " custom_dataset_len -= 1\n", + " \n", + " # Optionally map the dataset labels using the map_function\n", + " if map_function:\n", + " custom_dataset = custom_dataset.map(lambda x, y: (y, map_function(x)))\n", + " \n", + " # Create batches based on the specified batch size\n", + " custom_dataset = custom_dataset.batch(batch_size)\n", + " \n", + " # Calculate sizes for the splits\n", + " total_num_batches = int(custom_dataset_len / batch_size)\n", + " train_size = int(train_percent * total_num_batches)\n", + " val_size = int(val_percent * total_num_batches)\n", + " test_size = int(test_percent * total_num_batches)\n", + "\n", + " # Create the train, validation, and test splits\n", + " self.train_ds = custom_dataset.take(train_size) \n", + " self.val_ds = custom_dataset.skip(train_size).take(val_size)\n", + " self.test_ds = custom_dataset.skip(train_size).skip(val_size)\n", + "\n", + " # Set the cardinality so that progress 
bars will work properly\n", + " self.train_ds = self.train_ds.apply(tf.data.experimental.assert_cardinality(train_size))\n", + " self.val_ds = self.val_ds.apply(tf.data.experimental.assert_cardinality(val_size))\n", + " self.test_ds = self.test_ds.apply(tf.data.experimental.assert_cardinality(test_size))\n", + "\n", + "\n", + "# Modify the variables below to use a different dataset or a csv file on your local system.\n", + "# The csv_path variable should be pointing to a csv file with 2 columns (the label and the text)\n", + "dataset_url = \"https://archive.ics.uci.edu/static/public/228/sms+spam+collection.zip\"\n", + "dataset_directory = os.path.join(dataset_directory, \"smsspamcollection\")\n", + "csv_name = \"SMSSpamCollection\"\n", + "delimiter = \"\\t\"\n", + "header = False # Set to true if the csv file has a header row\n", + "csv_path = os.path.join(dataset_directory, csv_name)\n", + "\n", + "# If we don't already have the csv file, download and extract the zip file to get it.\n", + "if not os.path.exists(csv_path):\n", + " download_and_extract_zip_file(dataset_url, dataset_directory)\n", + "\n", + "# Define the label map for your dataset. The label map below is for the SMS Spam Collection dataset.\n", + "# The labels defined in this dictionary should match the labels in the csv file.\n", + "label_map = {\n", + " 1: \"spam\",\n", + " 0: \"ham\"\n", + "}\n", + "\n", + "# Map function to translate labels in the csv file to numerical values when loading the dataset\n", + "def map_spam(x):\n", + " if x == \"spam\":\n", + " return 1\n", + " else:\n", + " return 0\n", + "\n", + "# Initialize the dataset splits using the custom dataset\n", + "dataset = CustomCsvBinaryTextClassificationData(csv_file=csv_path,\n", + " delimiter=delimiter,\n", + " header=header,\n", + " train_percent=0.8,\n", + " val_percent=0.1,\n", + " test_percent=0.1,\n", + " label_map=label_map,\n", + " batch_size=batch_size,\n", + " dataset_name=csv_name,\n", + " map_function=map_spam)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 3. Build the model\n", + "\n", + "Create the BERT model to fine tune using an input layer, the preprocessing layer (from TF Hub), the BERT encoder layer (from TF Hub), a dropout layer, and one dense classifier layer." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "input_layer = tf.keras.layers.Input(shape=(), dtype=tf.string, name='input_layer')\n", + "preprocessing_layer = hub.KerasLayer(tfhub_preprocess, name='preprocessing')\n", + "encoder_inputs = preprocessing_layer(input_layer)\n", + "encoder_layer = hub.KerasLayer(tfhub_bert_encoder, trainable=True, name='encoder')\n", + "outputs = encoder_layer(encoder_inputs)\n", + "net = outputs['pooled_output']\n", + "net = tf.keras.layers.Dropout(0.1)(net)\n", + "net = tf.keras.layers.Dense(1, activation=None, name='classifier')(net)\n", + "classifier_model = tf.keras.Model(input_layer, net)\n", + "\n", + "classifier_model.summary()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 4. Fine tuning and evaluation\n", + "\n", + "Train the model for the specified number of epochs, then evaluate the model using the test dataset."
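, + "\n", + "If you would like training to stop automatically once the validation metric stops improving, a `tf.keras.callbacks.EarlyStopping` callback can be passed to `fit`. This is an optional sketch and is not used in the cell below:\n", + "```python\n", + "early_stop = tf.keras.callbacks.EarlyStopping(monitor=\"val_binary_accuracy\",\n", + "                                              patience=2,\n", + "                                              restore_best_weights=True)\n", + "# then: classifier_model.fit(..., callbacks=[early_stop])\n", + "```"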
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "%%time\n", + "\n", + "# The number of training epochs to run\n", + "num_train_epochs = 2\n", + "\n", + "# Learning rate\n", + "learning_rate = 3e-5\n", + "\n", + "# Maximum total input sequence length after WordPiece tokenization (longer sequences will be truncated)\n", + "max_seq_length = 128\n", + "\n", + "classifier_model.compile(optimizer=tf.keras.optimizers.Adam(learning_rate=learning_rate, epsilon=1e-08),\n", + " loss=tf.keras.losses.BinaryCrossentropy(from_logits=True),\n", + " metrics=tf.metrics.BinaryAccuracy())\n", + "\n", + "history = classifier_model.fit(dataset.train_ds,\n", + " validation_data=dataset.val_ds,\n", + " epochs=num_train_epochs)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Evaluate the accuracy using the test dataset. If the accuracy does not meet your expectations, try increasing the size of the training dataset split or the number of training epochs." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "loss, accuracy = classifier_model.evaluate(dataset.test_ds)\n", + "\n", + "print(f'Loss: {loss}')\n", + "print(f'Accuracy: {accuracy}')" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Predict using a single batch from the test dataset, and then display the results along with the input text and the actual label." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "num_steps = 1\n", + "predictions = classifier_model.predict(dataset.test_ds, batch_size=batch_size, steps=num_steps)\n", + "\n", + "prediction_list = []\n", + "step_count = 0\n", + "\n", + "for batch in dataset.test_ds:\n", + " label_list = list(batch[1].numpy())\n", + " text_list = list(batch[0].numpy())\n", + " \n", + " for i, (text, actual_label) in enumerate(zip(text_list, label_list)):\n", + " score = tf.math.sigmoid(predictions[i])\n", + " prediction = int(tf.math.round(score))\n", + " prediction = dataset.get_str_label(prediction)\n", + " prediction_list.append([text.decode('utf-8'),\n", + " tf.get_static_value(score)[0],\n", + " prediction,\n", + " dataset.get_str_label(actual_label)])\n", + " \n", + " step_count += 1\n", + " if num_steps <= step_count:\n", + " break\n", + " \n", + "result_df = pd.DataFrame(prediction_list, columns=[\"Input Text\", \"Score\", \"Predicted Label\", \"Actual Label\"])\n", + "result_df.style.hide(axis=\"index\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 5. Export the model\n", + "\n", + "Since training has completed, export the `saved_model.pb` to the output directory in a folder with the model and dataset name." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "model_dir = \"{}_{}\".format(model_name, dataset.dataset_name)\n", + "model_dir = os.path.join(output_directory, model_dir)\n", + "classifier_model.save(model_dir, include_optimizer=False)\n", + "\n", + "saved_model_path = os.path.join(model_dir, \"saved_model.pb\")\n", + "if os.path.exists(saved_model_path):\n", + " print(\"Saved model location:\", saved_model_path)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 6. 
Reload the model and make predictions\n", + "\n", + "Reload from the `saved_model.pb` in the output directory." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "reloaded_model = tf.saved_model.load(model_dir)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The next section defines a list of strings to send as input to the reloaded model. If you are using a dataset other than the [IMDB movie reviews](https://www.tensorflow.org/datasets/catalog/imdb_reviews) or the [SMS Spam Collection](https://archive-beta.ics.uci.edu/ml/datasets/sms+spam+collection), you can update the snippet below with your own list of input text." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "if dataset.dataset_name == \"imdb_reviews\":\n", + " input_text = [\"Awesome movie\",\n", + " \"It was entertaining, but completely predictable.\",\n", + " \"Wasn't what I expected, but I still enjoyed it\",\n", + " \"I wouldn't recommend this movie to my worst enemy\",\n", + " \"I'm not sure how good the movie was, because I fell asleep\"]\n", + "elif dataset.dataset_name == \"SMSSpamCollection\":\n", + " input_text = [\"Happy Birthday!\",\n", + " \"Thank you for your order, please click the following link for tracking info 12345678\",\n", + " \"Congratulations! You have won a free trip to Australia!!! Reply back with your full name and address.\",\n", + " \"Can you get some milk while you're at the store?\",\n", + " \"On my way\",\n", + " \"OMG LOL :D\",\n", + " \"Urgent! The IRS has been trying to contact you regarding your tax return. Please call 555-555-5555 immediately\"]\n", + "else:\n", + " # Define your own list of input text for another dataset\n", + " input_text = []\n", + " \n", + "if not input_text:\n", + " raise ValueError(\"Please define the list of input_text strings.\")\n", + "\n", + "# Send the input text to the reloaded model\n", + "predict_results = tf.sigmoid(reloaded_model(tf.constant(input_text)))\n", + "\n", + "# Get the results into a data frame to display\n", + "result_list = [[input_text[i],\n", + " tf.get_static_value(predict_results[i])[0],\n", + " dataset.get_str_label(tf.get_static_value(predict_results[i])[0])] for i in range(len(input_text))]\n", + "result_df = pd.DataFrame(result_list, columns=[\"Input Text\", \"Score\", \"Predicted Label\"])\n", + "result_df.style.hide(axis=\"index\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Citations\n", + "\n", + "```\n", + "@InProceedings{maas-EtAl:2011:ACL-HLT2011,\n", + " author = {Maas, Andrew L. and Daly, Raymond E. and Pham, Peter T. and Huang, Dan and Ng, Andrew Y. 
and Potts, Christopher},\n", + " title = {Learning Word Vectors for Sentiment Analysis},\n", + " booktitle = {Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies},\n", + " month = {June},\n", + " year = {2011},\n", + " address = {Portland, Oregon, USA},\n", + " publisher = {Association for Computational Linguistics},\n", + " pages = {142--150},\n", + " url = {http://www.aclweb.org/anthology/P11-1015}\n", + "}\n", + "\n", + "@misc{misc_sms_spam_collection_228,\n", + " author = {Almeida, Tiago},\n", + " title = {{SMS Spam Collection}},\n", + " year = {2012},\n", + " howpublished = {UCI Machine Learning Repository}\n", + "}\n", + "```\n", + "\n", + "Please see this dataset's applicable license for terms and conditions. Intel Corporation does not own the rights to this data set and does not confer any rights to it." + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.16" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/notebooks/text_classification/tfhub_text_classification/BERT_Multi_Text_Classification.ipynb b/notebooks/text_classification/tfhub_text_classification/BERT_Multi_Text_Classification.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..6a25165bf9078f564e6e0e689d63c1ca95bd3b2c --- /dev/null +++ b/notebooks/text_classification/tfhub_text_classification/BERT_Multi_Text_Classification.ipynb @@ -0,0 +1,660 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Multiclass text classification using BERT models from TF Hub\n", + "\n", + "This notebook demonstrates fine tuning BERT models from [TF Hub](https://tfhub.dev) with multiclass text classification datasets.\n", + "\n", + "The notebook performs the following steps:\n", + "1. [Import dependencies and setup parameters](#1.-Import-dependencies-and-setup-parameters)\n", + "2. [Prepare the dataset](#2.-Prepare-the-dataset)\n", + "3. [Build the model](#3.-Build-the-model)\n", + "4. [Fine tuning and evaluation](#4.-Fine-tuning-and-evaluation)\n", + "5. [Export the model](#5.-Export-the-model)\n", + "6. [Reload the model and make predictions](#6.-Reload-the-model-and-make-predictions)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 1. Import dependencies and setup parameters\n", + "\n", + "This notebook assumes that you have already followed the instructions in the [README.md](/notebooks/README.md) to set up a TensorFlow environment with all the dependencies required to run the notebook."
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "import pandas as pd\n", + "import tensorflow as tf\n", + "import tensorflow_hub as hub\n", + "import tensorflow_datasets as tfds\n", + "\n", + "from bert_utils import get_model_map\n", + "from tlt.utils.file_utils import download_and_extract_zip_file" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Note that tensorflow_text isn't used directly but the import is required to register ops used by the\n", + "# BERT text preprocessor\n", + "! pip3 install tensorflow-text==2.12.0 --no-deps\n", + "import tensorflow_text" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "This notebook will run one of the supported [BERT models from TF Hub](https://tfhub.dev/google/collections/bert/1). The table below has a list of the available models and links to their URLs in TF Hub." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Load the TF Hub model map from json and print a list of the supported models\n", + "tfhub_model_map, models_df = get_model_map(\"tfhub_bert_model_map_classifier.json\", return_data_frame=True)\n", + "models_df.style.hide(axis=\"index\")" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Specify the name of the BERT model to use. This string must match one of the models listed in the table above." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "model_name = \"small_bert/bert_en_uncased_L-2_H-128_A-2\"\n", + "if model_name not in tfhub_model_map.keys():\n", + " raise ValueError(\"The specified model name ({}) is not supported\".format(model_name))" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "# Define a directory to download the dataset\n", + "dataset_directory = os.environ[\"DATASET_DIR\"] if \"DATASET_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"dataset\")\n", + "\n", + "# Define an output directory for the saved model to be exported\n", + "output_directory = os.environ[\"OUTPUT_DIR\"] if \"OUTPUT_DIR\" in os.environ else \\\n", + " os.path.join(os.environ[\"HOME\"], \"output\")\n", + "\n", + "# Output directory for logs and checkpoints generated during training\n", + "if not os.path.isdir(output_directory):\n", + " os.makedirs(output_directory)\n", + " \n", + "tfhub_preprocess = tfhub_model_map[model_name][\"preprocess\"]\n", + "tfhub_bert_encoder = tfhub_model_map[model_name][\"bert_encoder\"]\n", + "\n", + "print(\"Using TF Hub model:\", model_name)\n", + "print(\"BERT encoder URL:\", tfhub_bert_encoder)\n", + "print(\"Preprocessor URL:\", tfhub_preprocess)\n", + "print(\"Dataset directory:\", dataset_directory)\n", + "print(\"Output directory:\", output_directory)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 2. 
+  {
+   "attachments": {},
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 2. Prepare the dataset\n",
+    "\n",
+    "This notebook gets the dataset from a text file or from the [TensorFlow Datasets catalog](https://www.tensorflow.org/datasets/catalog/overview).\n",
+    "\n",
+    "The code defines [`tf.data.Dataset`](https://www.tensorflow.org/api_docs/python/tf/data/Dataset) objects for each split (train, validation, and test) and a map for translating the numerical labels to their string names.\n",
+    "\n",
+    "Execute the following cell to set the batch size and declare the base class used for the dataset setup."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Define the dataset batch size\n",
+    "batch_size = 32\n",
+    "\n",
+    "# Base class used for defining the multiclass text classification dataset being used\n",
+    "class MultiTextClassificationData():\n",
+    "    def __init__(self, batch_size, label_map):\n",
+    "        self.batch_size = batch_size\n",
+    "        self.label_map = label_map\n",
+    "        self.reverse_label_map = {}\n",
+    "        self.train_ds = None\n",
+    "        self.val_ds = None\n",
+    "        self.test_ds = None\n",
+    "        self.dataset_name = \"\"\n",
+    "\n",
+    "        for k, v in self.label_map.items():\n",
+    "            self.reverse_label_map[v] = k\n",
+    "\n",
+    "    def get_str_label(self, numerical_value):\n",
+    "        if not isinstance(numerical_value, int):\n",
+    "            numerical_value = int(tf.math.round(numerical_value))\n",
+    "\n",
+    "        if numerical_value in self.label_map.keys():\n",
+    "            return self.label_map[numerical_value]\n",
+    "        else:\n",
+    "            raise ValueError(\"The key {} was not found in the label map\".format(numerical_value))"
+   ]
+  },
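+  {
+   "attachments": {},
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "To illustrate how the base class behaves, the next cell is a minimal sketch using a hypothetical two-class label map (not one of the datasets used below): it maps a numerical prediction back to its string label and performs the reverse lookup."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Minimal usage sketch with a hypothetical two-class label map\n",
+    "example_data = MultiTextClassificationData(batch_size=32, label_map={0: \"negative\", 1: \"positive\"})\n",
+    "print(example_data.get_str_label(1))  # prints \"positive\"\n",
+    "print(example_data.reverse_label_map[\"negative\"])  # prints 0"
+   ]
+  },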
+  {
+   "attachments": {},
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Option A: Use a TensorFlow dataset\n",
+    "\n",
+    "[TensorFlow Datasets](https://www.tensorflow.org/datasets) has a [catalog of datasets](https://www.tensorflow.org/datasets/catalog/overview) that can be specified by name. Information about each dataset (including its size and splits) is available in the catalog.\n",
+    "\n",
+    "The next cell demonstrates using the [`ag_news_subset`](https://www.tensorflow.org/datasets/catalog/ag_news_subset) dataset from the TensorFlow Datasets catalog to get splits for training, validation, and test."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "class TFDSMultiTextClassificationData(MultiTextClassificationData):\n",
+    "    def __init__(self, dataset_dir, tfds_name, train_split, val_split, test_split, label_map, batch_size):\n",
+    "        \"\"\"\n",
+    "        Initialize the TFDSMultiTextClassificationData class for a multiclass text classification dataset\n",
+    "        from the TensorFlow Datasets catalog.\n",
+    "\n",
+    "        :param dataset_dir: Path to a dataset directory to read/write data\n",
+    "        :param tfds_name: String name of the TensorFlow dataset to load\n",
+    "        :param train_split: String specifying which split to load for training (e.g. \"train[:80%]\").\n",
+    "                            See https://www.tensorflow.org/datasets/splits for more information on\n",
+    "                            defining splits.\n",
+    "        :param val_split: String specifying the split to load for validation.\n",
+    "        :param test_split: String specifying the split to load for test.\n",
+    "        :param label_map: Dictionary where the key is a numerical value and the value is the string label\n",
+    "        :param batch_size: Batch size\n",
+    "        \"\"\"\n",
+    "        # Init base class\n",
+    "        MultiTextClassificationData.__init__(self, batch_size, label_map)\n",
+    "\n",
+    "        [self.train_ds, self.val_ds, self.test_ds], info = tfds.load(tfds_name,\n",
+    "                                                                      data_dir=dataset_dir,\n",
+    "                                                                      split=[train_split, val_split, test_split],\n",
+    "                                                                      batch_size=batch_size,\n",
+    "                                                                      as_supervised=True,\n",
+    "                                                                      shuffle_files=True,\n",
+    "                                                                      with_info=True)\n",
+    "        self.dataset_name = tfds_name\n",
+    "        print(info)\n",
+    "\n",
+    "\n",
+    "# Name of the TFDS to use\n",
+    "tfds_name = \"ag_news_subset\"\n",
+    "\n",
+    "# Location where the dataset will be downloaded\n",
+    "dataset_directory = os.path.join(dataset_directory, tfds_name)\n",
+    "if not os.path.isdir(dataset_directory):\n",
+    "    os.makedirs(dataset_directory)\n",
+    "\n",
+    "# Label map for the AG News topic classes\n",
+    "label_map = {\n",
+    "    0: \"World\",\n",
+    "    1: \"Sports\",\n",
+    "    2: \"Business\",\n",
+    "    3: \"Sci/Tech\"\n",
+    "}\n",
+    "\n",
+    "# Initialize the dataset splits using a dataset from the TensorFlow Datasets catalog.\n",
+    "# Note that the validation split uses a range that does not overlap the training\n",
+    "# split, so the model is not validated on data it was trained on.\n",
+    "dataset = TFDSMultiTextClassificationData(dataset_dir=dataset_directory,\n",
+    "                                          tfds_name=tfds_name,\n",
+    "                                          train_split=\"train[:50%]\",\n",
+    "                                          val_split=\"train[50%:70%]\",\n",
+    "                                          test_split=\"test[:20%]\",\n",
+    "                                          label_map=label_map,\n",
+    "                                          batch_size=batch_size)"
+   ]
+  },
+  {
+   "attachments": {},
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "If you are using the TensorFlow dataset, skip ahead to step [3. Build the model](#3.-Build-the-model)."
+   ]
+  },
+  {
+   "attachments": {},
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Option B: Use your own dataset\n",
+    "\n",
+    "Instead of using a dataset from the TensorFlow Datasets catalog, you can use a dataset from your local system or download one from the web.\n",
+    "\n",
+    "In this example, we download the Conference Title dataset. This is a single tab-separated values (TSV) file with two columns. The first column is the conference title and the second column is the label (VLDB, ISCAS, SIGGRAPH, INFOCOM, WWW):\n",
+    "\n",
+    "```\n",
+    "\t